diff --git a/annotations_filtered/u-2jqTXKQyU_filtered.json b/annotations_filtered/u-2jqTXKQyU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8fee8356651b61603daba1d49e94b7f0ac8b35a --- /dev/null +++ b/annotations_filtered/u-2jqTXKQyU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.7], [7.0, 7.57], [12.0, 13.98], [15.0, 16.61], [19.0, 20.38], [22.0, 22.49], [27.0, 27.57], [29.0, 29.96], [36.0, 36.83], [44.0, 44.51], [45.0, 45.94], [48.0, 48.44], [54.0, 54.87], [62.0, 62.77], [64.0, 64.61], [83.0, 99.84], [101.0, 102.03], [103.0, 104.09], [106.0, 107.2], [110.0, 110.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.44, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.7, 0.57, 1.98, 1.61, 1.38, 0.49, 0.57, 0.96, 0.83, 0.51, 0.94, 0.44, 0.87, 0.77, 0.61, 16.84, 1.03, 1.09, 1.2, 0.37]} \ No newline at end of file diff --git a/annotations_filtered/u-ApxFOpl28_filtered.json b/annotations_filtered/u-ApxFOpl28_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..439c3cfddacd0a5d3f6c61a20b17c4b9a88870c5 --- /dev/null +++ b/annotations_filtered/u-ApxFOpl28_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 41.62], [42.0, 44.37], [45.0, 48.56], [50.0, 58.8]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 31.28, 29.78, 32.1], "audiomae_on_audioset": [null, [["music", 32.65], ["mains hum", 16.54], ["hum", 10.62]], [["speech", 63.14], ["explosion", 6.11], ["eruption", 4.38]], [["mains hum", 48.7], ["hum", 39.79], ["music", 4.65]]], "duration": [37.62, 2.37, 3.56, 8.8]} \ No newline at end of file diff --git a/annotations_filtered/u-BIr0fW5cU_filtered.json b/annotations_filtered/u-BIr0fW5cU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..951e568d91d06a427c366b3da84d87174f73ea21 --- /dev/null +++ b/annotations_filtered/u-BIr0fW5cU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 21.95], [23.0, 26.2], [27.0, 30.86], [32.0, 39.16], [40.0, 50.95], [51.0, 51.02], [52.0, 51.95], [52.0, 56.66], [58.0, 72.79], [77.0, 77.23], [80.0, 81.4], [82.0, 83.42], [85.0, 85.62], [87.0, 87.72], [89.0, 94.88], [100.0, 101.16], [103.0, 106.81], [108.0, 111.25], [116.0, 122.89], [125.0, 128.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false], "silence_prob": [100.0, 100.0, 99.98, 98.51, 84.62, 0.0, 0.0, 38.94, 34.99, 0.0, 0.0, 0.0, 0.0, 0.0, 38.7, 0.0, 34.46, 42.88, 55.67, 75.72], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 73.96], ["musical instrument", 2.79], ["hum", 2.52]], [["music", 60.68], ["synthesizer", 6.87], ["chop", 5.16]], null, null, null, null, null, [["music", 54.19], ["musical instrument", 4.57], ["hum", 3.91]], null, [["speech", 40.49], ["music", 15.34], ["hum", 8.4]], [["music", 46.48], ["hum", 6.28], ["didgeridoo", 5.74]], null, null], "duration": [2.95, 3.2, 3.86, 7.16, 10.95, 0.02, -0.05, 4.66, 14.79, 0.23, 1.4, 1.42, 0.62, 0.72, 5.88, 1.16, 3.81, 3.25, 6.89, 3.61]} \ No newline at end of file diff --git a/annotations_filtered/u-M2Zb_B7BY_filtered.json b/annotations_filtered/u-M2Zb_B7BY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c79f2f8a1617cb9d7903f032c692630828f05492 --- /dev/null +++ b/annotations_filtered/u-M2Zb_B7BY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.62], [22.0, 28.29], [31.0, 31.94], [43.0, 47.61], [52.0, 58.94], [61.0, 61.03], [66.0, 76.52], [77.0, 81.23]], "keep_status": [false, false, false, false, false, false, false, true], "silence_prob": [70.58, 63.42, 0.0, 33.93, 34.86, 0.0, 48.95, 49.45], "audiomae_on_audioset": [null, null, null, [["music", 50.74], ["hum", 14.7], ["mains hum", 6.6]], [["hum", 47.23], ["music", 19.3], ["mains hum", 12.41]], null, [["music", 70.57], ["didgeridoo", 15.75], ["musical instrument", 3.01]], [["music", 21.77], ["hum", 21.63], ["mains hum", 15.53]]], "duration": [3.62, 6.29, 0.94, 4.61, 6.94, 0.03, 10.52, 4.23]} \ No newline at end of file diff --git a/annotations_filtered/u-bWIkGa0QA_filtered.json b/annotations_filtered/u-bWIkGa0QA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f997176b34a50b7343c1926cc48f66c056ec3389 --- /dev/null +++ b/annotations_filtered/u-bWIkGa0QA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.96], [20.0, 23.77], [33.0, 33.37], [34.0, 34.55], [35.0, 36.14], [46.0, 46.23], [59.0, 59.32], [59.0, 59.39], [59.0, 59.43], [59.0, 59.49], [77.0, 80.96], [88.0, 92.37], [101.0, 105.51], [110.0, 111.84], [116.0, 122.25], [123.0, 122.61], [123.0, 123.13]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, true, false, false, true, false, false], "silence_prob": [0.0, 31.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.61, 30.93, 31.56, 0.0, 32.73, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 30.69], ["music", 14.86], ["beatboxing", 7.82]], null, null, null, null, null, null, null, null, [["speech", 36.71], ["noise", 14.62], ["groan", 8.51]], [["speech", 53.76], ["electric shaver, electric razor", 4.65], ["whimper", 4.19]], [["cattle, bovinae", 43.67], ["moo", 32.31], ["speech", 11.13]], null, [["speech", 41.73], ["noise", 12.29], ["radio", 9.51]], null, null], "duration": [1.96, 3.77, 0.37, 0.55, 1.14, 0.23, 0.32, 0.39, 0.43, 0.49, 3.96, 4.37, 4.51, 1.84, 6.25, -0.39, 0.13]} \ No newline at end of file diff --git a/annotations_filtered/u-eTCyG0jpA_filtered.json b/annotations_filtered/u-eTCyG0jpA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0377effd39d23a189c4c16cf06698f33d64224ab --- /dev/null +++ b/annotations_filtered/u-eTCyG0jpA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.58], [16.0, 17.95], [27.0, 27.57], [34.0, 36.48], [37.0, 37.79], [40.0, 49.72], [70.0, 77.72], [82.0, 84.67], [85.0, 88.01], [90.0, 95.5], [98.0, 103.05], [106.0, 114.22], [116.0, 116.01], [126.0, 136.0], [144.0, 150.5], [165.0, 166.78], [169.0, 170.07]], "keep_status": [false, false, false, false, false, true, true, false, true, true, true, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.82, 0.0, 35.54, 29.5, 36.34, 33.77, 29.79, 29.37, 29.07, 0.0, 29.75, 30.05, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 51.76], ["theremin", 27.78], ["cacophony", 2.98]], null, [["music", 28.49], ["fly, housefly", 21.12], ["insect", 7.26]], [["music", 22.03], ["fart", 13.49], ["speech", 12.4]], [["speech", 40.22], ["music", 28.55], ["throbbing", 10.59]], [["music", 37.77], ["hum", 9.76], ["throbbing", 8.43]], [["music", 22.53], ["whack, thwack", 18.31], ["speech", 9.88]], [["speech", 19.04], ["music", 14.61], ["outside, rural or natural", 6.32]], [["livestock, farm animals, working animals", 25.47], ["moo", 21.82], ["cattle, bovinae", 21.65]], null, [["speech", 52.85], ["music", 9.4], ["outside, rural or natural", 3.59]], [["music", 21.33], ["moo", 20.45], ["livestock, farm animals, working animals", 16.94]], null, null], "duration": [0.58, 1.95, 0.57, 2.48, 0.79, 9.72, 7.72, 2.67, 3.01, 5.5, 5.05, 8.22, 0.01, 10.0, 6.5, 1.78, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/u-pvs7gVNHo_filtered.json b/annotations_filtered/u-pvs7gVNHo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dab2c3e47f5a488ed6526cbaf048bc5289a0814a --- /dev/null +++ b/annotations_filtered/u-pvs7gVNHo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.33], [7.0, 40.14], [41.0, 43.02], [43.0, 46.6], [48.0, 48.19], [54.0, 54.87], [56.0, 59.64], [62.0, 62.94], [65.0, 68.52], [69.0, 70.77], [72.0, 71.76], [72.0, 97.6], [98.0, 98.58], [99.0, 110.02], [113.0, 123.9], [126.0, 143.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 62.07, 67.89, 0.0, 0.0, 58.55, 0.0, 91.64, 0.0, 0.0, 42.76, 0.0, 38.33, 28.28, 37.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["hum", 41.02], ["mains hum", 40.73], ["speech", 3.89]], null, [["rumble", 36.86], ["speech", 18.92], ["hum", 17.48]], [["explosion", 21.57], ["music", 11.17], ["hum", 9.69]], [["hum", 32.01], ["throbbing", 16.66], ["speech", 10.28]]], "duration": [0.33, 33.14, 2.02, 3.6, 0.19, 0.87, 3.64, 0.94, 3.52, 1.77, -0.24, 25.6, 0.58, 11.02, 10.9, 17.6]} \ No newline at end of file diff --git a/annotations_filtered/u-z5139CW1I_filtered.json b/annotations_filtered/u-z5139CW1I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e502d192daa56a1a059956358b76badeed05828a --- /dev/null +++ b/annotations_filtered/u-z5139CW1I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.26], [9.0, 11.55], [18.0, 22.49], [27.0, 33.47], [34.0, 36.73], [37.0, 36.95], [37.0, 36.98], [37.0, 37.02], [37.0, 45.91], [47.0, 49.47], [63.0, 73.62], [75.0, 92.37], [93.0, 117.49], [118.0, 117.75]], "keep_status": [false, true, true, false, true, false, false, false, false, true, true, false, false, false], "silence_prob": [49.73, 34.37, 31.65, 32.17, 32.04, 0.0, 0.0, 0.0, 30.85, 31.37, 37.27, 31.65, 91.47, 0.0], "audiomae_on_audioset": [[["fly, housefly", 51.91], ["insect", 23.96], ["mosquito", 13.88]], [["music", 22.27], ["speech", 16.26], ["sonar", 8.91]], [["throbbing", 32.32], ["hum", 28.1], ["mains hum", 7.11]], [["speech", 64.77], ["music", 10.58], ["whack, thwack", 3.99]], [["sidetone", 28.28], ["whack, thwack", 19.62], ["music", 6.65]], null, null, null, [["speech", 68.8], ["music", 4.84], ["sound effect", 2.9]], [["music", 24.1], ["whale vocalization", 21.71], ["synthesizer", 6.56]], [["bee, wasp, etc.", 22.09], ["fly, housefly", 20.42], ["insect", 19.0]], [["fly, housefly", 51.59], ["insect", 18.3], ["mosquito", 14.4]], null, null], "duration": [5.26, 2.55, 4.49, 6.47, 2.73, -0.05, -0.02, 0.02, 8.91, 2.47, 10.62, 17.37, 24.49, -0.25]} \ No newline at end of file diff --git a/annotations_filtered/u0RqfETo2ok_filtered.json b/annotations_filtered/u0RqfETo2ok_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..afccd196d8d2cdcb81e6fdd04060f402adb0eb4c --- /dev/null +++ b/annotations_filtered/u0RqfETo2ok_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.75], [13.0, 13.68], [17.0, 17.22], [19.0, 23.23], [26.0, 26.97], [36.0, 42.11], [44.0, 46.77], [51.0, 51.26], [53.0, 53.6], [59.0, 59.8], [61.0, 61.45], [63.0, 64.47], [67.0, 67.49], [69.0, 69.62], [80.0, 80.82], [90.0, 91.22], [104.0, 106.17], [112.0, 114.32]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 30.13, 0.0, 28.42, 29.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.32, 32.79], "audiomae_on_audioset": [null, null, null, [["speech", 45.76], ["music", 25.83], ["didgeridoo", 4.77]], null, [["speech", 55.85], ["music", 7.03], ["throbbing", 4.83]], [["speech", 49.02], ["crowd", 7.65], ["cheering", 6.03]], null, null, null, null, null, null, null, null, null, [["theremin", 31.45], ["whale vocalization", 20.98], ["music", 15.3]], [["music", 32.63], ["didgeridoo", 5.71], ["gong", 5.69]]], "duration": [1.75, 0.68, 0.22, 4.23, 0.97, 6.11, 2.77, 0.26, 0.6, 0.8, 0.45, 1.47, 0.49, 0.62, 0.82, 1.22, 2.17, 2.32]} \ No newline at end of file diff --git a/annotations_filtered/u0fi902X3qo_filtered.json b/annotations_filtered/u0fi902X3qo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cfffa83bb1f7282a8064b47c87f55c219019094b --- /dev/null +++ b/annotations_filtered/u0fi902X3qo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.16], [16.0, 16.85], [18.0, 20.75], [22.0, 22.62], [24.0, 35.77], [37.0, 38.47], [39.0, 40.22], [41.0, 47.22], [48.0, 63.96], [65.0, 77.89], [79.0, 83.98], [85.0, 86.51], [88.0, 89.68], [90.0, 92.53], [94.0, 94.32], [99.0, 101.82], [103.0, 137.13], [139.0, 141.32], [142.0, 144.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.94, 0.0, 99.93, 0.0, 0.0, 99.97, 96.54, 72.6, 66.76, 0.0, 0.0, 60.05, 0.0, 60.98, 0.0, 78.04, 91.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 0.85, 2.75, 0.62, 11.77, 1.47, 1.22, 6.22, 15.96, 12.89, 4.98, 1.51, 1.68, 2.53, 0.32, 2.82, 34.13, 2.32, 2.31]} \ No newline at end of file diff --git a/annotations_filtered/u0kF24ceZMI_filtered.json b/annotations_filtered/u0kF24ceZMI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12d701616616013e1880bbccda7a1eccf4a5c851 --- /dev/null +++ b/annotations_filtered/u0kF24ceZMI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.04], [13.0, 13.73], [20.0, 25.49], [27.0, 33.99], [47.0, 51.39], [52.0, 53.72], [55.0, 55.29], [57.0, 57.79], [59.0, 59.81], [61.0, 61.53], [64.0, 64.72], [69.0, 69.62], [78.0, 78.17], [82.0, 83.05], [84.0, 83.88]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.94, 0.0, 32.01, 31.14, 31.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 61.36], ["speech", 5.02], ["crowd", 5.01]], null, [["music", 52.35], ["crowd", 9.85], ["speech", 7.67]], [["moo", 29.14], ["music", 20.63], ["cattle, bovinae", 20.47]], [["music", 67.7], ["speech", 3.51], ["crowd", 2.66]], null, null, null, null, null, null, null, null, null, null], "duration": [3.04, 0.73, 5.49, 6.99, 4.39, 1.72, 0.29, 0.79, 0.81, 0.53, 0.72, 0.62, 0.17, 1.05, -0.12]} \ No newline at end of file diff --git a/annotations_filtered/u0ttQ8Dn7LM_filtered.json b/annotations_filtered/u0ttQ8Dn7LM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec0019e6ece553614eac27718e86bd097a5325b8 --- /dev/null +++ b/annotations_filtered/u0ttQ8Dn7LM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 15.36], [16.0, 17.22], [20.0, 20.19], [21.0, 21.93], [24.0, 24.09], [24.0, 31.68], [33.0, 42.16], [47.0, 46.87], [47.0, 52.57], [55.0, 68.96], [72.0, 74.65], [76.0, 80.03], [83.0, 83.71], [87.0, 89.41], [91.0, 93.09], [94.0, 96.5], [99.0, 100.08], [102.0, 103.1], [105.0, 107.49], [108.0, 110.13], [112.0, 113.31], [116.0, 117.85], [119.0, 120.77], [122.0, 130.28], [131.0, 139.6], [142.0, 151.5], [152.0, 154.92], [160.0, 162.33], [163.0, 164.4], [165.0, 165.52], [168.0, 168.51], [170.0, 170.75], [171.0, 171.8], [173.0, 173.01], [177.0, 177.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.84, 0.0, 0.0, 0.0, 0.0, 100.0, 99.99, 0.0, 100.0, 99.94, 100.0, 100.0, 0.0, 100.0, 100.0, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.36, 1.22, 0.19, 0.93, 0.09, 7.68, 9.16, -0.13, 5.57, 13.96, 2.65, 4.03, 0.71, 2.41, 2.09, 2.5, 1.08, 1.1, 2.49, 2.13, 1.31, 1.85, 1.77, 8.28, 8.6, 9.5, 2.92, 2.33, 1.4, 0.52, 0.51, 0.75, 0.8, 0.01, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/u0wNMcfOIXM_filtered.json b/annotations_filtered/u0wNMcfOIXM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fcaca3850dd0fab8c7b9c3a49a5947cecfd9a411 --- /dev/null +++ b/annotations_filtered/u0wNMcfOIXM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 14.25], [16.0, 16.33], [18.0, 18.42], [25.0, 24.63], [28.0, 27.85], [29.0, 30.15], [34.0, 34.08], [37.0, 39.61], [42.0, 47.34], [48.0, 48.46], [49.0, 57.7], [59.0, 60.15], [61.0, 61.5], [67.0, 68.49], [69.0, 73.2], [76.0, 77.87], [81.0, 82.44], [84.0, 87.39]], "keep_status": [true, false, false, false, false, false, false, true, true, false, true, false, false, false, false, false, false, true], "silence_prob": [40.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.02, 34.77, 0.0, 37.43, 0.0, 0.0, 0.0, 36.77, 0.0, 0.0, 31.15], "audiomae_on_audioset": [[["music", 29.79], ["clip-clop", 11.99], ["horse", 9.65]], null, null, null, null, null, null, [["music", 35.07], ["coin (dropping)", 6.91], ["radio", 3.53]], [["music", 55.15], ["synthesizer", 5.76], ["effects unit", 4.94]], null, [["music", 36.39], ["echo", 15.64], ["effects unit", 8.86]], null, null, null, [["music", 49.13], ["throbbing", 12.15], ["hum", 8.81]], null, null, [["fart", 46.21], ["whir", 4.91], ["effects unit", 3.14]]], "duration": [8.25, 0.33, 0.42, -0.37, -0.15, 1.15, 0.08, 2.61, 5.34, 0.46, 8.7, 1.15, 0.5, 1.49, 4.2, 1.87, 1.44, 3.39]} \ No newline at end of file diff --git a/annotations_filtered/u17vCX9koaI_filtered.json b/annotations_filtered/u17vCX9koaI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc6c6452f278ed18332a660be37354b355fd820d --- /dev/null +++ b/annotations_filtered/u17vCX9koaI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.59], [9.0, 9.26], [15.0, 15.25]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.59, 0.26, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/u1MRGbWEI9M_filtered.json b/annotations_filtered/u1MRGbWEI9M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b3f7cd51b88eda055f0a684893fd088cc488cc3 --- /dev/null +++ b/annotations_filtered/u1MRGbWEI9M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.76], [11.0, 20.09], [21.0, 22.5], [23.0, 24.16], [25.0, 25.64], [27.0, 29.2], [30.0, 31.19], [33.0, 37.0], [38.0, 40.29], [41.0, 81.24], [83.0, 119.58], [120.0, 120.63]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [76.37, 98.99, 0.0, 0.0, 0.0, 99.99, 0.0, 82.07, 45.05, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 49.66], ["burping, eructation", 11.09], ["wail, moan", 6.49]], null, null, null], "duration": [3.76, 9.09, 1.5, 1.16, 0.64, 2.2, 1.19, 4.0, 2.29, 40.24, 36.58, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/u1Pgftn5H94_filtered.json b/annotations_filtered/u1Pgftn5H94_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0195920022cfd27933c32f1d33fc9a82ab540414 --- /dev/null +++ b/annotations_filtered/u1Pgftn5H94_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.95], [17.0, 19.18], [25.0, 25.34], [31.0, 46.5], [49.0, 53.91], [62.0, 62.68], [64.0, 68.34], [71.0, 75.51], [86.0, 87.02], [88.0, 88.97], [96.0, 96.77], [97.0, 111.92], [115.0, 119.99], [121.0, 121.44], [122.0, 128.11], [130.0, 131.5], [140.0, 141.0], [149.0, 151.7], [157.0, 156.76]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, true, true, false, true, false, false, true, false], "silence_prob": [0.0, 99.84, 0.0, 44.2, 47.01, 0.0, 57.25, 30.54, 0.0, 0.0, 0.0, 32.42, 35.95, 0.0, 37.51, 0.0, 0.0, 32.42, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 49.43], ["speech", 15.9], ["outside, rural or natural", 2.28]], [["music", 37.96], ["hum", 12.44], ["throbbing", 9.18]], null, null, [["speech", 67.55], ["hum", 7.26], ["rumble", 4.96]], null, null, null, [["music", 26.36], ["speech", 19.75], ["honk", 13.4]], [["music", 45.37], ["speech", 17.13], ["musical instrument", 4.29]], null, [["music", 58.19], ["double bass", 5.6], ["cello", 4.1]], null, null, [["music", 44.64], ["fart", 9.63], ["fly, housefly", 5.25]], null], "duration": [0.95, 2.18, 0.34, 15.5, 4.91, 0.68, 4.34, 4.51, 1.02, 0.97, 0.77, 14.92, 4.99, 0.44, 6.11, 1.5, 1.0, 2.7, -0.24]} \ No newline at end of file diff --git a/annotations_filtered/u1QIbENq66w_filtered.json b/annotations_filtered/u1QIbENq66w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c0b783af41fe22b0c4232da04391e9f852141c83 --- /dev/null +++ b/annotations_filtered/u1QIbENq66w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[68.0, 75.15], [75.0, 76.6], [79.0, 97.83]], "keep_status": [false, false, true], "silence_prob": [33.02, 0.0, 31.66], "audiomae_on_audioset": [[["boing", 78.03], ["music", 8.06], ["fly, housefly", 2.27]], null, [["boing", 46.23], ["music", 15.22], ["frog", 6.09]]], "duration": [7.15, 1.6, 18.83]} \ No newline at end of file diff --git a/annotations_filtered/u1pJJOaKdiQ_filtered.json b/annotations_filtered/u1pJJOaKdiQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51c0e6f9ef30756c10a988407a0446dff2eafd82 --- /dev/null +++ b/annotations_filtered/u1pJJOaKdiQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 21.93], [23.0, 23.72], [24.0, 25.15], [28.0, 29.61], [31.0, 32.27], [33.0, 34.15], [43.0, 43.06], [51.0, 53.65], [55.0, 57.52], [58.0, 58.82], [60.0, 61.11], [62.0, 63.37], [64.0, 65.79], [66.0, 66.88], [67.0, 68.55], [69.0, 70.29], [71.0, 72.05], [74.0, 83.81], [90.0, 91.77], [95.0, 97.63], [100.0, 101.26], [102.0, 102.49], [103.0, 104.11], [106.0, 106.34], [108.0, 109.24], [111.0, 110.73], [118.0, 118.4], [120.0, 119.94], [121.0, 120.77], [122.0, 125.46], [126.0, 125.73], [127.0, 127.43], [128.0, 131.5], [134.0, 134.97], [139.0, 139.4], [140.0, 140.41], [142.0, 143.46], [145.0, 145.42], [147.0, 148.47], [150.0, 150.38], [151.0, 151.43]], "keep_status": [true, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.16, 43.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.31, 0.0, 60.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.92, 0.0, 0.0, 58.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 20.37], ["radio", 18.24], ["horse", 4.48]], null, null, null, null, null, null, [["speech", 37.34], ["radio", 6.11], ["creak", 4.72]], [["frog", 17.3], ["whack, thwack", 13.75], ["radio", 6.29]], null, null, null, null, null, null, null, null, [["insect", 19.98], ["fly, housefly", 16.41], ["radio", 13.11]], null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 13.68], ["insect", 6.24], ["animal", 6.2]], null, null, null, null, null, null, null, null, null, null, null], "duration": [2.93, 0.72, 1.15, 1.61, 1.27, 1.15, 0.06, 2.65, 2.52, 0.82, 1.11, 1.37, 1.79, 0.88, 1.55, 1.29, 1.05, 9.81, 1.77, 2.63, 1.26, 0.49, 1.11, 0.34, 1.24, -0.27, 0.4, -0.06, -0.23, 3.46, -0.27, 0.43, 3.5, 0.97, 0.4, 0.41, 1.46, 0.42, 1.47, 0.38, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/u2107BTcDbs_filtered.json b/annotations_filtered/u2107BTcDbs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ad957abb429978fecbcda707e2b7f67fce45940 --- /dev/null +++ b/annotations_filtered/u2107BTcDbs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 39.18], [40.0, 40.96], [43.0, 43.01], [44.0, 44.78], [46.0, 62.8], [69.0, 71.47], [74.0, 91.32], [92.0, 92.4], [94.0, 94.66], [97.0, 97.26], [104.0, 105.12], [112.0, 113.53], [115.0, 116.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [78.38, 0.0, 0.0, 0.0, 57.17, 75.72, 49.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 73.47], ["speech", 8.23], ["music for children", 1.84]], null, null, null, null, null, null], "duration": [2.18, 0.96, 0.01, 0.78, 16.8, 2.47, 17.32, 0.4, 0.66, 0.26, 1.12, 1.53, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/u2D0kDFKaxE_filtered.json b/annotations_filtered/u2D0kDFKaxE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e633ca51214dc830da8488424fb0eac7124d6a9b --- /dev/null +++ b/annotations_filtered/u2D0kDFKaxE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.28], [10.0, 10.94], [13.0, 14.76], [17.0, 17.98], [24.0, 24.73], [34.0, 35.26], [36.0, 37.62], [39.0, 50.19], [60.0, 60.93], [98.0, 100.8], [101.0, 100.84], [101.0, 100.87], [112.0, 118.44], [125.0, 131.62], [140.0, 140.8], [151.0, 150.7], [151.0, 153.99], [159.0, 165.75], [170.0, 175.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.01, 0.0, 31.1, 0.0, 0.0, 31.34, 30.45, 0.0, 0.0, 29.95, 30.32, 30.94], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 53.16], ["didgeridoo", 15.84], ["synthesizer", 9.19]], null, null, [["music", 79.88], ["electronic music", 3.96], ["synthesizer", 3.7]], [["music", 53.99], ["throbbing", 7.97], ["hum", 7.67]], null, null, [["speech", 30.94], ["mains hum", 17.39], ["hum", 15.32]], [["music", 67.13], ["trance music", 11.16], ["electronic music", 7.88]], [["music", 66.18], ["synthesizer", 8.23], ["electronic music", 6.18]]], "duration": [1.28, 0.94, 1.76, 0.98, 0.73, 1.26, 1.62, 11.19, 0.93, 2.8, -0.16, -0.13, 6.44, 6.62, 0.8, -0.3, 2.99, 6.75, 5.39]} \ No newline at end of file diff --git a/annotations_filtered/u2pu0m9iTo4_filtered.json b/annotations_filtered/u2pu0m9iTo4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36bf91d1726c446c6f8e0bb4bf79a2daf780a024 --- /dev/null +++ b/annotations_filtered/u2pu0m9iTo4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 43.21], [45.0, 48.93], [50.0, 52.79], [54.0, 54.92], [56.0, 57.7], [59.0, 62.21], [64.0, 64.42], [66.0, 66.53], [67.0, 68.25], [69.0, 76.84], [77.0, 78.22], [84.0, 107.45], [109.0, 108.89], [109.0, 109.17], [110.0, 110.17], [110.0, 113.19]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, true], "silence_prob": [0.0, 49.31, 37.41, 0.0, 0.0, 30.14, 0.0, 0.0, 0.0, 33.53, 0.0, 36.21, 0.0, 0.0, 0.0, 31.3], "audiomae_on_audioset": [null, [["music", 76.12], ["didgeridoo", 3.63], ["musical instrument", 2.05]], [["cattle, bovinae", 32.25], ["moo", 25.43], ["music", 13.31]], null, null, [["music", 28.9], ["speech", 12.82], ["foghorn", 10.52]], null, null, null, [["wail, moan", 42.1], ["speech", 7.7], ["grunt", 4.76]], null, [["music", 38.72], ["fly, housefly", 19.53], ["insect", 7.59]], null, null, null, [["music", 48.27], ["theremin", 12.84], ["musical instrument", 7.46]]], "duration": [1.21, 3.93, 2.79, 0.92, 1.7, 3.21, 0.42, 0.53, 1.25, 7.84, 1.22, 23.45, -0.11, 0.17, 0.17, 3.19]} \ No newline at end of file diff --git a/annotations_filtered/u3UyGrnv1-A_filtered.json b/annotations_filtered/u3UyGrnv1-A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a2f63544cadcaea4d318eedb42c879430d3fa4e --- /dev/null +++ b/annotations_filtered/u3UyGrnv1-A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.67], [10.0, 9.76], [11.0, 12.26], [14.0, 13.64], [18.0, 18.81], [19.0, 20.56], [26.0, 26.33], [28.0, 28.71], [34.0, 39.34], [42.0, 42.69], [46.0, 45.91], [52.0, 60.0], [60.0, 67.07], [67.0, 69.15], [70.0, 71.76], [73.0, 73.3], [76.0, 78.09], [80.0, 80.76], [84.0, 89.11], [93.0, 95.23], [98.0, 98.29], [101.0, 105.6], [108.0, 111.27], [116.0, 116.5], [117.0, 117.68], [121.0, 121.54], [122.0, 122.15], [126.0, 131.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.49, 0.0, 0.0, 57.01, 88.46, 60.42, 0.0, 0.0, 40.02, 0.0, 43.61, 43.53, 0.0, 36.41, 37.93, 0.0, 0.0, 0.0, 0.0, 29.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 65.42], ["speech", 5.57], ["musical instrument", 4.25]], null, null, null, null, null, null, null, [["speech", 58.65], ["glass", 3.97], ["dishes, pots, and pans", 3.96]], null, [["speech", 73.07], ["fart", 3.93], ["music", 2.42]], [["music", 24.47], ["thunk", 10.77], ["fart", 7.74]], null, [["thunk", 52.9], ["whack, thwack", 8.02], ["breaking", 4.6]], [["livestock, farm animals, working animals", 10.33], ["music", 9.51], ["moo", 5.55]], null, null, null, null, [["machine gun", 76.57], ["speech", 9.89], ["gunshot, gunfire", 5.9]]], "duration": [-0.33, -0.24, 1.26, -0.36, 0.81, 1.56, 0.33, 0.71, 5.34, 0.69, -0.09, 8.0, 7.07, 2.15, 1.76, 0.3, 2.09, 0.76, 5.11, 2.23, 0.29, 4.6, 3.27, 0.5, 0.68, 0.54, 0.15, 5.94]} \ No newline at end of file diff --git a/annotations_filtered/u3XXKF0oDtU_filtered.json b/annotations_filtered/u3XXKF0oDtU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17d7c788b9a867541883a043b26a5d0bbd6d139e --- /dev/null +++ b/annotations_filtered/u3XXKF0oDtU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.15], [4.0, 5.17], [8.0, 11.03], [13.0, 13.2], [17.0, 19.36], [23.0, 23.4], [25.0, 48.61], [50.0, 50.38], [52.0, 68.4], [74.0, 93.51], [95.0, 103.17], [103.0, 105.16], [106.0, 123.65], [124.0, 130.0], [132.0, 135.9], [138.0, 139.9], [142.0, 143.8], [145.0, 149.34]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 49.22, 0.0, 68.02, 0.0, 72.9, 0.0, 37.15, 36.92, 35.22, 33.32, 30.15, 31.91, 30.87, 0.0, 0.0, 35.73], "audiomae_on_audioset": [null, null, [["speech", 26.68], ["music", 25.2], ["hum", 3.8]], null, null, null, null, null, [["music", 61.26], ["theremin", 18.82], ["speech", 7.23]], [["music", 90.87], ["throbbing", 1.74], ["electronic music", 0.84]], [["music", 33.04], ["theremin", 28.57], ["synthesizer", 5.36]], [["music", 33.0], ["quack", 32.62], ["duck", 4.57]], [["music", 32.08], ["sound effect", 7.35], ["whoosh, swoosh, swish", 5.62]], [["speech", 61.12], ["music", 13.34], ["didgeridoo", 2.16]], [["music", 51.29], ["explosion", 15.63], ["burst, pop", 3.54]], null, null, [["mains hum", 33.4], ["hum", 22.33], ["speech", 12.67]]], "duration": [0.15, 1.17, 3.03, 0.2, 2.36, 0.4, 23.61, 0.38, 16.4, 19.51, 8.17, 2.16, 17.65, 6.0, 3.9, 1.9, 1.8, 4.34]} \ No newline at end of file diff --git a/annotations_filtered/u3_3EUKbY00_filtered.json b/annotations_filtered/u3_3EUKbY00_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2cba9f9aeb12eaa7c64a083ad961a949fac53c16 --- /dev/null +++ b/annotations_filtered/u3_3EUKbY00_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.62], [6.0, 6.59], [8.0, 10.52], [28.0, 29.51], [38.0, 39.88], [42.0, 48.79], [49.0, 50.6], [51.0, 61.43], [62.0, 63.17], [65.0, 67.86], [68.0, 70.75], [71.0, 84.89], [86.0, 89.26], [93.0, 93.51], [96.0, 101.46], [103.0, 104.68], [107.0, 115.08], [117.0, 117.63], [120.0, 121.42], [123.0, 125.81], [127.0, 128.16], [130.0, 129.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.71, 0.0, 0.0, 93.29, 0.0, 99.44, 0.0, 99.73, 94.37, 99.44, 97.92, 0.0, 98.44, 0.0, 94.95, 0.0, 0.0, 99.93, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 0.59, 2.52, 1.51, 1.88, 6.79, 1.6, 10.43, 1.17, 2.86, 2.75, 13.89, 3.26, 0.51, 5.46, 1.68, 8.08, 0.63, 1.42, 2.81, 1.16, -0.09]} \ No newline at end of file diff --git a/annotations_filtered/u3mupIlFIYQ_filtered.json b/annotations_filtered/u3mupIlFIYQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..205ac0f7a8501379285c60e01230c2504d2c6462 --- /dev/null +++ b/annotations_filtered/u3mupIlFIYQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.45], [4.0, 5.17], [6.0, 7.28], [8.0, 9.34], [10.0, 25.83], [26.0, 28.0], [29.0, 30.33], [31.0, 32.85], [35.0, 38.89], [42.0, 42.13], [43.0, 44.81], [45.0, 46.14], [47.0, 83.32], [84.0, 144.93], [146.0, 147.66], [149.0, 152.59], [153.0, 153.89], [154.0, 159.65], [161.0, 160.76], [162.0, 163.04], [166.0, 166.87], [172.0, 173.42], [175.0, 176.47], [178.0, 177.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 57.09, 35.78, 0.0, 0.0, 99.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.22, 0.0, 45.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 71.12], ["sidetone", 6.72], ["busy signal", 5.23]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.16], ["whack, thwack", 11.26], ["crushing", 9.61]], null, null, null, null, null, null], "duration": [0.45, 1.17, 1.28, 1.34, 15.83, 2.0, 1.33, 1.85, 3.89, 0.13, 1.81, 1.14, 36.32, 60.93, 1.66, 3.59, 0.89, 5.65, -0.24, 1.04, 0.87, 1.42, 1.47, -0.21]} \ No newline at end of file diff --git a/annotations_filtered/u3oi4L5tWQg_filtered.json b/annotations_filtered/u3oi4L5tWQg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b196a7099123c22fe3ea0a17aa2a73e6a2dc66fc --- /dev/null +++ b/annotations_filtered/u3oi4L5tWQg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 48.39], [49.0, 52.35], [53.0, 55.29], [57.0, 58.56], [61.0, 62.11], [64.0, 64.72], [65.0, 65.92], [68.0, 68.82], [78.0, 78.54], [83.0, 84.08], [85.0, 85.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 90.08, 99.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [31.39, 3.35, 2.29, 1.56, 1.11, 0.72, 0.92, 0.82, 0.54, 1.08, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/u3xIs0aajN4_filtered.json b/annotations_filtered/u3xIs0aajN4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6007bb4ec2d7d97e1e78e541823d9d249ec6f80 --- /dev/null +++ b/annotations_filtered/u3xIs0aajN4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.45], [19.0, 22.59], [25.0, 38.79], [40.0, 40.42], [42.0, 45.42], [46.0, 46.26], [48.0, 48.59], [50.0, 54.04], [55.0, 55.61], [63.0, 64.17], [71.0, 74.53], [76.0, 76.67], [85.0, 90.04], [94.0, 95.17], [101.0, 101.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [62.58, 95.91, 91.64, 0.0, 76.53, 0.0, 0.0, 87.19, 0.0, 0.0, 48.35, 0.0, 84.8, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["ping", 11.96], ["music", 8.32], ["synthesizer", 5.47]], null, null, null, null], "duration": [4.45, 3.59, 13.79, 0.42, 3.42, 0.26, 0.59, 4.04, 0.61, 1.17, 3.53, 0.67, 5.04, 1.17, 0.09]} \ No newline at end of file diff --git a/annotations_filtered/u455yxBv35A_filtered.json b/annotations_filtered/u455yxBv35A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f08b241827116ee99070ece328bfd00654b8f0c5 --- /dev/null +++ b/annotations_filtered/u455yxBv35A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.93], [2.0, 6.24], [24.0, 24.56], [26.0, 26.23], [39.0, 43.29], [50.0, 64.25], [68.0, 68.67], [75.0, 75.1], [77.0, 77.58], [78.0, 81.62], [82.0, 92.65], [93.0, 94.19], [101.0, 104.48], [104.0, 104.57], [106.0, 122.61], [124.0, 127.45], [130.0, 137.56], [146.0, 146.75], [149.0, 156.79], [157.0, 158.19], [161.0, 161.92]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 32.28, 0.0, 0.0, 42.98, 33.23, 0.0, 0.0, 0.0, 35.29, 30.43, 0.0, 30.56, 0.0, 31.97, 33.53, 30.58, 0.0, 31.76, 0.0, 0.0], "audiomae_on_audioset": [null, [["throbbing", 35.97], ["music", 26.97], ["hum", 16.15]], null, null, [["music", 46.8], ["speech", 21.33], ["foghorn", 5.68]], [["music", 42.19], ["speech", 15.91], ["musical instrument", 3.02]], null, null, null, [["music", 44.62], ["boing", 20.86], ["theremin", 6.74]], [["music", 76.77], ["sound effect", 2.22], ["hum", 2.0]], null, [["livestock, farm animals, working animals", 40.74], ["cattle, bovinae", 33.28], ["moo", 21.43]], null, [["music", 60.61], ["speech", 11.22], ["buzz", 2.14]], [["music", 45.35], ["theremin", 16.28], ["didgeridoo", 12.37]], [["music", 70.66], ["boing", 2.89], ["cacophony", 2.84]], null, [["music", 25.51], ["speech", 23.47], ["vehicle", 12.48]], null, null], "duration": [0.93, 4.24, 0.56, 0.23, 4.29, 14.25, 0.67, 0.1, 0.58, 3.62, 10.65, 1.19, 3.48, 0.57, 16.61, 3.45, 7.56, 0.75, 7.79, 1.19, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/u4T5X47MKm4_filtered.json b/annotations_filtered/u4T5X47MKm4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89183ad40f8aab739419492a5993b81e90375dab --- /dev/null +++ b/annotations_filtered/u4T5X47MKm4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.98], [13.0, 14.91], [15.0, 38.18], [39.0, 53.22]], "keep_status": [false, false, true, true], "silence_prob": [53.22, 0.0, 33.24, 30.41], "audiomae_on_audioset": [null, null, [["speech", 29.3], ["hum", 22.63], ["mains hum", 17.21]], [["speech", 39.18], ["music", 11.98], ["livestock, farm animals, working animals", 6.12]]], "duration": [6.98, 1.91, 23.18, 14.22]} \ No newline at end of file diff --git a/annotations_filtered/u4T7slD8Mq4_filtered.json b/annotations_filtered/u4T7slD8Mq4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7956dae195576d80fd1dd1338009633c044220b8 --- /dev/null +++ b/annotations_filtered/u4T7slD8Mq4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 51.06], [53.0, 83.0], [85.0, 97.24], [98.0, 105.14], [112.0, 122.05]], "keep_status": [false, true, false, false, false], "silence_prob": [0.0, 30.87, 30.2, 31.99, 35.71], "audiomae_on_audioset": [null, [["music", 50.95], ["speech", 7.71], ["breaking", 6.06]], [["music", 55.61], ["throbbing", 24.32], ["hum", 3.8]], [["music", 70.18], ["speech", 12.42], ["thunk", 1.65]], [["music", 55.17], ["speech", 10.46], ["didgeridoo", 10.04]]], "duration": [48.06, 30.0, 12.24, 7.14, 10.05]} \ No newline at end of file diff --git a/annotations_filtered/u4gz2yNW_Go_filtered.json b/annotations_filtered/u4gz2yNW_Go_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2aebe7b62b62da8c1ffdd4d9c535087a0a4b7c0 --- /dev/null +++ b/annotations_filtered/u4gz2yNW_Go_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 51.56], [52.0, 75.05], [76.0, 88.92], [93.0, 95.27], [97.0, 97.02], [98.0, 99.3], [100.0, 102.66], [104.0, 105.22], [105.0, 107.82], [109.0, 114.24], [118.0, 132.44], [135.0, 140.63], [147.0, 151.38], [152.0, 152.74], [156.0, 163.56], [168.0, 168.27], [176.0, 175.98], [176.0, 176.01]], "keep_status": [true, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [32.44, 31.81, 32.09, 31.36, 0.0, 0.0, 32.5, 0.0, 32.9, 31.6, 30.99, 30.78, 30.62, 0.0, 30.53, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 21.6], ["duck", 14.95], ["quack", 10.51]], [["quack", 46.3], ["music", 18.85], ["animal", 9.53]], [["speech", 37.86], ["music", 26.37], ["fly, housefly", 7.02]], [["livestock, farm animals, working animals", 17.86], ["mosquito", 15.15], ["fly, housefly", 13.81]], null, null, [["music", 71.86], ["musical instrument", 5.42], ["drum", 2.23]], null, [["speech", 34.24], ["music", 23.73], ["fart", 15.55]], [["music", 19.63], ["speech", 13.46], ["fly, housefly", 11.72]], [["cattle, bovinae", 30.83], ["livestock, farm animals, working animals", 26.37], ["moo", 19.11]], [["honk", 42.34], ["goose", 21.57], ["music", 17.53]], [["music", 43.17], ["speech", 30.33], ["whack, thwack", 4.43]], null, [["cattle, bovinae", 53.16], ["moo", 20.71], ["livestock, farm animals, working animals", 18.58]], null, null, null], "duration": [3.56, 23.05, 12.92, 2.27, 0.02, 1.3, 2.66, 1.22, 2.82, 5.24, 14.44, 5.63, 4.38, 0.74, 7.56, 0.27, -0.02, 0.01]} \ No newline at end of file diff --git a/annotations_filtered/u56OqFjs1dg_filtered.json b/annotations_filtered/u56OqFjs1dg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7510932b6eff0573b42df0ceea4822829c822eb --- /dev/null +++ b/annotations_filtered/u56OqFjs1dg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.44], [2.0, 3.99], [5.0, 6.78], [8.0, 9.04], [11.0, 12.31], [14.0, 14.86], [16.0, 17.49], [18.0, 19.13], [20.0, 20.83], [22.0, 23.82], [25.0, 25.44], [28.0, 36.88], [38.0, 39.75], [40.0, 41.91], [43.0, 43.33], [49.0, 51.14], [52.0, 53.05], [54.0, 54.41], [64.0, 69.31], [71.0, 71.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.6, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 35.07, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.31], ["livestock, farm animals, working animals", 9.52], ["goat", 8.83]], null], "duration": [0.44, 1.99, 1.78, 1.04, 1.31, 0.86, 1.49, 1.13, 0.83, 1.82, 0.44, 8.88, 1.75, 1.91, 0.33, 2.14, 1.05, 0.41, 5.31, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/u5hpQ0KeRgY_filtered.json b/annotations_filtered/u5hpQ0KeRgY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73ea6acd83ac0fe9c8445ae0fcff19cb1ae7f2b2 --- /dev/null +++ b/annotations_filtered/u5hpQ0KeRgY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 34.37], [35.0, 35.68], [37.0, 47.88], [49.0, 55.58], [56.0, 57.94], [61.0, 61.72], [62.0, 64.25], [66.0, 67.53], [69.0, 70.01], [74.0, 75.52], [77.0, 77.62], [78.0, 79.47], [89.0, 89.53], [94.0, 94.53], [95.0, 95.0], [96.0, 109.14], [110.0, 117.53], [119.0, 127.2], [128.0, 130.08], [131.0, 131.95], [133.0, 133.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 94.22, 95.78, 0.0, 0.0, 61.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.07, 53.47, 97.33, 97.73, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.37, 0.68, 10.88, 6.58, 1.94, 0.72, 2.25, 1.53, 1.01, 1.52, 0.62, 1.47, 0.53, 0.53, 0.0, 13.14, 7.53, 8.2, 2.08, 0.95, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/u6GTs78NHzQ_filtered.json b/annotations_filtered/u6GTs78NHzQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee7919531c675610097ec8eca6588288ea875d2a --- /dev/null +++ b/annotations_filtered/u6GTs78NHzQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 22.4], [29.0, 29.4], [45.0, 50.03]], "keep_status": [false, false, false], "silence_prob": [29.89, 0.0, 30.13], "audiomae_on_audioset": [[["speech", 45.44], ["music", 35.23], ["hum", 3.9]], null, [["livestock, farm animals, working animals", 71.25], ["cattle, bovinae", 16.12], ["moo", 6.78]]], "duration": [20.4, 0.4, 5.03]} \ No newline at end of file diff --git a/annotations_filtered/u6HHla9ApmI_filtered.json b/annotations_filtered/u6HHla9ApmI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..594308a3a88286c26ca2083b2666b9e5a207e78a --- /dev/null +++ b/annotations_filtered/u6HHla9ApmI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.91], [23.0, 23.21], [23.0, 23.45], [29.0, 30.97], [32.0, 34.35], [36.0, 36.17], [40.0, 42.28], [47.0, 55.39], [61.0, 61.18], [62.0, 65.43], [68.0, 69.03], [79.0, 80.38], [83.0, 83.66], [86.0, 86.8], [87.0, 89.19], [92.0, 93.93], [104.0, 104.82], [110.0, 114.29], [116.0, 117.15], [118.0, 118.2], [124.0, 125.47], [126.0, 127.57], [129.0, 129.25], [137.0, 137.54], [141.0, 141.1], [141.0, 141.15]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.79, 0.0, 30.92, 30.82, 0.0, 30.26, 0.0, 0.0, 0.0, 0.0, 35.64, 0.0, 0.0, 34.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 47.73], ["speech", 23.03], ["boing", 4.98]], null, [["music", 47.2], ["boing", 17.78], ["livestock, farm animals, working animals", 3.69]], [["music", 75.15], ["boing", 5.49], ["speech", 4.9]], null, [["music", 38.51], ["speech", 18.3], ["mosquito", 5.39]], null, null, null, null, [["music", 38.53], ["speech", 25.83], ["boing", 17.83]], null, null, [["speech", 51.31], ["music", 8.1], ["sidetone", 7.08]], null, null, null, null, null, null, null, null], "duration": [1.91, 0.21, 0.45, 1.97, 2.35, 0.17, 2.28, 8.39, 0.18, 3.43, 1.03, 1.38, 0.66, 0.8, 2.19, 1.93, 0.82, 4.29, 1.15, 0.2, 1.47, 1.57, 0.25, 0.54, 0.1, 0.15]} \ No newline at end of file diff --git a/annotations_filtered/u6IAct0ow4c_filtered.json b/annotations_filtered/u6IAct0ow4c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2773f0c27d9fa0d2d05e4fd4482011838cab6b36 --- /dev/null +++ b/annotations_filtered/u6IAct0ow4c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 11.84], [24.0, 24.85], [40.0, 39.97], [42.0, 41.72], [50.0, 51.36], [54.0, 64.94], [67.0, 70.95], [73.0, 75.54], [77.0, 85.13], [89.0, 89.63], [93.0, 95.62], [102.0, 107.6], [115.0, 116.34], [117.0, 119.03], [123.0, 123.63], [130.0, 130.2], [131.0, 131.26], [132.0, 132.36], [133.0, 133.93], [143.0, 144.26]], "keep_status": [false, false, false, false, false, false, true, true, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.97, 28.28, 40.33, 30.51, 0.0, 33.16, 34.93, 0.0, 33.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 31.35], ["speech", 24.0], ["mains hum", 15.3]], [["didgeridoo", 44.8], ["boing", 7.92], ["music", 7.58]], [["speech", 29.74], ["civil defense siren", 19.09], ["singing bowl", 10.71]], [["explosion", 16.81], ["music", 11.81], ["hum", 6.89]], null, [["speech", 75.91], ["music", 12.04], ["inside, large room or hall", 1.45]], [["music", 53.61], ["hum", 11.43], ["ambient music", 6.42]], null, [["hum", 31.0], ["mains hum", 16.94], ["speech", 11.41]], null, null, null, null, null, null], "duration": [-0.16, 0.85, -0.03, -0.28, 1.36, 10.94, 3.95, 2.54, 8.13, 0.63, 2.62, 5.6, 1.34, 2.03, 0.63, 0.2, 0.26, 0.36, 0.93, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/u6W5OFK9jpU_filtered.json b/annotations_filtered/u6W5OFK9jpU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a185a0409a323b633774e560ec2c4ce1f998bd43 --- /dev/null +++ b/annotations_filtered/u6W5OFK9jpU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.02], [13.0, 13.9], [21.0, 21.86], [25.0, 25.62], [45.0, 46.08], [49.0, 52.15], [54.0, 56.05], [60.0, 61.42]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 30.18, 65.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["cattle, bovinae", 32.81], ["moo", 24.02], ["livestock, farm animals, working animals", 18.48]], null, null], "duration": [1.02, 0.9, 0.86, 0.62, 1.08, 3.15, 2.05, 1.42]} \ No newline at end of file diff --git a/annotations_filtered/u73HoUZD7tc_filtered.json b/annotations_filtered/u73HoUZD7tc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e65d9b8cc0a1bae60be18dac67b6df38a0d6b4c1 --- /dev/null +++ b/annotations_filtered/u73HoUZD7tc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.03], [4.0, 5.39], [6.0, 7.5], [9.0, 11.06], [12.0, 13.02], [21.0, 21.09], [28.0, 28.41], [29.0, 28.83], [33.0, 33.03], [35.0, 36.91], [38.0, 38.11], [48.0, 50.16], [59.0, 59.56], [65.0, 66.48], [72.0, 73.87], [77.0, 77.33], [80.0, 82.02], [88.0, 92.28], [94.0, 95.39], [99.0, 99.91], [104.0, 105.54], [107.0, 107.45], [108.0, 108.3], [111.0, 110.73], [112.0, 113.46], [117.0, 117.42], [121.0, 121.74], [124.0, 126.23], [127.0, 127.8], [128.0, 128.73], [131.0, 130.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 99.36, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.27, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.03, 1.39, 1.5, 2.06, 1.02, 0.09, 0.41, -0.17, 0.03, 1.91, 0.11, 2.16, 0.56, 1.48, 1.87, 0.33, 2.02, 4.28, 1.39, 0.91, 1.54, 0.45, 0.3, -0.27, 1.46, 0.42, 0.74, 2.23, 0.8, 0.73, -0.35]} \ No newline at end of file diff --git a/annotations_filtered/u74DpEZeHbg_filtered.json b/annotations_filtered/u74DpEZeHbg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..873bc21467c5d3525e9df1d084347b656336ff85 --- /dev/null +++ b/annotations_filtered/u74DpEZeHbg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.0], [6.0, 7.15], [11.0, 11.31], [13.0, 12.78], [29.0, 29.47], [30.0, 30.38], [31.0, 31.8], [34.0, 34.35], [36.0, 36.39], [38.0, 42.09], [51.0, 50.82], [54.0, 54.72], [63.0, 64.29], [84.0, 84.48], [90.0, 91.05], [92.0, 106.89], [109.0, 110.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.38, 0.0, 0.0, 0.0, 0.0, 0.0, 36.75, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 54.0], ["hum", 11.54], ["music", 4.13]], null], "duration": [1.0, 1.15, 0.31, -0.22, 0.47, 0.38, 0.8, 0.35, 0.39, 4.09, -0.18, 0.72, 1.29, 0.48, 1.05, 14.89, 1.51]} \ No newline at end of file diff --git a/annotations_filtered/u7DV5coBXSA_filtered.json b/annotations_filtered/u7DV5coBXSA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8450da1b303cea1a75f58fd0f093a57e7e566c7e --- /dev/null +++ b/annotations_filtered/u7DV5coBXSA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.54], [11.0, 12.75], [15.0, 15.85], [18.0, 20.34], [21.0, 20.97], [23.0, 22.92], [24.0, 25.03], [31.0, 32.43], [34.0, 39.78], [40.0, 60.24], [61.0, 60.81], [65.0, 75.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 65.79, 0.0, 0.0, 0.0, 0.0, 99.16, 65.2, 0.0, 48.61], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 52.71], ["singing bowl", 21.99], ["chirp tone", 13.24]]], "duration": [-0.46, 1.75, 0.85, 2.34, -0.03, -0.08, 1.03, 1.43, 5.78, 20.24, -0.19, 10.25]} \ No newline at end of file diff --git a/annotations_filtered/u7IXETT9OEQ_filtered.json b/annotations_filtered/u7IXETT9OEQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49e3a86571ab1938f77b7ef456aadb44708364b6 --- /dev/null +++ b/annotations_filtered/u7IXETT9OEQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.86], [8.0, 8.02], [11.0, 11.45], [13.0, 13.47], [17.0, 17.56], [18.0, 19.2], [21.0, 22.35], [26.0, 27.01], [28.0, 30.6], [32.0, 32.58], [33.0, 34.08], [35.0, 40.15], [41.0, 41.94], [45.0, 45.49], [49.0, 50.97], [54.0, 56.86], [60.0, 60.74], [66.0, 66.68], [68.0, 69.15], [71.0, 72.81], [74.0, 78.49], [79.0, 80.22], [81.0, 83.66], [88.0, 89.73], [92.0, 93.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 80.29, 0.0, 0.0, 0.0, 83.34, 0.0, 0.0, 0.0, 0.0, 71.72, 0.0, 58.81, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.86, 0.02, 0.45, 0.47, 0.56, 1.2, 1.35, 1.01, 2.6, 0.58, 1.08, 5.15, 0.94, 0.49, 1.97, 2.86, 0.74, 0.68, 1.15, 1.81, 4.49, 1.22, 2.66, 1.73, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/u7kInn-7hcA_filtered.json b/annotations_filtered/u7kInn-7hcA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6fb55f5d17e83f5b59c2e55e64596fe0301fcc37 --- /dev/null +++ b/annotations_filtered/u7kInn-7hcA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.31], [23.0, 25.66], [27.0, 28.09], [38.0, 38.43], [49.0, 50.01], [51.0, 51.0], [57.0, 61.48], [62.0, 65.4], [66.0, 74.9], [83.0, 84.75], [102.0, 101.97], [103.0, 105.24], [108.0, 108.99], [112.0, 114.67], [115.0, 122.99]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 40.79, 0.0, 0.0, 0.0, 0.0, 33.88, 38.74, 42.33, 0.0, 0.0, 30.56, 0.0, 30.77, 30.15], "audiomae_on_audioset": [null, [["music", 55.37], ["theremin", 18.62], ["mantra", 3.13]], null, null, null, null, [["music", 45.24], ["theremin", 21.53], ["synthesizer", 4.93]], [["music", 54.11], ["theremin", 22.21], ["synthesizer", 2.23]], [["music", 36.22], ["effects unit", 10.95], ["chorus effect", 6.29]], null, null, [["music", 61.77], ["carnatic music", 8.25], ["musical instrument", 3.97]], null, [["music", 73.98], ["didgeridoo", 6.62], ["foghorn", 1.19]], [["music", 57.82], ["theremin", 10.02], ["yodeling", 7.94]]], "duration": [0.31, 2.66, 1.09, 0.43, 1.01, 0.0, 4.48, 3.4, 8.9, 1.75, -0.03, 2.24, 0.99, 2.67, 7.99]} \ No newline at end of file diff --git a/annotations_filtered/u7tSASIBz4Y_filtered.json b/annotations_filtered/u7tSASIBz4Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f525064ae71937ee58a623320c890a31daf1a09 --- /dev/null +++ b/annotations_filtered/u7tSASIBz4Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.09], [13.0, 62.23], [64.0, 64.94], [66.0, 100.01]], "keep_status": [false, false, false, false], "silence_prob": [78.55, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [3.09, 49.23, 0.94, 34.01]} \ No newline at end of file diff --git a/annotations_filtered/u7yQ7qs6Zew_filtered.json b/annotations_filtered/u7yQ7qs6Zew_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4775d4538ab3215b5f906661716ce0790ecf43f --- /dev/null +++ b/annotations_filtered/u7yQ7qs6Zew_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 62.45], [65.0, 67.71], [68.0, 70.14], [71.0, 76.54], [81.0, 82.12], [92.0, 92.3], [98.0, 100.18], [102.0, 102.27], [103.0, 103.6], [105.0, 105.6], [109.0, 111.06], [112.0, 112.41], [116.0, 116.43], [117.0, 118.05], [124.0, 128.16], [128.0, 128.33], [129.0, 130.35], [134.0, 135.11], [139.0, 140.93], [143.0, 146.01], [148.0, 149.03], [150.0, 152.14], [155.0, 157.92], [159.0, 160.46], [162.0, 163.09], [165.0, 166.45], [167.0, 167.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 78.21, 77.36, 69.2, 0.0, 0.0, 77.36, 0.0, 0.0, 0.0, 45.92, 0.0, 0.0, 0.0, 35.91, 0.0, 0.0, 0.0, 0.0, 39.05, 0.0, 47.74, 43.18, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 28.85], ["cattle, bovinae", 9.64], ["theremin", 8.08]], null, null, null, [["music", 42.37], ["speech", 14.72], ["hum", 9.52]], null, null, null, null, [["music", 47.86], ["throbbing", 16.53], ["hum", 5.48]], null, [["music", 31.96], ["hum", 22.75], ["throbbing", 11.16]], [["music", 27.72], ["speech", 23.19], ["throbbing", 10.93]], null, null, null, null], "duration": [50.45, 2.71, 2.14, 5.54, 1.12, 0.3, 2.18, 0.27, 0.6, 0.6, 2.06, 0.41, 0.43, 1.05, 4.16, 0.33, 1.35, 1.11, 1.93, 3.01, 1.03, 2.14, 2.92, 1.46, 1.09, 1.45, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/u83fkqXPIGE_filtered.json b/annotations_filtered/u83fkqXPIGE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71715139c606cb4330a2bd92abcaade5efa2a3eb --- /dev/null +++ b/annotations_filtered/u83fkqXPIGE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.87], [5.0, 4.9], [6.0, 6.51], [8.0, 9.46], [10.0, 11.01], [11.0, 13.04], [16.0, 17.68], [19.0, 19.11], [20.0, 20.07], [21.0, 21.63], [22.0, 22.33], [23.0, 46.6], [48.0, 48.1], [50.0, 50.25], [51.0, 52.59], [55.0, 65.25], [71.0, 84.54], [85.0, 85.01], [92.0, 100.14], [102.0, 103.52], [104.0, 104.26], [105.0, 105.27], [107.0, 107.94], [109.0, 110.02], [112.0, 125.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 71.72, 0.0, 0.0, 0.0, 0.0, 0.0, 36.59, 0.0, 0.0, 0.0, 55.46, 57.17, 0.0, 65.55, 0.0, 0.0, 0.0, 0.0, 0.0, 63.42], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 20.99], ["music", 16.31], ["electric shaver, electric razor", 8.82]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.13, -0.1, 0.51, 1.46, 1.01, 2.04, 1.68, 0.11, 0.07, 0.63, 0.33, 23.6, 0.1, 0.25, 1.59, 10.25, 13.54, 0.01, 8.14, 1.52, 0.26, 0.27, 0.94, 1.02, 13.85]} \ No newline at end of file diff --git a/annotations_filtered/u8QMY9JKlDk_filtered.json b/annotations_filtered/u8QMY9JKlDk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abca1afda70e2dd5ca9726ec7d89c2b67d23af24 --- /dev/null +++ b/annotations_filtered/u8QMY9JKlDk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 42.8], [45.0, 72.74], [73.0, 88.4]], "keep_status": [true, true, false], "silence_prob": [30.99, 30.8, 33.14], "audiomae_on_audioset": [[["speech", 29.64], ["music", 13.11], ["animal", 9.92]], [["noise", 44.52], ["sidetone", 5.56], ["hum", 5.26]], [["music", 46.81], ["buzz", 16.26], ["hum", 9.37]]], "duration": [4.8, 27.74, 15.4]} \ No newline at end of file diff --git a/annotations_filtered/u8TwN5M1fEY_filtered.json b/annotations_filtered/u8TwN5M1fEY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b13094219ef4cfe3c2a9bfe2a0d6bdf97add905 --- /dev/null +++ b/annotations_filtered/u8TwN5M1fEY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.65], [9.0, 9.93], [11.0, 11.6], [12.0, 13.61], [14.0, 16.48], [17.0, 17.64], [22.0, 23.13], [29.0, 29.88], [32.0, 32.39], [34.0, 34.79], [35.0, 36.41], [39.0, 38.97], [42.0, 42.21], [43.0, 43.77], [45.0, 45.79], [47.0, 48.3], [50.0, 51.85], [54.0, 54.68], [56.0, 56.05], [58.0, 58.29], [59.0, 59.95], [62.0, 63.76], [69.0, 69.13], [70.0, 70.38], [72.0, 72.55], [74.0, 74.55], [75.0, 75.51], [76.0, 76.96], [78.0, 80.96], [82.0, 82.27], [84.0, 84.92], [86.0, 88.13], [89.0, 90.9], [91.0, 94.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 86.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.19, 0.0, 0.0, 100.0, 0.0, 74.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.65, 0.93, 0.6, 1.61, 2.48, 0.64, 1.13, 0.88, 0.39, 0.79, 1.41, -0.03, 0.21, 0.77, 0.79, 1.3, 1.85, 0.68, 0.05, 0.29, 0.95, 1.76, 0.13, 0.38, 0.55, 0.55, 0.51, 0.96, 2.96, 0.27, 0.92, 2.13, 1.9, 3.31]} \ No newline at end of file diff --git a/annotations_filtered/u8oHCJ8LxtY_filtered.json b/annotations_filtered/u8oHCJ8LxtY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9371dd4328b4790de46b3f3240e6ca31279bff6b --- /dev/null +++ b/annotations_filtered/u8oHCJ8LxtY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.24], [5.0, 7.5], [9.0, 12.18], [14.0, 20.16], [21.0, 24.76], [26.0, 28.98], [31.0, 33.51], [36.0, 38.77], [41.0, 46.43], [48.0, 58.9]], "keep_status": [false, true, true, true, true, false, false, false, true, false], "silence_prob": [0.0, 32.27, 44.93, 34.32, 41.36, 63.85, 47.82, 59.86, 49.87, 59.07], "audiomae_on_audioset": [null, [["music", 34.15], ["theremin", 5.66], ["hum", 4.63]], [["music", 40.46], ["effects unit", 11.03], ["synthesizer", 5.89]], [["music", 29.07], ["hum", 12.23], ["mains hum", 9.4]], [["music", 37.12], ["speech", 22.39], ["hum", 10.37]], null, [["speech", 54.65], ["music", 17.13], ["sidetone", 3.74]], null, [["music", 34.52], ["hum", 16.4], ["speech", 6.26]], null], "duration": [0.24, 2.5, 3.18, 6.16, 3.76, 2.98, 2.51, 2.77, 5.43, 10.9]} \ No newline at end of file diff --git a/annotations_filtered/u9A2CYMFfNo_filtered.json b/annotations_filtered/u9A2CYMFfNo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9f2b31fab88b841b332896a17cb43ccf0f8d1cb --- /dev/null +++ b/annotations_filtered/u9A2CYMFfNo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.99], [11.0, 14.88], [16.0, 16.75], [18.0, 18.81], [21.0, 30.06], [31.0, 33.94], [35.0, 35.88], [37.0, 38.87], [39.0, 39.93], [41.0, 41.66], [42.0, 42.52], [46.0, 48.66], [51.0, 52.05], [54.0, 54.08], [54.0, 54.46], [55.0, 59.04], [60.0, 68.55], [74.0, 76.84], [78.0, 80.23], [83.0, 84.96], [90.0, 92.47], [96.0, 117.24], [119.0, 119.43], [129.0, 128.88], [131.0, 130.99]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 40.93, 0.0, 0.0, 33.46, 37.88, 0.0, 0.0, 0.0, 0.0, 0.0, 45.82, 0.0, 0.0, 0.0, 35.62, 32.89, 52.16, 44.09, 0.0, 33.97, 38.06, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 55.57], ["speech", 16.04], ["throbbing", 3.5]], null, null, [["music", 39.4], ["musical instrument", 10.32], ["brass instrument", 8.33]], [["croak", 23.46], ["music", 23.39], ["speech", 14.76]], null, null, null, null, null, [["music", 69.91], ["throbbing", 6.28], ["hum", 4.64]], null, null, null, [["music", 58.6], ["speech", 15.81], ["synthesizer", 4.78]], [["music", 58.13], ["speech", 12.35], ["musical instrument", 3.21]], null, [["music", 66.11], ["synthesizer", 5.14], ["speech", 3.94]], null, [["music", 18.17], ["speech", 15.11], ["fart", 4.86]], [["music", 65.63], ["quack", 13.13], ["animal", 4.96]], null, null, null], "duration": [0.99, 3.88, 0.75, 0.81, 9.06, 2.94, 0.88, 1.87, 0.93, 0.66, 0.52, 2.66, 1.05, 0.08, 0.46, 4.04, 8.55, 2.84, 2.23, 1.96, 2.47, 21.24, 0.43, -0.12, -0.01]} \ No newline at end of file diff --git a/annotations_filtered/u9O_Xs8wAZk_filtered.json b/annotations_filtered/u9O_Xs8wAZk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30ebb2b78c757924d91e1bba4a51139331b713c6 --- /dev/null +++ b/annotations_filtered/u9O_Xs8wAZk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 52.1], [56.0, 64.1], [65.0, 71.1], [72.0, 72.44], [73.0, 80.77], [82.0, 156.95], [157.0, 158.35]], "keep_status": [false, true, true, false, false, false, false], "silence_prob": [0.0, 32.89, 31.03, 0.0, 31.93, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 27.79], ["speech", 10.52], ["fart", 8.25]], [["music", 47.93], ["didgeridoo", 11.55], ["musical instrument", 5.96]], null, [["speech", 31.19], ["mains hum", 21.07], ["hum", 18.85]], null, null], "duration": [34.1, 8.1, 6.1, 0.44, 7.77, 74.95, 1.35]} \ No newline at end of file diff --git a/annotations_filtered/u9S41Kplsbs_filtered.json b/annotations_filtered/u9S41Kplsbs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02c4eb407a6dc5053d820750b64f81437236a57d --- /dev/null +++ b/annotations_filtered/u9S41Kplsbs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.51], [7.0, 8.29], [13.0, 16.78], [21.0, 23.9], [26.0, 27.04], [28.0, 28.04], [31.0, 31.77], [34.0, 36.9], [41.0, 42.97], [45.0, 52.12], [54.0, 56.52], [60.0, 60.3], [63.0, 64.3], [65.0, 65.6], [71.0, 71.74], [78.0, 85.62], [86.0, 85.65], [86.0, 87.71], [89.0, 90.96], [92.0, 96.67], [99.0, 100.16], [104.0, 106.88], [112.0, 118.45], [120.0, 125.12], [127.0, 129.34], [130.0, 132.51], [137.0, 138.72], [143.0, 145.32], [148.0, 150.13], [151.0, 152.25], [154.0, 155.73], [159.0, 160.15], [161.0, 163.46], [164.0, 165.55], [168.0, 172.12], [186.0, 187.25], [188.0, 188.43], [190.0, 190.73], [192.0, 193.97], [196.0, 198.51], [201.0, 201.6]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 55.04, 59.07, 0.0, 0.0, 0.0, 84.25, 0.0, 46.15, 46.54, 0.0, 0.0, 0.0, 0.0, 33.31, 0.0, 0.0, 0.0, 34.09, 0.0, 41.2, 35.97, 51.55, 50.81, 30.15, 0.0, 66.03, 76.37, 0.0, 0.0, 0.0, 71.43, 0.0, 71.87, 0.0, 0.0, 0.0, 0.0, 66.39, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["hum", 22.58], ["noise", 12.83], ["effects unit", 5.67]], [["speech", 33.68], ["sidetone", 7.94], ["hum", 5.6]], null, null, null, null, [["speech", 57.24], ["music", 16.37], ["mains hum", 2.79]], null, null, null, [["speech", 30.34], ["music", 18.42], ["hum", 16.35]], null, [["mains hum", 21.7], ["hum", 17.49], ["music", 11.9]], [["music", 40.9], ["didgeridoo", 10.55], ["speech", 9.78]], null, null, [["cattle, bovinae", 31.4], ["moo", 25.31], ["livestock, farm animals, working animals", 20.32]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.51, 1.29, 3.78, 2.9, 1.04, 0.04, 0.77, 2.9, 1.97, 7.12, 2.52, 0.3, 1.3, 0.6, 0.74, 7.62, -0.35, 1.71, 1.96, 4.67, 1.16, 2.88, 6.45, 5.12, 2.34, 2.51, 1.72, 2.32, 2.13, 1.25, 1.73, 1.15, 2.46, 1.55, 4.12, 1.25, 0.43, 0.73, 1.97, 2.51, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/uA1Kloz4Ics_filtered.json b/annotations_filtered/uA1Kloz4Ics_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..195df28ad79041712a21bd0bf40e3c349ea8ac95 --- /dev/null +++ b/annotations_filtered/uA1Kloz4Ics_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.24], [2.0, 2.42], [4.0, 4.83], [6.0, 6.93], [11.0, 12.01], [13.0, 13.69], [16.0, 20.17], [22.0, 22.52], [26.0, 27.9], [29.0, 30.48], [31.0, 31.29], [33.0, 35.63], [36.0, 37.18], [38.0, 40.26], [45.0, 45.0], [45.0, 46.14], [50.0, 54.62], [56.0, 57.86], [60.0, 62.55], [63.0, 64.45], [65.0, 65.99], [69.0, 71.27], [74.0, 74.26], [77.0, 84.25], [95.0, 96.21], [98.0, 98.51], [99.0, 98.73], [103.0, 103.77], [111.0, 112.13], [114.0, 114.29], [115.0, 117.0], [119.0, 119.94], [122.0, 123.31], [124.0, 124.82], [126.0, 126.23], [127.0, 128.65], [129.0, 142.65], [146.0, 146.96], [148.0, 148.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.39, 0.0, 0.0, 0.0, 0.0, 99.93, 0.0, 53.84, 0.0, 0.0, 99.95, 0.0, 100.0, 0.0, 0.0, 96.66, 0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.8, 0.0, 0.0, 0.0, 0.0, 0.0, 82.79, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, 0.42, 0.83, 0.93, 1.01, 0.69, 4.17, 0.52, 1.9, 1.48, 0.29, 2.63, 1.18, 2.26, 0.0, 1.14, 4.62, 1.86, 2.55, 1.45, 0.99, 2.27, 0.26, 7.25, 1.21, 0.51, -0.27, 0.77, 1.13, 0.29, 2.0, 0.94, 1.31, 0.82, 0.23, 1.65, 13.65, 0.96, 0.86]} \ No newline at end of file diff --git a/annotations_filtered/uA7BbE1cF2U_filtered.json b/annotations_filtered/uA7BbE1cF2U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12095b09b3a510da89faab4810ad409bd12bcda7 --- /dev/null +++ b/annotations_filtered/uA7BbE1cF2U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.49], [11.0, 13.04], [16.0, 18.27], [22.0, 21.86], [23.0, 23.41], [25.0, 25.37], [28.0, 28.17], [30.0, 30.0], [38.0, 38.2], [58.0, 76.44], [80.0, 81.28], [87.0, 87.47], [88.0, 89.4], [90.0, 108.73], [109.0, 108.77], [117.0, 126.0], [131.0, 131.8], [138.0, 137.78], [139.0, 143.04], [149.0, 149.71], [151.0, 155.06], [156.0, 161.57], [165.0, 167.17], [168.0, 169.1], [171.0, 174.75], [177.0, 179.19], [182.0, 181.9], [183.0, 183.9], [185.0, 186.68], [189.0, 193.53], [194.0, 195.89], [197.0, 202.73], [203.0, 230.47]], "keep_status": [true, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [29.85, 46.09, 46.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.09, 0.0, 0.0, 0.0, 33.45, 0.0, 35.59, 0.0, 0.0, 32.44, 0.0, 96.42, 34.4, 56.33, 0.0, 57.32, 66.03, 0.0, 0.0, 0.0, 67.89, 0.0, 47.82, 32.31], "audiomae_on_audioset": [[["music", 42.9], ["carnatic music", 11.72], ["sitar", 2.67]], [["speech", 41.38], ["music", 15.52], ["didgeridoo", 4.68]], [["music", 38.2], ["speech", 21.23], ["theremin", 9.28]], null, null, null, null, null, null, [["music", 76.15], ["hum", 3.37], ["didgeridoo", 1.75]], null, null, null, [["music", 41.8], ["theremin", 9.2], ["synthesizer", 6.76]], null, [["speech", 38.75], ["music", 30.98], ["whale vocalization", 6.5]], null, null, [["moo", 31.15], ["cattle, bovinae", 20.19], ["livestock, farm animals, working animals", 18.32]], null, null, [["grunt", 29.28], ["music", 22.43], ["groan", 15.84]], null, null, null, null, null, null, null, null, null, [["music", 29.1], ["hum", 22.51], ["speech", 10.66]], [["music", 44.47], ["buzz", 29.99], ["electric shaver, electric razor", 4.57]]], "duration": [5.49, 2.04, 2.27, -0.14, 0.41, 0.37, 0.17, 0.0, 0.2, 18.44, 1.28, 0.47, 1.4, 18.73, -0.23, 9.0, 0.8, -0.22, 4.04, 0.71, 4.06, 5.57, 2.17, 1.1, 3.75, 2.19, -0.1, 0.9, 1.68, 4.53, 1.89, 5.73, 27.47]} \ No newline at end of file diff --git a/annotations_filtered/uAERYfeiYBc_filtered.json b/annotations_filtered/uAERYfeiYBc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db3d3698723c54d1828ecd4fef07e24c69a6c0e6 --- /dev/null +++ b/annotations_filtered/uAERYfeiYBc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.51], [23.0, 23.82], [25.0, 30.18], [31.0, 32.51], [33.0, 37.4], [46.0, 45.69], [48.0, 48.91], [59.0, 60.12], [61.0, 61.2], [62.0, 62.97], [66.0, 66.6], [68.0, 68.93], [70.0, 70.46], [71.0, 72.33], [73.0, 73.8], [75.0, 75.47], [77.0, 77.62], [82.0, 84.59], [87.0, 88.33], [91.0, 91.62], [94.0, 96.92], [98.0, 98.39], [101.0, 102.95]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 48.35, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.89, 0.0, 0.0, 82.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["thunk", 11.5], ["music", 8.94], ["glass", 7.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.51, 0.82, 5.18, 1.51, 4.4, -0.31, 0.91, 1.12, 0.2, 0.97, 0.6, 0.93, 0.46, 1.33, 0.8, 0.47, 0.62, 2.59, 1.33, 0.62, 2.92, 0.39, 1.95]} \ No newline at end of file diff --git a/annotations_filtered/uAMrR05Xil8_filtered.json b/annotations_filtered/uAMrR05Xil8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..357ea728dcc654ec602cf3d2a5814f273cccca56 --- /dev/null +++ b/annotations_filtered/uAMrR05Xil8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.06], [18.0, 22.28], [23.0, 24.85], [25.0, 27.09], [54.0, 54.18], [63.0, 65.45], [76.0, 76.86], [78.0, 80.32], [81.0, 81.13], [82.0, 83.05], [88.0, 89.41], [94.0, 94.98], [97.0, 98.19], [107.0, 107.82], [109.0, 110.22], [111.0, 111.1], [114.0, 118.83], [121.0, 127.87], [128.0, 128.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 50.26, 0.0, 60.32, 0.0, 64.97, 0.0, 54.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.93, 55.96, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 58.84], ["mosquito", 3.93], ["fly, housefly", 2.93]], null, null], "duration": [0.06, 4.28, 1.85, 2.09, 0.18, 2.45, 0.86, 2.32, 0.13, 1.05, 1.41, 0.98, 1.19, 0.82, 1.22, 0.1, 4.83, 6.87, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/uAS_k95ZRUk_filtered.json b/annotations_filtered/uAS_k95ZRUk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..029d95e1d38e7075c71f535c4b4190ab75507cb3 --- /dev/null +++ b/annotations_filtered/uAS_k95ZRUk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.73], [6.0, 7.96], [13.0, 15.82], [21.0, 20.97], [26.0, 27.26], [31.0, 31.4], [39.0, 39.63], [41.0, 43.16], [45.0, 46.25], [50.0, 50.33], [55.0, 55.48], [59.0, 60.47], [63.0, 63.53]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [52.45, 0.0, 43.35, 0.0, 0.0, 0.0, 0.0, 47.23, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 18.86], ["hum", 18.84], ["whale vocalization", 13.32]], null, null, null, null, [["music", 31.04], ["speech", 10.81], ["synthesizer", 10.26]], null, null, null, null, null], "duration": [3.73, 1.96, 2.82, -0.03, 1.26, 0.4, 0.63, 2.16, 1.25, 0.33, 0.48, 1.47, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/uAgvdtpmXBk_filtered.json b/annotations_filtered/uAgvdtpmXBk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7de87b1ea6f6a9ff5f784b21ce3eb467fbafcc5 --- /dev/null +++ b/annotations_filtered/uAgvdtpmXBk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.26], [12.0, 13.53], [15.0, 15.21], [17.0, 17.41], [21.0, 21.41], [23.0, 23.38], [24.0, 24.68], [27.0, 27.97], [30.0, 30.37], [33.0, 32.76], [36.0, 36.19], [40.0, 40.09], [42.0, 42.77], [46.0, 45.98], [47.0, 48.29], [59.0, 67.61], [69.0, 72.93], [75.0, 78.09], [81.0, 90.32], [91.0, 93.97], [95.0, 95.15], [96.0, 108.55], [110.0, 113.86], [114.0, 114.57], [115.0, 115.77], [117.0, 117.05], [119.0, 120.09]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [41.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.98, 63.53, 83.88, 74.92, 53.59, 0.0, 84.07, 30.37, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 36.62], ["music", 18.25], ["hum", 10.68]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["thunk", 23.15], ["whack, thwack", 12.68], ["crushing", 12.54]], null, null, null, null], "duration": [2.26, 1.53, 0.21, 0.41, 0.41, 0.38, 0.68, 0.97, 0.37, -0.24, 0.19, 0.09, 0.77, -0.02, 1.29, 8.61, 3.93, 3.09, 9.32, 2.97, 0.15, 12.55, 3.86, 0.57, 0.77, 0.05, 1.09]} \ No newline at end of file diff --git a/annotations_filtered/uAjGtAOqMQw_filtered.json b/annotations_filtered/uAjGtAOqMQw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b60b79efe9e355b45a5ce832ca834ee756407d17 --- /dev/null +++ b/annotations_filtered/uAjGtAOqMQw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 43.83], [45.0, 52.03], [56.0, 61.13], [62.0, 62.4], [67.0, 77.77], [78.0, 80.18], [81.0, 83.76], [86.0, 89.51], [92.0, 93.92], [95.0, 95.07], [99.0, 113.88], [117.0, 122.52]], "keep_status": [false, true, true, false, true, false, true, true, false, false, false, true], "silence_prob": [32.37, 29.47, 30.48, 0.0, 29.15, 31.96, 31.67, 30.19, 0.0, 0.0, 29.75, 29.45], "audiomae_on_audioset": [[["music", 36.9], ["crack", 26.07], ["single-lens reflex camera", 10.71]], [["music", 22.0], ["thump, thud", 16.26], ["speech", 11.83]], [["music", 18.13], ["hiccup", 9.92], ["speech", 8.86]], null, [["music", 45.08], ["breaking", 12.23], ["speech", 10.92]], [["music", 58.24], ["didgeridoo", 7.96], ["musical instrument", 4.18]], [["music", 21.14], ["throbbing", 7.99], ["didgeridoo", 6.56]], [["speech", 19.81], ["music", 16.92], ["coin (dropping)", 11.7]], null, null, [["music", 69.23], ["sound effect", 4.91], ["hum", 4.87]], [["music", 31.96], ["mains hum", 7.96], ["hum", 7.07]]], "duration": [7.83, 7.03, 5.13, 0.4, 10.77, 2.18, 2.76, 3.51, 1.92, 0.07, 14.88, 5.52]} \ No newline at end of file diff --git a/annotations_filtered/uAphWDkKWcg_filtered.json b/annotations_filtered/uAphWDkKWcg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb387f53a118049882a21648016da9cfb32ed834 --- /dev/null +++ b/annotations_filtered/uAphWDkKWcg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 42.72], [45.0, 71.69], [73.0, 74.98], [80.0, 80.2], [80.0, 80.99], [82.0, 82.98], [89.0, 93.88], [94.0, 94.71], [97.0, 129.68], [130.0, 133.81], [134.0, 139.31], [143.0, 149.15], [150.0, 151.23], [153.0, 154.4], [156.0, 158.33], [159.0, 160.46], [165.0, 172.52]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.74, 87.0, 0.0, 0.0, 0.0, 0.0, 95.51, 0.0, 0.0, 96.66, 98.27, 95.78, 0.0, 0.0, 92.64, 0.0, 35.07], "audiomae_on_audioset": [[["music", 32.75], ["buzz", 21.27], ["insect", 7.05]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 57.46], ["synthesizer", 20.7], ["electronic music", 3.77]]], "duration": [19.72, 26.69, 1.98, 0.2, 0.99, 0.98, 4.88, 0.71, 32.68, 3.81, 5.31, 6.15, 1.23, 1.4, 2.33, 1.46, 7.52]} \ No newline at end of file diff --git a/annotations_filtered/uAroGB_YCmw_filtered.json b/annotations_filtered/uAroGB_YCmw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d6b4208dfd9f081a5ef5a574026be6a8bf1311d --- /dev/null +++ b/annotations_filtered/uAroGB_YCmw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 27.58], [32.0, 33.39], [34.0, 49.94], [57.0, 56.91], [59.0, 67.76], [69.0, 74.06], [78.0, 87.45], [91.0, 102.03], [103.0, 128.04]], "keep_status": [false, false, true, false, false, true, false, true, true], "silence_prob": [30.06, 0.0, 29.89, 0.0, 30.3, 30.36, 31.54, 30.56, 30.32], "audiomae_on_audioset": [[["music", 59.53], ["speech", 13.39], ["quack", 2.44]], null, [["music", 25.46], ["throbbing", 20.25], ["hum", 15.95]], null, [["speech", 50.49], ["music", 23.41], ["throbbing", 2.86]], [["speech", 40.91], ["music", 18.78], ["throbbing", 7.05]], [["music", 44.19], ["didgeridoo", 23.19], ["musical instrument", 5.68]], [["music", 55.7], ["didgeridoo", 7.14], ["musical instrument", 5.3]], [["music", 47.1], ["animal", 7.03], ["cattle, bovinae", 4.53]]], "duration": [17.58, 1.39, 15.94, -0.09, 8.76, 5.06, 9.45, 11.03, 25.04]} \ No newline at end of file diff --git a/annotations_filtered/uAtcsqDjOr8_filtered.json b/annotations_filtered/uAtcsqDjOr8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..525219d8915f7b92510a18d3cfc64fc1fd81998e --- /dev/null +++ b/annotations_filtered/uAtcsqDjOr8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.33], [5.0, 6.35], [11.0, 12.68], [14.0, 14.17], [17.0, 17.44], [19.0, 22.92], [27.0, 31.55], [34.0, 34.87], [37.0, 42.08], [46.0, 47.09], [48.0, 56.4], [57.0, 63.27], [65.0, 66.43], [67.0, 68.23], [69.0, 71.42], [72.0, 73.43], [75.0, 75.46], [77.0, 77.57], [78.0, 79.86], [80.0, 80.81], [82.0, 83.05], [84.0, 84.27], [85.0, 85.89], [90.0, 92.2], [98.0, 100.31], [101.0, 102.41], [103.0, 109.48], [112.0, 113.34], [114.0, 114.24], [117.0, 117.71], [118.0, 122.88], [128.0, 128.21]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 76.7, 49.78, 0.0, 66.76, 0.0, 99.26, 98.99, 0.0, 0.0, 99.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.62, 86.64, 0.0, 99.85, 0.0, 0.0, 0.0, 97.73, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 39.76], ["fly, housefly", 17.12], ["sidetone", 8.08]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.33, 1.35, 1.68, 0.17, 0.44, 3.92, 4.55, 0.87, 5.08, 1.09, 8.4, 6.27, 1.43, 1.23, 2.42, 1.43, 0.46, 0.57, 1.86, 0.81, 1.05, 0.27, 0.89, 2.2, 2.31, 1.41, 6.48, 1.34, 0.24, 0.71, 4.88, 0.21]} \ No newline at end of file diff --git a/annotations_filtered/uB-53DTWD3k_filtered.json b/annotations_filtered/uB-53DTWD3k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25b14a5d1b1440d1409e4ea0d6921496b801b01d --- /dev/null +++ b/annotations_filtered/uB-53DTWD3k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.7], [5.0, 15.53], [16.0, 22.87], [23.0, 23.41], [24.0, 27.33], [29.0, 51.58], [53.0, 57.84], [59.0, 66.23], [67.0, 78.27], [80.0, 80.62]], "keep_status": [false, true, false, false, true, false, true, true, true, false], "silence_prob": [0.0, 30.13, 28.56, 0.0, 30.25, 30.54, 38.6, 28.86, 29.1, 0.0], "audiomae_on_audioset": [null, [["buzz", 49.63], ["speech", 13.05], ["vehicle", 3.36]], [["speech", 59.96], ["vehicle", 8.44], ["boat, water vehicle", 6.81]], null, [["mains hum", 29.05], ["music", 20.94], ["hum", 17.09]], [["speech", 44.63], ["music", 26.94], ["mains hum", 9.99]], [["hum", 22.36], ["music", 16.8], ["mains hum", 16.2]], [["speech", 31.42], ["hum", 14.56], ["mains hum", 14.53]], [["speech", 33.49], ["vehicle", 16.86], ["boat, water vehicle", 7.45]], null], "duration": [0.7, 10.53, 6.87, 0.41, 3.33, 22.58, 4.84, 7.23, 11.27, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/uB2eggtlTfE_filtered.json b/annotations_filtered/uB2eggtlTfE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8e99105b6f7077cb7122c6c969063147a9492b3 --- /dev/null +++ b/annotations_filtered/uB2eggtlTfE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.81], [4.0, 5.14], [8.0, 7.92], [11.0, 12.55], [15.0, 16.65], [20.0, 20.48], [22.0, 22.71], [28.0, 30.32], [34.0, 35.21], [39.0, 38.82], [42.0, 42.52], [43.0, 44.02], [45.0, 46.45], [47.0, 48.51], [49.0, 50.16], [54.0, 54.92], [57.0, 57.87], [60.0, 61.1], [62.0, 62.4], [64.0, 64.83], [65.0, 65.7], [70.0, 70.48], [76.0, 77.19], [80.0, 81.13], [85.0, 86.44], [88.0, 89.53], [91.0, 93.8], [95.0, 97.44], [98.0, 99.87], [101.0, 101.85], [107.0, 109.58], [112.0, 114.1], [116.0, 117.24], [118.0, 119.65], [121.0, 122.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.39, 44.72, 0.0, 0.0, 62.68, 54.3, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 86.82], ["music", 3.08], ["radio", 1.14]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 13.59], ["music", 9.86], ["throbbing", 5.61]], null, null, null, null, null, null, null], "duration": [0.81, 1.14, -0.08, 1.55, 1.65, 0.48, 0.71, 2.32, 1.21, -0.18, 0.52, 1.02, 1.45, 1.51, 1.16, 0.92, 0.87, 1.1, 0.4, 0.83, 0.7, 0.48, 1.19, 1.13, 1.44, 1.53, 2.8, 2.44, 1.87, 0.85, 2.58, 2.1, 1.24, 1.65, 1.37]} \ No newline at end of file diff --git a/annotations_filtered/uB6JMgU50J0_filtered.json b/annotations_filtered/uB6JMgU50J0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..881c3f4df3417b6986e726dc5994907f75e120fe --- /dev/null +++ b/annotations_filtered/uB6JMgU50J0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 29.56], [31.0, 31.56], [32.0, 37.05], [39.0, 46.18], [49.0, 51.48], [53.0, 56.08], [74.0, 74.82], [75.0, 86.44], [90.0, 142.87], [143.0, 145.74], [146.0, 154.16], [155.0, 155.49]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [34.3, 0.0, 37.52, 34.45, 31.55, 33.0, 0.0, 38.86, 0.0, 43.77, 36.39, 0.0], "audiomae_on_audioset": [[["music", 57.03], ["speech", 9.1], ["throbbing", 5.86]], null, [["music", 69.91], ["throbbing", 6.39], ["electronic music", 4.87]], [["hum", 32.78], ["throbbing", 28.51], ["music", 28.22]], [["music", 37.96], ["synthesizer", 18.32], ["throbbing", 10.56]], [["music", 65.31], ["didgeridoo", 9.2], ["throbbing", 3.54]], null, [["hum", 43.05], ["throbbing", 22.14], ["music", 9.57]], null, [["speech", 44.13], ["music", 21.69], ["pulse", 5.71]], [["music", 18.61], ["speech", 16.39], ["siren", 16.29]], null], "duration": [11.56, 0.56, 5.05, 7.18, 2.48, 3.08, 0.82, 11.44, 52.87, 2.74, 8.16, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/uBAd6Nfv3uE_filtered.json b/annotations_filtered/uBAd6Nfv3uE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7e7f611e70f5af30d3e41518d0e141d7aaf8b23 --- /dev/null +++ b/annotations_filtered/uBAd6Nfv3uE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.42], [9.0, 12.06], [14.0, 14.96], [17.0, 21.15], [23.0, 24.6], [27.0, 27.13], [29.0, 31.24], [32.0, 33.08], [35.0, 38.03], [40.0, 55.48], [59.0, 63.46], [125.0, 125.56], [127.0, 126.99], [127.0, 127.72], [139.0, 145.25], [145.0, 145.3], [146.0, 158.45], [162.0, 178.97], [184.0, 184.52], [186.0, 200.55]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 32.63, 0.0, 32.42, 0.0, 0.0, 31.18, 0.0, 35.48, 32.26, 28.68, 0.0, 0.0, 0.0, 28.33, 0.0, 28.49, 28.92, 0.0, 29.2], "audiomae_on_audioset": [null, [["insect", 22.69], ["fly, housefly", 22.23], ["bee, wasp, etc.", 16.47]], null, [["livestock, farm animals, working animals", 36.78], ["moo", 31.22], ["cattle, bovinae", 27.46]], null, null, [["speech", 64.88], ["livestock, farm animals, working animals", 3.12], ["moo", 2.29]], null, [["moo", 41.96], ["cattle, bovinae", 37.93], ["livestock, farm animals, working animals", 13.36]], [["insect", 23.83], ["fly, housefly", 21.12], ["whale vocalization", 10.95]], [["didgeridoo", 56.29], ["music", 18.23], ["beatboxing", 6.39]], null, null, null, [["music", 78.13], ["didgeridoo", 3.22], ["throbbing", 2.33]], null, [["music", 65.65], ["speech", 4.9], ["electronic music", 4.67]], [["music", 56.48], ["speech", 6.61], ["electronic music", 5.94]], null, [["breaking", 21.0], ["speech", 17.49], ["buzz", 17.23]]], "duration": [0.42, 3.06, 0.96, 4.15, 1.6, 0.13, 2.24, 1.08, 3.03, 15.48, 4.46, 0.56, -0.01, 0.72, 6.25, 0.3, 12.45, 16.97, 0.52, 14.55]} \ No newline at end of file diff --git a/annotations_filtered/uBB3Cvxq5f8_filtered.json b/annotations_filtered/uBB3Cvxq5f8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18437fd0bc7965c0445f5a62adde034e141e44e7 --- /dev/null +++ b/annotations_filtered/uBB3Cvxq5f8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 34.28], [37.0, 39.53], [44.0, 45.89], [46.0, 50.03], [52.0, 55.21], [58.0, 59.17], [62.0, 61.86], [72.0, 73.72], [74.0, 79.2], [80.0, 80.03], [82.0, 82.78], [92.0, 93.36], [94.0, 95.37], [97.0, 97.8], [99.0, 99.01], [100.0, 100.58], [101.0, 103.89], [106.0, 106.15], [108.0, 109.98], [113.0, 114.17], [119.0, 126.27]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.12, 90.78, 0.0, 89.01, 85.72, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0, 99.87], "audiomae_on_audioset": [[["music", 48.68], ["hum", 9.6], ["throbbing", 5.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [28.28, 2.53, 1.89, 4.03, 3.21, 1.17, -0.14, 1.72, 5.2, 0.03, 0.78, 1.36, 1.37, 0.8, 0.01, 0.58, 2.89, 0.15, 1.98, 1.17, 7.27]} \ No newline at end of file diff --git a/annotations_filtered/uBFxCK913PM_filtered.json b/annotations_filtered/uBFxCK913PM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..15b8bfb3f90e7afa795d00c43c53040dc8c7a5ba --- /dev/null +++ b/annotations_filtered/uBFxCK913PM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[69.0, 70.43], [70.0, 70.46], [77.0, 77.13], [77.0, 77.19], [78.0, 99.91]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.26], "audiomae_on_audioset": [null, null, null, null, [["cattle, bovinae", 32.0], ["moo", 21.75], ["livestock, farm animals, working animals", 20.92]]], "duration": [1.43, 0.46, 0.13, 0.19, 21.91]} \ No newline at end of file diff --git a/annotations_filtered/uBP8cPLPWrQ_filtered.json b/annotations_filtered/uBP8cPLPWrQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f279e5f93e9b9ecef6498934d901ea43285599fd --- /dev/null +++ b/annotations_filtered/uBP8cPLPWrQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.29], [16.0, 18.93], [23.0, 23.55], [26.0, 26.1], [27.0, 29.24], [32.0, 31.94], [35.0, 48.9], [66.0, 66.31], [68.0, 71.51], [73.0, 74.55], [75.0, 76.65], [78.0, 78.95], [79.0, 81.57], [88.0, 88.06], [90.0, 90.73], [92.0, 92.64], [98.0, 98.81], [100.0, 128.06], [133.0, 135.65], [136.0, 137.02], [138.0, 138.18], [139.0, 141.61], [163.0, 163.71], [166.0, 166.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 81.0, 0.0, 0.0, 55.39, 0.0, 60.23, 0.0, 91.47, 0.0, 0.0, 0.0, 64.75, 0.0, 0.0, 0.0, 0.0, 44.12, 42.86, 0.0, 0.0, 65.09, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.19], ["thunk", 34.03], ["guitar", 2.7]], [["music", 53.04], ["didgeridoo", 22.27], ["musical instrument", 3.69]], null, null, null, null, null], "duration": [0.29, 2.93, 0.55, 0.1, 2.24, -0.06, 13.9, 0.31, 3.51, 1.55, 1.65, 0.95, 2.57, 0.06, 0.73, 0.64, 0.81, 28.06, 2.65, 1.02, 0.18, 2.61, 0.71, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/uBPs4AHD52Y_filtered.json b/annotations_filtered/uBPs4AHD52Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85b8a48d47266eeacdad36dafd04ddc5802eb594 --- /dev/null +++ b/annotations_filtered/uBPs4AHD52Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.3], [22.0, 21.9], [31.0, 31.68], [33.0, 33.44], [40.0, 40.81], [43.0, 48.73], [58.0, 57.77], [60.0, 60.27], [62.0, 62.78], [65.0, 65.06], [66.0, 66.34], [69.0, 69.7], [71.0, 71.22], [75.0, 74.88], [76.0, 76.52], [83.0, 83.19], [85.0, 85.89], [92.0, 92.53], [94.0, 95.71], [100.0, 100.92], [111.0, 111.59], [114.0, 114.44], [115.0, 115.67], [118.0, 124.11], [125.0, 125.47]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.31, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 54.44], ["whack, thwack", 11.93], ["speech", 3.34]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 69.78], ["speech", 8.98], ["thunk", 8.16]], null], "duration": [0.3, -0.1, 0.68, 0.44, 0.81, 5.73, -0.23, 0.27, 0.78, 0.06, 0.34, 0.7, 0.22, -0.12, 0.52, 0.19, 0.89, 0.53, 1.71, 0.92, 0.59, 0.44, 0.67, 6.11, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/uBf-pbxHb7Y_filtered.json b/annotations_filtered/uBf-pbxHb7Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd75821561ec0cc0e19b4f818d66650610e9904d --- /dev/null +++ b/annotations_filtered/uBf-pbxHb7Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.24], [11.0, 13.61], [14.0, 15.77], [18.0, 20.12], [21.0, 21.88], [23.0, 24.66], [26.0, 27.57], [28.0, 29.76], [33.0, 33.37], [35.0, 35.67], [37.0, 37.96], [39.0, 45.27], [47.0, 49.98], [54.0, 54.48], [58.0, 59.32], [61.0, 62.36], [63.0, 66.8], [68.0, 68.15], [69.0, 70.06], [72.0, 76.01], [83.0, 83.05], [84.0, 84.65], [86.0, 87.1], [89.0, 89.75], [91.0, 92.75], [93.0, 96.33], [100.0, 100.58]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 43.69, 0.0, 57.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.68, 41.46, 0.0, 0.0, 0.0, 47.08, 0.0, 0.0, 55.67, 0.0, 0.0, 0.0, 0.0, 0.0, 33.14, 0.0], "audiomae_on_audioset": [null, [["speech", 62.45], ["hum", 2.72], ["inside, small room", 2.54]], null, null, null, null, null, null, null, null, null, [["hum", 38.53], ["mains hum", 20.86], ["radio", 12.53]], [["fart", 30.5], ["whip", 12.27], ["speech", 10.9]], null, null, null, [["speech", 21.83], ["fly, housefly", 7.56], ["reverberation", 5.5]], null, null, null, null, null, null, null, null, [["fart", 13.46], ["speech", 6.08], ["boat, water vehicle", 4.8]], null], "duration": [0.24, 2.61, 1.77, 2.12, 0.88, 1.66, 1.57, 1.76, 0.37, 0.67, 0.96, 6.27, 2.98, 0.48, 1.32, 1.36, 3.8, 0.15, 1.06, 4.01, 0.05, 0.65, 1.1, 0.75, 1.75, 3.33, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/uBiewQrpBBA_filtered.json b/annotations_filtered/uBiewQrpBBA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2f030c54ddd2e70a7d48f11aa17337ba87e4d56 --- /dev/null +++ b/annotations_filtered/uBiewQrpBBA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.91], [9.0, 11.48], [12.0, 17.24], [19.0, 21.34], [24.0, 25.34], [27.0, 29.12], [30.0, 33.93], [36.0, 37.4], [39.0, 41.52], [44.0, 44.56], [49.0, 50.03], [52.0, 53.03], [54.0, 55.63], [57.0, 58.14], [61.0, 62.95], [69.0, 69.3], [73.0, 73.99], [84.0, 84.43], [86.0, 86.68], [88.0, 89.65], [91.0, 91.81], [94.0, 99.06], [100.0, 108.21], [109.0, 113.24], [114.0, 115.89], [117.0, 118.15], [119.0, 124.23], [125.0, 126.67], [127.0, 129.73]], "keep_status": [true, true, true, true, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, true], "silence_prob": [32.11, 34.37, 30.18, 36.82, 0.0, 40.64, 32.37, 0.0, 32.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.31, 33.58, 32.5, 0.0, 0.0, 31.67, 0.0, 31.98], "audiomae_on_audioset": [[["music", 46.4], ["theremin", 7.02], ["musical instrument", 6.27]], [["music", 17.89], ["wind instrument, woodwind instrument", 10.5], ["speech", 6.43]], [["music", 36.36], ["hum", 15.39], ["throbbing", 8.28]], [["music", 32.23], ["hum", 12.79], ["gong", 7.78]], null, [["music", 46.79], ["gong", 9.56], ["musical instrument", 6.58]], [["music", 31.99], ["speech", 12.99], ["mains hum", 6.27]], null, [["music", 27.91], ["synthesizer", 11.5], ["musical instrument", 5.09]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.93], ["cello", 14.85], ["double bass", 8.49]], [["mains hum", 22.07], ["hum", 20.12], ["theremin", 15.99]], [["theremin", 33.07], ["music", 25.12], ["hum", 7.77]], null, null, [["music", 51.82], ["theremin", 16.18], ["effects unit", 3.98]], null, [["speech", 17.38], ["foghorn", 16.83], ["music", 14.95]]], "duration": [4.91, 2.48, 5.24, 2.34, 1.34, 2.12, 3.93, 1.4, 2.52, 0.56, 1.03, 1.03, 1.63, 1.14, 1.95, 0.3, 0.99, 0.43, 0.68, 1.65, 0.81, 5.06, 8.21, 4.24, 1.89, 1.15, 5.23, 1.67, 2.73]} \ No newline at end of file diff --git a/annotations_filtered/uBrvKhAs4S4_filtered.json b/annotations_filtered/uBrvKhAs4S4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/uBrvKhAs4S4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/uC1Lmk5qK2Q_filtered.json b/annotations_filtered/uC1Lmk5qK2Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5608af7de897106fc51404388f17caa1905141e1 --- /dev/null +++ b/annotations_filtered/uC1Lmk5qK2Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.57], [11.0, 18.66], [20.0, 20.78], [39.0, 39.82], [41.0, 42.08], [44.0, 44.83], [47.0, 47.7], [55.0, 56.83], [58.0, 58.78], [61.0, 64.93], [71.0, 91.18], [93.0, 93.72], [106.0, 107.16], [121.0, 122.12]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 31.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.91, 32.94, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 47.93], ["speech", 13.21], ["fly, housefly", 4.69]], null, null, null, null, null, null, null, [["music", 41.58], ["speech", 6.62], ["sidetone", 5.77]], [["music", 79.95], ["didgeridoo", 4.68], ["electronic music", 1.66]], null, null, null], "duration": [1.57, 7.66, 0.78, 0.82, 1.08, 0.83, 0.7, 1.83, 0.78, 3.93, 20.18, 0.72, 1.16, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/uCCrethRf3E_filtered.json b/annotations_filtered/uCCrethRf3E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e150eaae1caa7b29361235cd5b4f47a2905bb041 --- /dev/null +++ b/annotations_filtered/uCCrethRf3E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 30.33], [43.0, 48.36], [49.0, 49.71], [51.0, 52.17], [53.0, 53.6], [54.0, 55.11], [56.0, 56.29], [63.0, 63.8], [65.0, 65.82], [68.0, 68.91], [72.0, 75.27], [79.0, 80.23], [89.0, 89.78], [96.0, 97.77], [101.0, 103.25], [105.0, 105.46], [107.0, 108.16], [113.0, 113.46], [115.0, 115.08], [116.0, 117.04]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 31.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.48, 0.0, 0.0, 0.0, 35.91, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 40.5], ["speech", 12.73], ["electronic music", 10.21]], null, null, null, null, null, null, null, null, [["music", 36.28], ["techno", 8.51], ["hum", 5.4]], null, null, null, [["music", 42.32], ["electronic music", 10.13], ["throbbing", 8.79]], null, null, null, null, null], "duration": [0.33, 5.36, 0.71, 1.17, 0.6, 1.11, 0.29, 0.8, 0.82, 0.91, 3.27, 1.23, 0.78, 1.77, 2.25, 0.46, 1.16, 0.46, 0.08, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/uCG1EiqEAEg_filtered.json b/annotations_filtered/uCG1EiqEAEg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dff39f10b8ba9f27272b513a028222f048570def --- /dev/null +++ b/annotations_filtered/uCG1EiqEAEg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 15.57], [16.0, 18.55], [20.0, 24.17], [28.0, 31.38], [37.0, 37.29], [39.0, 39.55], [40.0, 47.49], [50.0, 50.82], [55.0, 55.14], [56.0, 56.93], [62.0, 62.34], [66.0, 66.93], [68.0, 70.01], [71.0, 71.78], [73.0, 72.84], [75.0, 90.61], [92.0, 97.55], [98.0, 100.33], [102.0, 102.64], [104.0, 115.21], [118.0, 119.53]], "keep_status": [false, false, true, true, false, false, true, false, false, false, false, false, true, false, false, false, true, true, false, true, false], "silence_prob": [94.37, 58.55, 36.8, 29.99, 0.0, 0.0, 31.42, 0.0, 0.0, 0.0, 0.0, 0.0, 49.09, 0.0, 0.0, 41.14, 33.07, 42.62, 0.0, 44.26, 0.0], "audiomae_on_audioset": [null, null, [["music", 21.42], ["breaking", 12.33], ["arrow", 8.09]], [["music", 28.3], ["theremin", 11.01], ["hum", 7.59]], null, null, [["whale vocalization", 26.96], ["speech", 20.13], ["mains hum", 18.36]], null, null, null, null, null, [["hum", 20.61], ["mains hum", 8.41], ["music", 7.15]], null, null, [["hum", 53.34], ["mains hum", 14.99], ["music", 14.16]], [["speech", 18.36], ["hum", 16.0], ["music", 12.93]], [["music", 26.39], ["didgeridoo", 23.21], ["hum", 10.23]], null, [["music", 58.77], ["ambient music", 6.34], ["throbbing", 2.96]], null], "duration": [6.57, 2.55, 4.17, 3.38, 0.29, 0.55, 7.49, 0.82, 0.14, 0.93, 0.34, 0.93, 2.01, 0.78, -0.16, 15.61, 5.55, 2.33, 0.64, 11.21, 1.53]} \ No newline at end of file diff --git a/annotations_filtered/uCMat1QDt6k_filtered.json b/annotations_filtered/uCMat1QDt6k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2aedb6eff92ec0cae80151d689b0429ba01aeef --- /dev/null +++ b/annotations_filtered/uCMat1QDt6k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.8], [18.0, 19.8], [21.0, 22.05], [23.0, 31.94], [33.0, 35.68], [36.0, 39.26], [43.0, 52.15], [58.0, 62.51], [63.0, 65.48], [70.0, 72.91], [78.0, 91.79], [96.0, 98.19], [98.0, 99.25]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 53.16, 41.81, 39.64, 43.64, 52.92, 53.28, 53.97, 63.53, 51.23, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 64.92], ["theremin", 5.18], ["foghorn", 2.55]], [["speech", 31.18], ["music", 30.11], ["foghorn", 7.19]], [["music", 55.4], ["hum", 11.01], ["scary music", 7.49]], null, null, null, null, null, null], "duration": [1.8, 1.8, 1.05, 8.94, 2.68, 3.26, 9.15, 4.51, 2.48, 2.91, 13.79, 2.19, 1.25]} \ No newline at end of file diff --git a/annotations_filtered/uCV1-C_0vC8_filtered.json b/annotations_filtered/uCV1-C_0vC8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a86d02365b27bd3f7e9bd70ad72d687074d3d13d --- /dev/null +++ b/annotations_filtered/uCV1-C_0vC8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.84], [13.0, 14.28], [16.0, 16.93], [22.0, 22.92], [23.0, 23.68], [24.0, 24.83], [25.0, 27.82], [28.0, 30.6], [32.0, 32.43], [35.0, 37.4], [46.0, 47.98], [49.0, 52.64], [55.0, 57.45], [58.0, 59.48], [62.0, 62.16], [63.0, 63.39], [65.0, 65.72], [70.0, 70.36], [71.0, 71.61], [73.0, 72.99], [84.0, 85.38]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.63, 45.92, 0.0, 51.82, 0.0, 97.73, 59.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["sidetone", 13.05], ["hum", 12.03], ["throbbing", 11.35]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.84, 1.28, 0.93, 0.92, 0.68, 0.83, 2.82, 2.6, 0.43, 2.4, 1.98, 3.64, 2.45, 1.48, 0.16, 0.39, 0.72, 0.36, 0.61, -0.01, 1.38]} \ No newline at end of file diff --git a/annotations_filtered/uCZStp0Z_xg_filtered.json b/annotations_filtered/uCZStp0Z_xg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9043a10351b93a11f741ef0e3a966231f2d32d73 --- /dev/null +++ b/annotations_filtered/uCZStp0Z_xg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[58.0, 59.05], [60.0, 100.72], [101.0, 103.37], [105.0, 122.76], [124.0, 124.71], [126.0, 127.36]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 56.78, 35.77, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 64.66], ["speech", 9.84], ["timpani", 6.19]], null, null], "duration": [1.05, 40.72, 2.37, 17.76, 0.71, 1.36]} \ No newline at end of file diff --git a/annotations_filtered/uCsRqsNpF60_filtered.json b/annotations_filtered/uCsRqsNpF60_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8dc9849b657da5770e28736e11a4981e0b245cb --- /dev/null +++ b/annotations_filtered/uCsRqsNpF60_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.5], [5.0, 5.91], [7.0, 7.7], [9.0, 14.72], [16.0, 32.34], [37.0, 38.94], [41.0, 57.96], [60.0, 66.82], [69.0, 73.68], [76.0, 78.02], [82.0, 89.14], [91.0, 91.49], [93.0, 100.23], [106.0, 111.28], [112.0, 111.89], [113.0, 116.8], [117.0, 116.83], [117.0, 116.97], [119.0, 119.74], [124.0, 126.62], [130.0, 147.24], [150.0, 160.66]], "keep_status": [false, false, false, true, false, false, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.45, 41.2, 0.0, 40.7, 61.27, 36.15, 46.02, 41.74, 0.0, 40.14, 54.1, 0.0, 43.1, 0.0, 0.0, 0.0, 75.88, 35.16, 34.91], "audiomae_on_audioset": [null, null, null, [["music", 22.82], ["throbbing", 19.03], ["sidetone", 11.65]], [["music", 47.48], ["hum", 20.96], ["mains hum", 7.28]], null, [["music", 36.05], ["hum", 14.87], ["speech", 7.99]], null, [["music", 43.19], ["whack, thwack", 7.44], ["sigh", 4.12]], [["music", 49.86], ["throbbing", 24.09], ["hum", 6.06]], [["throbbing", 33.16], ["music", 21.95], ["moo", 7.5]], null, [["thunk", 85.71], ["music", 6.95], ["door", 1.45]], null, null, [["music", 46.87], ["speech", 15.14], ["didgeridoo", 9.21]], null, null, null, null, [["music", 52.93], ["whack, thwack", 18.01], ["throbbing", 3.81]], [["mains hum", 49.45], ["hum", 31.88], ["music", 7.06]]], "duration": [0.5, 0.91, 0.7, 5.72, 16.34, 1.94, 16.96, 6.82, 4.68, 2.02, 7.14, 0.49, 7.23, 5.28, -0.11, 3.8, -0.17, -0.03, 0.74, 2.62, 17.24, 10.66]} \ No newline at end of file diff --git a/annotations_filtered/uCtMTbKX6_I_filtered.json b/annotations_filtered/uCtMTbKX6_I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5e274e86820f81f704af33f7430af3ed3007830 --- /dev/null +++ b/annotations_filtered/uCtMTbKX6_I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 18.44], [28.0, 40.37], [51.0, 51.27], [62.0, 62.29], [65.0, 65.16], [81.0, 80.89], [86.0, 86.68], [92.0, 91.84], [96.0, 96.01], [98.0, 98.04], [101.0, 101.87], [103.0, 103.69], [104.0, 104.89], [106.0, 107.25], [109.0, 109.11], [112.0, 113.86], [118.0, 118.1], [121.0, 121.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.38, 34.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 77.75], ["musical instrument", 2.55], ["guitar", 1.52]], [["music", 66.2], ["speech", 5.36], ["didgeridoo", 2.96]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.44, 12.37, 0.27, 0.29, 0.16, -0.11, 0.68, -0.16, 0.01, 0.04, 0.87, 0.69, 0.89, 1.25, 0.11, 1.86, 0.1, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/uD2mdsAwJBA_filtered.json b/annotations_filtered/uD2mdsAwJBA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ffd79554819a7e4d3a8a442a33163f1ef92bddf --- /dev/null +++ b/annotations_filtered/uD2mdsAwJBA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.27], [14.0, 14.98], [17.0, 24.0], [29.0, 31.43], [36.0, 38.8], [53.0, 54.84], [65.0, 94.31], [104.0, 114.88]], "keep_status": [false, false, false, true, true, false, false, false], "silence_prob": [32.96, 0.0, 35.48, 46.4, 42.91, 0.0, 33.13, 32.56], "audiomae_on_audioset": [[["music", 58.23], ["boing", 15.17], ["echo", 3.34]], null, [["music", 75.77], ["musical instrument", 2.0], ["speech", 1.61]], [["music", 42.81], ["echo", 6.53], ["synthesizer", 5.92]], [["music", 49.18], ["trombone", 6.33], ["foghorn", 6.03]], null, [["music", 81.79], ["trombone", 5.06], ["brass instrument", 5.03]], [["music", 87.82], ["swing music", 2.87], ["yodeling", 1.34]]], "duration": [5.27, 0.98, 7.0, 2.43, 2.8, 1.84, 29.31, 10.88]} \ No newline at end of file diff --git a/annotations_filtered/uDAIoSeEoZA_filtered.json b/annotations_filtered/uDAIoSeEoZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0bc8fafbf9c8c39b3e43a3ba3fb6f70a7bcacac --- /dev/null +++ b/annotations_filtered/uDAIoSeEoZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.05], [11.0, 11.23], [19.0, 21.56], [38.0, 38.43], [44.0, 45.62], [47.0, 47.95], [54.0, 53.77], [55.0, 55.26], [57.0, 57.75], [62.0, 62.77]], "keep_status": [false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["bee, wasp, etc.", 25.33], ["fly, housefly", 15.28], ["speech", 13.99]], null, null, null, null, null, null, null], "duration": [0.05, 0.23, 2.56, 0.43, 1.62, 0.95, -0.23, 0.26, 0.75, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/uDISBx2Ry7s_filtered.json b/annotations_filtered/uDISBx2Ry7s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b19a57c954188173229ee90adbf10396a0084bed --- /dev/null +++ b/annotations_filtered/uDISBx2Ry7s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 18.0], [20.0, 26.28], [32.0, 35.18], [36.0, 37.08], [41.0, 42.92], [45.0, 45.84], [57.0, 57.59], [58.0, 59.32], [61.0, 67.37], [69.0, 69.84], [70.0, 72.17], [90.0, 91.89], [92.0, 98.05], [99.0, 100.48], [101.0, 107.91], [110.0, 113.22], [117.0, 121.2], [122.0, 126.37]], "keep_status": [true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [35.57, 40.24, 82.61, 0.0, 0.0, 0.0, 0.0, 0.0, 38.08, 0.0, 55.81, 0.0, 70.72, 0.0, 83.88, 70.72, 95.78, 64.41], "audiomae_on_audioset": [[["hum", 16.38], ["whack, thwack", 12.36], ["mains hum", 6.63]], [["speech", 23.83], ["mains hum", 16.29], ["bee, wasp, etc.", 12.56]], null, null, null, null, null, null, [["rowboat, canoe, kayak", 21.94], ["fly, housefly", 7.88], ["boat, water vehicle", 6.0]], null, null, null, null, null, null, null, null, null], "duration": [12.0, 6.28, 3.18, 1.08, 1.92, 0.84, 0.59, 1.32, 6.37, 0.84, 2.17, 1.89, 6.05, 1.48, 6.91, 3.22, 4.2, 4.37]} \ No newline at end of file diff --git a/annotations_filtered/uDJsCE01LYI_filtered.json b/annotations_filtered/uDJsCE01LYI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f90ab34d60544bc9c45059e557e508fd7995dad --- /dev/null +++ b/annotations_filtered/uDJsCE01LYI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.83], [16.0, 17.63], [32.0, 33.52], [34.0, 35.34], [37.0, 37.42], [39.0, 40.07], [43.0, 43.09], [44.0, 44.25], [46.0, 47.06], [49.0, 52.15], [53.0, 60.22], [61.0, 61.7], [62.0, 65.33], [66.0, 66.56], [67.0, 66.6], [67.0, 67.07], [77.0, 77.19], [84.0, 84.55], [86.0, 86.39], [90.0, 94.36], [95.0, 95.55], [97.0, 97.16], [104.0, 111.47], [114.0, 114.66], [120.0, 122.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.29, 62.37, 0.0, 41.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.68, 0.0, 0.0, 29.8, 0.0, 34.4], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["fart", 38.78], ["speech", 36.23], ["crushing", 7.83]], null, null, [["speech", 52.12], ["fart", 22.29], ["reverberation", 3.47]], null, null, null, null, null, null, [["music", 57.06], ["fart", 3.96], ["speech", 2.59]], null, null, [["music", 56.62], ["speech", 9.25], ["synthesizer", 6.11]], null, [["music", 37.65], ["speech", 13.49], ["didgeridoo", 4.19]]], "duration": [0.83, 1.63, 1.52, 1.34, 0.42, 1.07, 0.09, 0.25, 1.06, 3.15, 7.22, 0.7, 3.33, 0.56, -0.4, 0.07, 0.19, 0.55, 0.39, 4.36, 0.55, 0.16, 7.47, 0.66, 2.34]} \ No newline at end of file diff --git a/annotations_filtered/uDffmOSVnBM_filtered.json b/annotations_filtered/uDffmOSVnBM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33c6fc88f7dcbf417d85813f7254482bfc53cd7a --- /dev/null +++ b/annotations_filtered/uDffmOSVnBM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 18.03], [21.0, 29.44], [32.0, 34.01], [71.0, 75.05], [79.0, 80.76], [107.0, 115.25], [141.0, 142.5], [156.0, 157.44], [160.0, 160.41], [161.0, 161.74]], "keep_status": [false, true, false, true, false, false, false, false, false, false], "silence_prob": [39.47, 30.22, 61.27, 28.78, 0.0, 28.39, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 56.85], ["synthesizer", 10.25], ["hum", 4.44]], [["speech", 33.55], ["music", 26.91], ["explosion", 4.37]], null, [["speech", 48.76], ["music", 9.64], ["breaking", 4.54]], null, [["speech", 61.22], ["explosion", 15.8], ["eruption", 4.87]], null, null, null, null], "duration": [8.03, 8.44, 2.01, 4.05, 1.76, 8.25, 1.5, 1.44, 0.41, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/uDimGOcZ24U_filtered.json b/annotations_filtered/uDimGOcZ24U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71cfc79bd919e6e08038e3a43ada36cd846a0dd9 --- /dev/null +++ b/annotations_filtered/uDimGOcZ24U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.56], [4.0, 4.58], [7.0, 8.41], [10.0, 10.47], [11.0, 12.72], [13.0, 21.34], [22.0, 22.28], [24.0, 28.93], [30.0, 33.29], [35.0, 35.5], [38.0, 41.4], [41.0, 41.44], [53.0, 53.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 34.53, 0.0, 30.53, 32.43, 0.0, 34.1, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 48.96], ["speech", 19.46], ["fly, housefly", 3.21]], null, [["music", 70.96], ["throbbing", 4.82], ["electronic music", 3.62]], [["music", 67.83], ["speech", 9.33], ["hum", 3.14]], null, [["music", 68.21], ["speech", 9.91], ["electronic music", 3.57]], null, null], "duration": [1.56, 0.58, 1.41, 0.47, 1.72, 8.34, 0.28, 4.93, 3.29, 0.5, 3.4, 0.44, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/uDqSQGOtixE_filtered.json b/annotations_filtered/uDqSQGOtixE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a2a42408e10ff00279cd250d0455c8e38bf36a91 --- /dev/null +++ b/annotations_filtered/uDqSQGOtixE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 14.44], [17.0, 19.13], [22.0, 22.42], [32.0, 33.47], [34.0, 34.21], [47.0, 48.12], [54.0, 55.02], [59.0, 59.53], [66.0, 65.94], [83.0, 83.67], [88.0, 89.18], [97.0, 97.34]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.49, 40.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["moo", 30.47], ["cattle, bovinae", 29.3], ["livestock, farm animals, working animals", 28.2]], [["music", 32.69], ["musical instrument", 8.78], ["speech", 6.49]], null, null, null, null, null, null, null, null, null, null], "duration": [6.44, 2.13, 0.42, 1.47, 0.21, 1.12, 1.02, 0.53, -0.06, 0.67, 1.18, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/uDr8qT3BlHM_filtered.json b/annotations_filtered/uDr8qT3BlHM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..848fe21c5340492dd0ae2c4ca6fa3ceb02074b17 --- /dev/null +++ b/annotations_filtered/uDr8qT3BlHM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 21.15], [22.0, 23.23], [25.0, 25.02], [28.0, 29.0], [36.0, 35.55], [37.0, 37.42], [41.0, 41.79], [43.0, 43.48], [45.0, 48.14], [49.0, 49.87], [53.0, 54.06], [55.0, 66.16], [68.0, 70.31], [71.0, 71.19], [77.0, 78.81], [79.0, 80.37], [81.0, 80.92], [83.0, 86.78], [89.0, 92.03], [97.0, 101.01], [104.0, 104.79], [106.0, 106.3], [108.0, 110.94], [117.0, 119.08], [119.0, 120.85], [126.0, 129.81], [130.0, 129.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.46, 0.0, 0.0, 99.96, 97.43, 0.0, 0.0, 0.0, 0.0, 100.0, 87.55, 94.81, 0.0, 0.0, 100.0, 99.87, 0.0, 99.88, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.15, 1.23, 0.02, 1.0, -0.45, 0.42, 0.79, 0.48, 3.14, 0.87, 1.06, 11.16, 2.31, 0.19, 1.81, 1.37, -0.08, 3.78, 3.03, 4.01, 0.79, 0.3, 2.94, 2.08, 1.85, 3.81, -0.09]} \ No newline at end of file diff --git a/annotations_filtered/uE-l84hG_BE_filtered.json b/annotations_filtered/uE-l84hG_BE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d8f3aef999b5233af64cf44fefdfec51601a295 --- /dev/null +++ b/annotations_filtered/uE-l84hG_BE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.72], [16.0, 17.86], [24.0, 37.88], [42.0, 43.16], [48.0, 48.14], [49.0, 53.43], [54.0, 54.73], [55.0, 55.9], [57.0, 57.97], [58.0, 59.05], [61.0, 60.98], [72.0, 73.45], [94.0, 97.82], [101.0, 101.75], [107.0, 107.77], [109.0, 109.36], [112.0, 114.25], [116.0, 117.0], [125.0, 125.05], [138.0, 139.51], [142.0, 142.55], [145.0, 144.91], [146.0, 150.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.04, 0.0, 0.0, 33.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.57, 0.0, 0.0, 0.0, 40.17, 0.0, 0.0, 0.0, 0.0, 0.0, 53.4], "audiomae_on_audioset": [null, null, [["music", 55.03], ["musical instrument", 8.43], ["speech", 6.57]], null, null, [["speech", 45.54], ["thunk", 17.41], ["music", 14.67]], null, null, null, null, null, null, [["music", 71.73], ["didgeridoo", 18.79], ["musical instrument", 3.63]], null, null, null, [["music", 54.88], ["synthesizer", 7.8], ["speech", 7.23]], null, null, null, null, null, null], "duration": [0.72, 1.86, 13.88, 1.16, 0.14, 4.43, 0.73, 0.9, 0.97, 1.05, -0.02, 1.45, 3.82, 0.75, 0.77, 0.36, 2.25, 1.0, 0.05, 1.51, 0.55, -0.09, 4.43]} \ No newline at end of file diff --git a/annotations_filtered/uE0DBpw09SU_filtered.json b/annotations_filtered/uE0DBpw09SU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09a7e170af21e10434ad407510c5ca7a266b0b17 --- /dev/null +++ b/annotations_filtered/uE0DBpw09SU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.97], [8.0, 9.61], [12.0, 12.28], [13.0, 13.58], [19.0, 18.84], [23.0, 23.57], [24.0, 25.42], [26.0, 31.11], [35.0, 62.9], [64.0, 110.42], [111.0, 115.92], [116.0, 119.31], [120.0, 120.66], [122.0, 125.04], [126.0, 127.18], [127.0, 129.69], [131.0, 132.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.23, 81.53, 0.0, 49.64, 38.28, 0.0, 77.87, 0.0, 65.55, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 22.08], ["didgeridoo", 17.03], ["speech", 16.81]], [["speech", 52.27], ["music", 9.83], ["sidetone", 4.15]], null, null, null, null, null], "duration": [0.97, 1.61, 0.28, 0.58, -0.16, 0.57, 1.42, 5.11, 27.9, 46.42, 4.92, 3.31, 0.66, 3.04, 1.18, 2.69, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/uE8yYJmpxeI_filtered.json b/annotations_filtered/uE8yYJmpxeI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b79a86137bd0360c6d867a3057f0dcc864e31fff --- /dev/null +++ b/annotations_filtered/uE8yYJmpxeI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 31.21], [34.0, 48.57], [49.0, 55.95], [58.0, 64.23], [65.0, 83.37], [86.0, 99.1], [100.0, 120.11], [122.0, 123.57], [126.0, 126.27], [127.0, 130.08], [132.0, 132.87], [134.0, 134.4], [142.0, 143.56], [146.0, 148.26]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [47.01, 49.92, 31.08, 33.05, 38.11, 29.98, 42.55, 0.0, 0.0, 98.93, 0.0, 0.0, 0.0, 98.86], "audiomae_on_audioset": [[["music", 37.13], ["theremin", 15.07], ["synthesizer", 10.69]], [["music", 49.78], ["thunk", 8.65], ["theremin", 7.45]], [["fly, housefly", 46.2], ["mosquito", 26.24], ["insect", 11.99]], [["speech", 49.44], ["hum", 12.54], ["music", 10.33]], [["quack", 39.79], ["music", 36.47], ["duck", 6.17]], [["music", 57.1], ["whale vocalization", 22.43], ["sound effect", 1.99]], [["music", 49.13], ["bow-wow", 12.11], ["animal", 11.62]], null, null, null, null, null, null, null], "duration": [26.21, 14.57, 6.95, 6.23, 18.37, 13.1, 20.11, 1.57, 0.27, 3.08, 0.87, 0.4, 1.56, 2.26]} \ No newline at end of file diff --git a/annotations_filtered/uEJ_Ak34ias_filtered.json b/annotations_filtered/uEJ_Ak34ias_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..472a16324735bfab4ebb1cc945df9a0e3c723d4a --- /dev/null +++ b/annotations_filtered/uEJ_Ak34ias_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.87], [5.0, 5.36], [5.0, 5.73], [7.0, 8.28], [12.0, 18.25], [19.0, 19.9], [21.0, 21.66], [23.0, 23.95], [26.0, 26.5], [29.0, 35.55], [39.0, 41.86], [43.0, 43.38], [45.0, 45.93], [48.0, 48.27], [50.0, 50.67], [51.0, 56.84], [58.0, 58.19], [58.0, 60.88], [62.0, 65.92], [72.0, 73.33], [77.0, 78.14], [79.0, 79.73], [81.0, 82.19], [83.0, 86.09], [87.0, 92.79], [93.0, 97.75], [98.0, 99.22], [100.0, 100.53], [103.0, 104.33], [105.0, 107.52], [108.0, 110.52], [111.0, 115.1], [116.0, 125.1], [126.0, 126.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 96.04, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 57.32, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 96.77, 95.91, 0.0, 0.0, 0.0, 32.19, 100.0, 100.0, 39.94, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 26.93], ["speech", 13.24], ["livestock, farm animals, working animals", 10.32]], null, null, [["speech", 54.69], ["music", 11.3], ["inside, small room", 2.63]], null], "duration": [-0.13, 0.36, 0.73, 1.28, 6.25, 0.9, 0.66, 0.95, 0.5, 6.55, 2.86, 0.38, 0.93, 0.27, 0.67, 5.84, 0.19, 2.88, 3.92, 1.33, 1.14, 0.73, 1.19, 3.09, 5.79, 4.75, 1.22, 0.53, 1.33, 2.52, 2.52, 4.1, 9.1, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/uEMTQYe1ro0_filtered.json b/annotations_filtered/uEMTQYe1ro0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54eb56bd12da0a3f62c9ff06e066a790f121dfa0 --- /dev/null +++ b/annotations_filtered/uEMTQYe1ro0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 46.63], [47.0, 47.07], [47.0, 63.66], [72.0, 76.45], [78.0, 108.84], [109.0, 110.03], [110.0, 115.77], [117.0, 175.98], [179.0, 221.71], [223.0, 224.38]], "keep_status": [false, false, false, true, false, false, false, false, false, false], "silence_prob": [35.51, 0.0, 30.45, 29.91, 0.0, 0.0, 43.3, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 69.37], ["sine wave", 4.11], ["singing bowl", 3.78]], null, [["music", 75.84], ["musical instrument", 3.02], ["hum", 1.47]], [["fly, housefly", 30.99], ["mosquito", 30.9], ["mains hum", 5.8]], null, null, [["music", 73.07], ["rumble", 3.92], ["roaring cats (lions, tigers)", 3.92]], null, null, null], "duration": [21.63, 0.07, 16.66, 4.45, 30.84, 1.03, 5.77, 58.98, 42.71, 1.38]} \ No newline at end of file diff --git a/annotations_filtered/uETwKF_fgKw_filtered.json b/annotations_filtered/uETwKF_fgKw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b721b8052d8d11704cdeb97b659fd3e5210de13 --- /dev/null +++ b/annotations_filtered/uETwKF_fgKw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.93], [23.0, 30.89], [33.0, 36.26], [39.0, 40.54], [41.0, 41.27], [42.0, 42.3], [44.0, 44.78], [45.0, 63.37], [68.0, 69.92], [74.0, 74.38], [76.0, 76.57], [78.0, 86.56], [89.0, 93.02], [95.0, 135.94], [136.0, 138.0], [142.0, 142.37], [148.0, 148.37], [155.0, 159.92], [169.0, 168.91], [169.0, 187.44], [190.0, 200.04]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.07, 32.43, 0.0, 0.0, 0.0, 0.0, 34.14, 0.0, 0.0, 0.0, 31.57, 30.36, 0.0, 30.85, 0.0, 0.0, 30.95, 0.0, 30.74, 31.32], "audiomae_on_audioset": [null, [["music", 60.96], ["didgeridoo", 12.62], ["musical instrument", 7.85]], [["music", 43.94], ["didgeridoo", 11.52], ["synthesizer", 5.88]], null, null, null, null, [["music", 79.28], ["synthesizer", 3.37], ["thunk", 2.74]], null, null, null, [["music", 83.92], ["wind instrument, woodwind instrument", 2.31], ["musical instrument", 1.54]], [["music", 60.95], ["didgeridoo", 5.56], ["wind instrument, woodwind instrument", 4.22]], null, [["music", 57.39], ["boing", 13.85], ["quack", 4.87]], null, null, [["music", 53.71], ["speech", 11.34], ["clarinet", 8.56]], null, [["music", 80.01], ["speech", 2.75], ["quack", 2.11]], [["music", 61.9], ["wind instrument, woodwind instrument", 16.84], ["harmonica", 4.76]]], "duration": [0.93, 7.89, 3.26, 1.54, 0.27, 0.3, 0.78, 18.37, 1.92, 0.38, 0.57, 8.56, 4.02, 40.94, 2.0, 0.37, 0.37, 4.92, -0.09, 18.44, 10.04]} \ No newline at end of file diff --git a/annotations_filtered/uEV9jxF2tOo_filtered.json b/annotations_filtered/uEV9jxF2tOo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..212813ed2450498d39a65d3bbabd7a017a3faef2 --- /dev/null +++ b/annotations_filtered/uEV9jxF2tOo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.93], [6.0, 7.91], [9.0, 10.4], [11.0, 12.77], [15.0, 39.16], [43.0, 45.89], [47.0, 48.2], [52.0, 72.01]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [60.32, 0.0, 0.0, 0.0, 29.89, 30.86, 0.0, 29.92], "audiomae_on_audioset": [null, null, null, null, [["speech", 54.04], ["music", 16.71], ["hum", 4.78]], [["music", 61.57], ["speech", 13.92], ["sidetone", 6.58]], null, [["speech", 40.08], ["music", 33.74], ["whack, thwack", 6.4]]], "duration": [3.93, 1.91, 1.4, 1.77, 24.16, 2.89, 1.2, 20.01]} \ No newline at end of file diff --git a/annotations_filtered/uEW0FlmiNec_filtered.json b/annotations_filtered/uEW0FlmiNec_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0d3e92273d6fe0783096a07d1d15c87e9730146 --- /dev/null +++ b/annotations_filtered/uEW0FlmiNec_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.49], [10.0, 10.76], [14.0, 16.8], [19.0, 21.02], [24.0, 24.51], [28.0, 29.03], [30.0, 30.92], [33.0, 33.54], [40.0, 41.12], [42.0, 43.5], [44.0, 44.85], [47.0, 50.9], [52.0, 53.42], [57.0, 58.13], [59.0, 60.72], [64.0, 67.1], [75.0, 76.42], [85.0, 87.2], [90.0, 90.19], [92.0, 95.2], [103.0, 105.51], [111.0, 112.45], [118.0, 117.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 50.21, 39.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.89, 0.0, 0.0, 0.0, 53.22, 0.0, 60.42, 0.0, 43.15, 71.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 30.28], ["speech", 28.02], ["synthesizer", 12.55]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.33], ["speech", 19.03], ["didgeridoo", 10.35]], null, null, null], "duration": [0.49, 0.76, 2.8, 2.02, 0.51, 1.03, 0.92, 0.54, 1.12, 1.5, 0.85, 3.9, 1.42, 1.13, 1.72, 3.1, 1.42, 2.2, 0.19, 3.2, 2.51, 1.45, -0.22]} \ No newline at end of file diff --git a/annotations_filtered/uEYm9Zm5zI8_filtered.json b/annotations_filtered/uEYm9Zm5zI8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..359d9344931ac5c8eec4dd3520e2041613a72926 --- /dev/null +++ b/annotations_filtered/uEYm9Zm5zI8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.0], [14.0, 15.31], [16.0, 17.42], [20.0, 34.57], [38.0, 43.78], [50.0, 58.11]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.9, 31.44, 34.93], "audiomae_on_audioset": [null, null, null, [["speech", 31.12], ["whack, thwack", 11.71], ["music", 6.52]], [["speech", 32.76], ["music", 25.93], ["sidetone", 13.03]], [["hum", 38.02], ["throbbing", 26.18], ["speech", 12.58]]], "duration": [0.0, 1.31, 1.42, 14.57, 5.78, 8.11]} \ No newline at end of file diff --git a/annotations_filtered/uE_EjcgtiVI_filtered.json b/annotations_filtered/uE_EjcgtiVI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c9afb1d524fe060ec33943bf798bccb28e7eb1f --- /dev/null +++ b/annotations_filtered/uE_EjcgtiVI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.31], [5.0, 5.48], [17.0, 18.39], [30.0, 31.65], [43.0, 44.58], [52.0, 59.44], [71.0, 72.01], [72.0, 72.05], [84.0, 85.72], [94.0, 95.5], [96.0, 98.91], [110.0, 111.99], [114.0, 115.18], [118.0, 118.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 39.07, 0.0, 0.0, 0.0, 0.0, 33.24, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 63.75], ["musical instrument", 4.11], ["theremin", 3.79]], null, null, null, null, [["music", 78.25], ["trombone", 3.06], ["brass instrument", 1.9]], null, null, null], "duration": [0.31, 0.48, 1.39, 1.65, 1.58, 7.44, 1.01, 0.05, 1.72, 1.5, 2.91, 1.99, 1.18, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/uF7ftHMCN1w_filtered.json b/annotations_filtered/uF7ftHMCN1w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..674b59251f223d2ca196a767c37e9cedbcd08061 --- /dev/null +++ b/annotations_filtered/uF7ftHMCN1w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.58], [26.0, 26.18], [35.0, 36.76], [48.0, 47.73], [53.0, 52.88], [58.0, 59.46], [66.0, 69.45], [70.0, 72.32], [73.0, 74.85], [77.0, 77.48], [79.0, 80.23], [81.0, 83.98], [86.0, 86.19], [87.0, 87.91], [90.0, 90.39], [98.0, 100.9], [104.0, 103.79], [107.0, 108.24], [111.0, 111.62], [117.0, 117.8], [118.0, 120.24], [122.0, 122.45], [123.0, 122.69], [123.0, 123.72], [124.0, 124.51], [126.0, 126.67], [127.0, 128.66], [133.0, 133.84], [137.0, 138.16], [139.0, 139.26], [141.0, 141.72], [144.0, 145.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.24, 93.76, 0.0, 0.0, 0.0, 97.33, 0.0, 0.0, 0.0, 33.42, 0.0, 0.0, 0.0, 0.0, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["moo", 40.5], ["cattle, bovinae", 38.51], ["livestock, farm animals, working animals", 13.73]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.58, 0.18, 1.76, -0.27, -0.12, 1.46, 3.45, 2.32, 1.85, 0.48, 1.23, 2.98, 0.19, 0.91, 0.39, 2.9, -0.21, 1.24, 0.62, 0.8, 2.24, 0.45, -0.31, 0.72, 0.51, 0.67, 1.66, 0.84, 1.16, 0.26, 0.72, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/uFHReMA18_c_filtered.json b/annotations_filtered/uFHReMA18_c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe45c5375d8979420b038f2a81ce0c88ccc20de4 --- /dev/null +++ b/annotations_filtered/uFHReMA18_c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.0], [2.0, 2.05], [6.0, 6.71], [10.0, 10.52], [11.0, 11.53], [16.0, 16.26], [31.0, 33.79], [38.0, 41.5], [42.0, 48.14], [51.0, 51.7], [53.0, 54.13], [56.0, 62.5], [64.0, 72.52], [74.0, 74.41], [76.0, 77.95], [98.0, 101.82], [112.0, 114.4], [115.0, 116.4], [117.0, 118.18], [124.0, 124.92], [127.0, 127.82]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 32.89, 99.68, 0.0, 0.0, 90.95, 58.55, 0.0, 0.0, 94.66, 90.6, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 34.51], ["whack, thwack", 8.23], ["smash, crash", 4.9]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.0, 0.05, 0.71, 0.52, 0.53, 0.26, 2.79, 3.5, 6.14, 0.7, 1.13, 6.5, 8.52, 0.41, 1.95, 3.82, 2.4, 1.4, 1.18, 0.92, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/uFNIrs3jtEQ_filtered.json b/annotations_filtered/uFNIrs3jtEQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4120b3d226d54a86c4c8b51070e6644a7d773e8 --- /dev/null +++ b/annotations_filtered/uFNIrs3jtEQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.23], [12.0, 13.14], [13.0, 17.0], [19.0, 19.4], [21.0, 21.59], [22.0, 23.16], [25.0, 26.42], [27.0, 28.05], [29.0, 29.59], [30.0, 31.83], [37.0, 37.03], [38.0, 38.99], [41.0, 42.75], [43.0, 44.19], [47.0, 49.44], [53.0, 55.49], [57.0, 60.64], [63.0, 63.59], [83.0, 84.28], [85.0, 86.04], [87.0, 87.03], [90.0, 90.71], [94.0, 94.63], [97.0, 99.77], [101.0, 100.89], [102.0, 102.32], [108.0, 109.16], [111.0, 110.89], [115.0, 116.82], [118.0, 117.96], [121.0, 122.67], [125.0, 127.6], [130.0, 135.9], [146.0, 147.88], [150.0, 150.13], [151.0, 150.7], [153.0, 154.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 80.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.92, 100.0, 67.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.74, 42.33, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 71.87], ["telephone", 12.35], ["dial tone", 4.3]], null, null, null, null], "duration": [0.23, 1.14, 4.0, 0.4, 0.59, 1.16, 1.42, 1.05, 0.59, 1.83, 0.03, 0.99, 1.75, 1.19, 2.44, 2.49, 3.64, 0.59, 1.28, 1.04, 0.03, 0.71, 0.63, 2.77, -0.11, 0.32, 1.16, -0.11, 1.82, -0.04, 1.67, 2.6, 5.9, 1.88, 0.13, -0.3, 1.47]} \ No newline at end of file diff --git a/annotations_filtered/uFTd09NNJzo_filtered.json b/annotations_filtered/uFTd09NNJzo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec8c8e08b39e5a70785797f2d84891468e37f34f --- /dev/null +++ b/annotations_filtered/uFTd09NNJzo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.43], [8.0, 9.39], [11.0, 11.35], [15.0, 147.45], [151.0, 152.56]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.43, 1.39, 0.35, 132.45, 1.56]} \ No newline at end of file diff --git a/annotations_filtered/uF_721BvdJE_filtered.json b/annotations_filtered/uF_721BvdJE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62ac71d168416b973e8cabcddaba45b70b693255 --- /dev/null +++ b/annotations_filtered/uF_721BvdJE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 51.49]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [39.49]} \ No newline at end of file diff --git a/annotations_filtered/uG_KHjd_PSc_filtered.json b/annotations_filtered/uG_KHjd_PSc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35b8f42cab7fc85ec23fba0679e377a74555d4a0 --- /dev/null +++ b/annotations_filtered/uG_KHjd_PSc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.31], [2.0, 2.32], [14.0, 17.58], [19.0, 20.85], [28.0, 32.46], [33.0, 36.81], [39.0, 40.54], [41.0, 42.33], [43.0, 44.02], [47.0, 48.32], [49.0, 50.13], [51.0, 51.81], [56.0, 55.98], [64.0, 65.43], [72.0, 72.55], [75.0, 91.39], [92.0, 93.97], [95.0, 95.69], [97.0, 96.92], [101.0, 104.45], [106.0, 112.36], [115.0, 115.77], [118.0, 118.25], [123.0, 124.29], [127.0, 130.89], [132.0, 133.35], [135.0, 135.01], [139.0, 138.81], [143.0, 145.74], [150.0, 151.34], [153.0, 154.01], [157.0, 157.17], [158.0, 158.3], [160.0, 162.13], [163.0, 163.49], [168.0, 168.84], [171.0, 172.25], [174.0, 177.45]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.85, 0.0, 36.78, 36.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.6, 0.0, 0.0, 0.0, 29.0, 29.03, 0.0, 0.0, 0.0, 39.47, 0.0, 0.0, 0.0, 55.89, 0.0, 0.0, 0.0, 0.0, 73.97, 0.0, 0.0, 0.0, 52.27], "audiomae_on_audioset": [null, null, [["music", 67.49], ["musical instrument", 3.53], ["guitar", 2.31]], null, [["hum", 24.81], ["speech", 11.13], ["mains hum", 8.18]], [["hum", 33.5], ["speech", 16.44], ["mains hum", 6.58]], null, null, null, null, null, null, null, null, null, [["sonar", 25.86], ["music", 17.31], ["hum", 15.76]], null, null, null, [["speech", 23.75], ["music", 9.56], ["radio", 5.12]], [["music", 63.34], ["didgeridoo", 18.3], ["speech", 5.07]], null, null, null, [["speech", 50.48], ["throbbing", 12.62], ["music", 8.11]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.31, 0.32, 3.58, 1.85, 4.46, 3.81, 1.54, 1.33, 1.02, 1.32, 1.13, 0.81, -0.02, 1.43, 0.55, 16.39, 1.97, 0.69, -0.08, 3.45, 6.36, 0.77, 0.25, 1.29, 3.89, 1.35, 0.01, -0.19, 2.74, 1.34, 1.01, 0.17, 0.3, 2.13, 0.49, 0.84, 1.25, 3.45]} \ No newline at end of file diff --git a/annotations_filtered/uGg9-5_0On4_filtered.json b/annotations_filtered/uGg9-5_0On4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4454cdc14a41067da185e7ae2f514c9f460b253f --- /dev/null +++ b/annotations_filtered/uGg9-5_0On4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.05], [18.0, 18.96], [20.0, 33.34], [36.0, 37.13], [40.0, 40.2], [42.0, 42.7], [51.0, 51.11], [57.0, 58.08], [64.0, 65.64], [68.0, 69.15], [71.0, 78.76], [79.0, 84.42], [104.0, 105.81], [109.0, 110.89], [112.0, 114.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 91.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.92, 97.73, 0.0, 0.0, 84.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.05, 0.96, 13.34, 1.13, 0.2, 0.7, 0.11, 1.08, 1.64, 1.15, 7.76, 5.42, 1.81, 1.89, 2.12]} \ No newline at end of file diff --git a/annotations_filtered/uGrrtkaWoU8_filtered.json b/annotations_filtered/uGrrtkaWoU8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b11c0644b199bbbaa380fccbc60d66c29de4442 --- /dev/null +++ b/annotations_filtered/uGrrtkaWoU8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 19.92], [23.0, 60.88], [65.0, 69.99], [70.0, 71.25], [94.0, 97.24], [99.0, 120.93], [122.0, 122.72]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [95.37, 0.0, 49.73, 0.0, 67.76, 75.88, 0.0], "audiomae_on_audioset": [null, null, [["music", 28.67], ["sidetone", 22.24], ["speech", 17.3]], null, null, null, null], "duration": [4.92, 37.88, 4.99, 1.25, 3.24, 21.93, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/uGsWYV2bWAc_filtered.json b/annotations_filtered/uGsWYV2bWAc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45da8c32335d46fba08ede8afab553df52d73473 --- /dev/null +++ b/annotations_filtered/uGsWYV2bWAc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 80.7]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [49.7]} \ No newline at end of file diff --git a/annotations_filtered/uGstM8QMCjQ_filtered.json b/annotations_filtered/uGstM8QMCjQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4c44c8b672843d8eccdf317a761d89df775d6aa --- /dev/null +++ b/annotations_filtered/uGstM8QMCjQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 27.4], [29.0, 33.52], [34.0, 34.13], [35.0, 35.65], [38.0, 37.93], [42.0, 42.31], [43.0, 44.54], [45.0, 57.37], [59.0, 60.56], [63.0, 63.85], [65.0, 65.55], [73.0, 73.6], [75.0, 75.98], [78.0, 79.14], [80.0, 84.79], [85.0, 84.82], [85.0, 85.09], [88.0, 92.1], [95.0, 98.19], [100.0, 100.5], [101.0, 102.59], [103.0, 103.49]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, true, true, false, false, false], "silence_prob": [33.77, 32.26, 0.0, 0.0, 0.0, 0.0, 0.0, 31.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.5, 0.0, 0.0, 31.5, 33.28, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 35.95], ["speech", 31.49], ["hum", 6.07]], [["speech", 36.08], ["music", 16.56], ["sidetone", 13.49]], null, null, null, null, null, [["speech", 38.36], ["livestock, farm animals, working animals", 7.93], ["cattle, bovinae", 7.66]], null, null, null, null, null, null, [["speech", 54.95], ["fart", 9.18], ["explosion", 4.73]], null, null, [["fart", 17.6], ["animal", 14.96], ["speech", 13.78]], [["fart", 38.69], ["beep, bleep", 8.36], ["busy signal", 8.35]], null, null, null], "duration": [15.4, 4.52, 0.13, 0.65, -0.07, 0.31, 1.54, 12.37, 1.56, 0.85, 0.55, 0.6, 0.98, 1.14, 4.79, -0.18, 0.09, 4.1, 3.19, 0.5, 1.59, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/uHltDaQU1uc_filtered.json b/annotations_filtered/uHltDaQU1uc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f90890f85b525721241f9fb753b2e54a4ec32a7 --- /dev/null +++ b/annotations_filtered/uHltDaQU1uc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 23.72], [25.0, 27.13], [29.0, 29.69], [34.0, 48.56], [49.0, 48.59], [51.0, 63.36], [67.0, 69.28], [71.0, 72.99], [73.0, 74.46], [86.0, 86.9], [91.0, 92.43], [94.0, 95.13], [100.0, 108.19], [112.0, 125.46], [127.0, 130.08], [131.0, 131.57], [133.0, 133.41], [134.0, 142.87], [146.0, 147.07], [150.0, 153.25], [154.0, 155.07], [157.0, 160.49], [164.0, 165.35], [166.0, 168.94]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, false, true], "silence_prob": [42.58, 51.34, 0.0, 33.52, 0.0, 38.4, 37.14, 0.0, 0.0, 0.0, 0.0, 0.0, 31.99, 33.82, 31.96, 0.0, 0.0, 29.18, 0.0, 30.39, 0.0, 37.63, 0.0, 29.41], "audiomae_on_audioset": [[["music", 67.43], ["speech", 9.19], ["electronic music", 3.6]], null, null, [["music", 39.12], ["throbbing", 35.53], ["hum", 6.77]], null, [["music", 56.4], ["didgeridoo", 6.35], ["throbbing", 5.36]], [["music", 69.07], ["throbbing", 8.53], ["hum", 2.23]], null, null, null, null, null, [["music", 82.3], ["musical instrument", 1.07], ["middle eastern music", 0.87]], [["music", 82.7], ["throbbing", 2.97], ["hum", 1.81]], [["music", 32.16], ["hum", 6.9], ["throbbing", 5.32]], null, null, [["speech", 62.41], ["music", 17.13], ["explosion", 4.18]], null, [["throbbing", 22.86], ["music", 22.62], ["scratching (performance technique)", 4.54]], null, [["music", 36.18], ["whale vocalization", 23.3], ["speech", 4.2]], null, [["theremin", 26.15], ["music", 19.59], ["synthesizer", 6.98]]], "duration": [7.72, 2.13, 0.69, 14.56, -0.41, 12.36, 2.28, 1.99, 1.46, 0.9, 1.43, 1.13, 8.19, 13.46, 3.08, 0.57, 0.41, 8.87, 1.07, 3.25, 1.07, 3.49, 1.35, 2.94]} \ No newline at end of file diff --git a/annotations_filtered/uHuDwL4XEUE_filtered.json b/annotations_filtered/uHuDwL4XEUE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e2b5f69a23579b23f9920e313384a2b062f9739 --- /dev/null +++ b/annotations_filtered/uHuDwL4XEUE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.99], [8.0, 9.15], [10.0, 10.27], [11.0, 14.35], [17.0, 17.25], [20.0, 21.44], [25.0, 26.18], [28.0, 33.91], [35.0, 38.43], [39.0, 40.54], [48.0, 52.0], [55.0, 61.57], [63.0, 68.39], [69.0, 72.05], [73.0, 77.45], [78.0, 84.15], [85.0, 86.24], [86.0, 96.01], [99.0, 111.94], [112.0, 112.02], [112.0, 112.16], [115.0, 119.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 90.25, 0.0, 0.0, 0.0, 93.91, 91.3, 0.0, 95.09, 95.09, 92.48, 98.8, 98.36, 95.23, 0.0, 80.64, 99.82, 0.0, 0.0, 99.52], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.99, 1.15, 0.27, 3.35, 0.25, 1.44, 1.18, 5.91, 3.43, 1.54, 4.0, 6.57, 5.39, 3.05, 4.45, 6.15, 1.24, 10.01, 12.94, 0.02, 0.16, 4.45]} \ No newline at end of file diff --git a/annotations_filtered/uI4fVgVVpiw_filtered.json b/annotations_filtered/uI4fVgVVpiw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc9ce84928e9f5464b962b3714dfb2acf2012385 --- /dev/null +++ b/annotations_filtered/uI4fVgVVpiw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.58], [17.0, 17.2], [44.0, 44.85]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.58, 0.2, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/uI7ijvSCHcI_filtered.json b/annotations_filtered/uI7ijvSCHcI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d52a564432690e3c08f41dbe32b253c8a124d43a --- /dev/null +++ b/annotations_filtered/uI7ijvSCHcI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.24], [6.0, 21.12], [21.0, 28.53], [29.0, 54.24], [57.0, 58.51], [73.0, 76.67], [77.0, 88.32], [90.0, 95.05], [100.0, 103.79], [107.0, 119.55], [127.0, 127.72], [145.0, 145.29], [146.0, 146.28], [152.0, 153.4], [157.0, 157.82], [158.0, 161.7], [171.0, 171.73], [172.0, 180.69]], "keep_status": [false, true, true, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.51, 31.89, 32.16, 0.0, 34.05, 32.71, 31.62, 32.38, 32.16, 0.0, 0.0, 0.0, 0.0, 0.0, 32.02, 0.0, 85.17], "audiomae_on_audioset": [null, [["hum", 27.97], ["speech", 17.9], ["throbbing", 15.65]], [["sidetone", 35.4], ["speech", 20.97], ["music", 13.56]], [["music", 23.42], ["livestock, farm animals, working animals", 13.22], ["cattle, bovinae", 8.1]], null, [["fly, housefly", 59.92], ["insect", 28.5], ["mosquito", 4.6]], [["speech", 39.39], ["music", 31.18], ["buzz", 6.12]], [["music", 25.37], ["speech", 23.28], ["hum", 7.54]], [["whale vocalization", 34.86], ["music", 25.48], ["hum", 10.61]], [["music", 50.59], ["theremin", 4.02], ["hum", 3.82]], null, null, null, null, null, [["fly, housefly", 43.5], ["insect", 21.56], ["mosquito", 20.21]], null, null], "duration": [0.24, 15.12, 7.53, 25.24, 1.51, 3.67, 11.32, 5.05, 3.79, 12.55, 0.72, 0.29, 0.28, 1.4, 0.82, 3.7, 0.73, 8.69]} \ No newline at end of file diff --git a/annotations_filtered/uIBDomdpK7Y_filtered.json b/annotations_filtered/uIBDomdpK7Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebcaac44b5e1a0125e1ada54e4b60539c9c9cbdc --- /dev/null +++ b/annotations_filtered/uIBDomdpK7Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.54], [2.0, 2.27], [4.0, 5.16], [13.0, 14.2], [16.0, 17.73], [20.0, 21.0], [22.0, 24.65], [26.0, 27.13], [28.0, 28.41], [29.0, 30.35], [31.0, 32.66], [34.0, 34.59], [38.0, 39.33], [42.0, 42.42], [47.0, 47.24], [54.0, 55.0], [56.0, 57.4], [60.0, 59.76], [63.0, 67.69], [70.0, 71.34], [73.0, 76.28], [79.0, 80.35], [82.0, 81.92], [83.0, 85.14], [86.0, 87.25], [89.0, 89.11], [90.0, 90.53], [96.0, 97.38], [99.0, 104.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 48.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 56.62], ["music", 9.88], ["fart", 7.61]]], "duration": [-0.46, 0.27, 1.16, 1.2, 1.73, 1.0, 2.65, 1.13, 0.41, 1.35, 1.66, 0.59, 1.33, 0.42, 0.24, 1.0, 1.4, -0.24, 4.69, 1.34, 3.28, 1.35, -0.08, 2.14, 1.25, 0.11, 0.53, 1.38, 5.45]} \ No newline at end of file diff --git a/annotations_filtered/uIUCcORbMvg_filtered.json b/annotations_filtered/uIUCcORbMvg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc06d4c5e6ca507962fd4e690862a77b5001da98 --- /dev/null +++ b/annotations_filtered/uIUCcORbMvg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 36.51], [38.0, 46.26], [49.0, 50.06], [56.0, 56.08], [59.0, 61.91], [63.0, 63.49], [66.0, 65.94], [66.0, 80.32], [82.0, 82.73], [85.0, 89.7], [93.0, 96.77], [104.0, 104.43]], "keep_status": [true, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [31.32, 31.83, 0.0, 0.0, 32.49, 0.0, 0.0, 30.74, 0.0, 30.2, 37.22, 0.0], "audiomae_on_audioset": [[["music", 40.37], ["speech", 13.5], ["groan", 7.98]], [["music", 36.88], ["speech", 21.25], ["moo", 3.97]], null, null, [["speech", 81.71], ["boing", 1.88], ["chop", 1.2]], null, null, [["speech", 69.06], ["whack, thwack", 4.65], ["fart", 2.25]], null, [["speech", 24.23], ["music", 13.18], ["thunk", 8.21]], [["music", 68.49], ["didgeridoo", 9.33], ["musical instrument", 3.7]], null], "duration": [23.51, 8.26, 1.06, 0.08, 2.91, 0.49, -0.06, 14.32, 0.73, 4.7, 3.77, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/uIl9IFcIXlg_filtered.json b/annotations_filtered/uIl9IFcIXlg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9541c817c8bbf807b34e60e46d9637a9e9ff7a6 --- /dev/null +++ b/annotations_filtered/uIl9IFcIXlg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[80.0, 109.73]], "keep_status": [true], "silence_prob": [35.77], "audiomae_on_audioset": [[["music", 30.18], ["livestock, farm animals, working animals", 17.27], ["cattle, bovinae", 12.02]]], "duration": [29.73]} \ No newline at end of file diff --git a/annotations_filtered/uIsdG0ydS5o_filtered.json b/annotations_filtered/uIsdG0ydS5o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b219e8be4484805a2f5aeb9717a159d29d893bb6 --- /dev/null +++ b/annotations_filtered/uIsdG0ydS5o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.42], [8.0, 11.37], [15.0, 16.04], [16.0, 16.07], [16.0, 24.44], [24.0, 27.41], [29.0, 29.93], [50.0, 51.21], [56.0, 58.02], [59.0, 60.98], [71.0, 72.45], [84.0, 84.38], [85.0, 86.05], [96.0, 104.08], [106.0, 108.01], [110.0, 116.02], [120.0, 120.02], [120.0, 120.14], [120.0, 120.65], [125.0, 125.49], [127.0, 127.75], [129.0, 135.55], [142.0, 142.37], [143.0, 145.27], [147.0, 150.99], [154.0, 161.62], [166.0, 166.5], [172.0, 180.15], [182.0, 190.27], [195.0, 196.11], [201.0, 207.17], [210.0, 219.94], [221.0, 221.49], [222.0, 223.91], [225.0, 228.48]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, true, false, true, true, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 38.67, 0.0, 0.0, 29.41, 28.97, 0.0, 0.0, 30.62, 0.0, 0.0, 0.0, 0.0, 34.17, 35.18, 32.1, 0.0, 0.0, 0.0, 0.0, 0.0, 29.96, 0.0, 29.51, 30.8, 29.91, 0.0, 29.97, 30.1, 0.0, 29.89, 36.58, 0.0, 0.0, 28.91], "audiomae_on_audioset": [null, [["music", 59.29], ["throbbing", 7.93], ["hum", 6.35]], null, null, [["music", 53.93], ["throbbing", 18.77], ["hum", 7.8]], [["music", 26.96], ["hum", 12.84], ["animal", 6.44]], null, null, [["speech", 65.53], ["radio", 2.85], ["static", 2.18]], null, null, null, null, [["speech", 36.51], ["music", 17.4], ["hum", 6.58]], [["hum", 33.84], ["throbbing", 26.47], ["music", 16.72]], [["music", 27.73], ["speech", 17.17], ["animal", 11.34]], null, null, null, null, null, [["music", 38.93], ["speech", 23.47], ["throbbing", 6.75]], null, [["speech", 25.35], ["music", 12.09], ["sound effect", 6.41]], [["skateboard", 19.44], ["speech", 12.78], ["whip", 11.5]], [["music", 30.97], ["boing", 28.99], ["speech", 12.75]], null, [["speech", 49.11], ["music", 24.22], ["groan", 3.49]], [["speech", 41.23], ["music", 28.92], ["whack, thwack", 6.64]], null, [["music", 42.11], ["throbbing", 13.88], ["hum", 13.35]], [["music", 49.03], ["speech", 19.18], ["theremin", 9.22]], null, null, [["music", 18.86], ["whack, thwack", 13.89], ["whip", 13.59]]], "duration": [0.42, 3.37, 1.04, 0.07, 8.44, 3.41, 0.93, 1.21, 2.02, 1.98, 1.45, 0.38, 1.05, 8.08, 2.01, 6.02, 0.02, 0.14, 0.65, 0.49, 0.75, 6.55, 0.37, 2.27, 3.99, 7.62, 0.5, 8.15, 8.27, 1.11, 6.17, 9.94, 0.49, 1.91, 3.48]} \ No newline at end of file diff --git a/annotations_filtered/uJMPom6-xmA_filtered.json b/annotations_filtered/uJMPom6-xmA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c6d64cd6bd05d054e0644e4e2574a23f7d149f7 --- /dev/null +++ b/annotations_filtered/uJMPom6-xmA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.43], [4.0, 4.04], [22.0, 24.98], [27.0, 27.35], [28.0, 29.91], [33.0, 33.88], [36.0, 38.18], [42.0, 42.47], [54.0, 54.62], [59.0, 59.83], [61.0, 68.3], [71.0, 73.63], [83.0, 83.56], [86.0, 86.8], [90.0, 91.13], [92.0, 96.18], [118.0, 118.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.42, 0.0, 0.0, 0.0, 80.29, 0.0, 0.0, 0.0, 52.45, 42.74, 0.0, 0.0, 0.0, 97.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 49.68], ["music", 19.95], ["hum", 1.89]], null, null, null, null, null, null, null, null, [["music", 36.14], ["throbbing", 9.36], ["hum", 7.97]], null, null, null, null, null], "duration": [0.43, 0.04, 2.98, 0.35, 1.91, 0.88, 2.18, 0.47, 0.62, 0.83, 7.3, 2.63, 0.56, 0.8, 1.13, 4.18, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/uJNHr8QQVJQ_filtered.json b/annotations_filtered/uJNHr8QQVJQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d704afe40f2c11481418cb5173f643d4872ee896 --- /dev/null +++ b/annotations_filtered/uJNHr8QQVJQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 23.25], [29.0, 29.61], [34.0, 34.52], [39.0, 38.91], [40.0, 40.59], [41.0, 42.33], [44.0, 44.19], [47.0, 47.76], [49.0, 51.49], [61.0, 61.5], [67.0, 67.24], [79.0, 79.12], [86.0, 86.29], [88.0, 122.45], [125.0, 125.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [52.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [15.25, 0.61, 0.52, -0.09, 0.59, 1.33, 0.19, 0.76, 2.49, 0.5, 0.24, 0.12, 0.29, 34.45, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/uJPI1qu9bE4_filtered.json b/annotations_filtered/uJPI1qu9bE4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab8814a73c307a06e213fc8c4ddfe23e31f04d4c --- /dev/null +++ b/annotations_filtered/uJPI1qu9bE4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.55], [5.0, 6.47], [10.0, 12.12], [13.0, 13.76], [16.0, 16.28], [19.0, 19.31], [20.0, 20.39], [26.0, 28.68], [32.0, 33.84], [35.0, 36.88], [39.0, 43.34], [46.0, 47.26], [49.0, 52.68], [54.0, 57.64], [58.0, 59.31], [60.0, 62.56], [63.0, 65.75], [67.0, 67.41], [71.0, 77.43], [78.0, 80.2], [83.0, 84.05], [86.0, 87.66], [89.0, 91.56], [96.0, 97.09], [98.0, 100.52], [102.0, 104.94], [106.0, 106.69], [107.0, 122.42], [125.0, 130.5]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.04, 0.0, 0.0, 0.0, 0.0, 38.5, 0.0, 0.0, 59.33, 0.0, 45.69, 64.41, 0.0, 79.76, 38.66, 0.0, 57.25, 88.83, 0.0, 0.0, 37.95, 0.0, 89.01, 97.64, 0.0, 94.37, 70.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["bouncing", 19.88], ["basketball bounce", 18.84], ["music", 6.79]], null, null, null, null, [["hum", 42.95], ["mains hum", 18.57], ["throbbing", 9.6]], null, null, null, [["hum", 35.5], ["mains hum", 26.61], ["whale vocalization", 16.59]], null, null, null, null, null, [["speech", 18.66], ["hum", 14.69], ["mains hum", 8.1]], null, null, null, null, null, null], "duration": [1.55, 1.47, 2.12, 0.76, 0.28, 0.31, 0.39, 2.68, 1.84, 1.88, 4.34, 1.26, 3.68, 3.64, 1.31, 2.56, 2.75, 0.41, 6.43, 2.2, 1.05, 1.66, 2.56, 1.09, 2.52, 2.94, 0.69, 15.42, 5.5]} \ No newline at end of file diff --git a/annotations_filtered/uJlhwWFAAxI_filtered.json b/annotations_filtered/uJlhwWFAAxI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/uJlhwWFAAxI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/uJnIaD7gDlQ_filtered.json b/annotations_filtered/uJnIaD7gDlQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/uJnIaD7gDlQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/uKZQEDh_KAA_filtered.json b/annotations_filtered/uKZQEDh_KAA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9ee1b28b7b21bb39e10bdae0925b0528841cc4c --- /dev/null +++ b/annotations_filtered/uKZQEDh_KAA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.34], [21.0, 48.15], [52.0, 54.14], [60.0, 62.33], [66.0, 67.04], [70.0, 71.27], [78.0, 78.21], [83.0, 84.1], [100.0, 101.17], [110.0, 110.54], [112.0, 112.78], [116.0, 116.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 52.39, 84.07, 56.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.34, 27.15, 2.14, 2.33, 1.04, 1.27, 0.21, 1.1, 1.17, 0.54, 0.78, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/uKwwpmC02IQ_filtered.json b/annotations_filtered/uKwwpmC02IQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a5c87c63f49fff479f3d3590cae5600a4dfcc30 --- /dev/null +++ b/annotations_filtered/uKwwpmC02IQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.22], [21.0, 21.47], [24.0, 24.95], [30.0, 31.58], [45.0, 45.22], [57.0, 58.63], [64.0, 65.31], [71.0, 72.0], [83.0, 84.91], [91.0, 91.44], [111.0, 113.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 49.06], ["synthesizer", 4.58], ["musical instrument", 3.79]]], "duration": [0.22, 0.47, 0.95, 1.58, 0.22, 1.63, 1.31, 1.0, 1.91, 0.44, 2.29]} \ No newline at end of file diff --git a/annotations_filtered/uL2gxb-TcLM_filtered.json b/annotations_filtered/uL2gxb-TcLM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..276612cae33b04160237052589a8cae7f484d500 --- /dev/null +++ b/annotations_filtered/uL2gxb-TcLM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.54], [2.0, 3.55], [5.0, 4.82], [7.0, 26.64], [33.0, 33.49], [41.0, 45.23], [59.0, 58.62], [61.0, 61.25], [64.0, 68.69], [72.0, 72.67], [82.0, 86.05], [88.0, 90.22], [92.0, 92.97], [94.0, 97.11], [99.0, 98.79], [99.0, 100.01], [106.0, 106.51], [109.0, 111.6], [113.0, 113.21], [116.0, 116.92], [118.0, 118.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 48.35, 0.0, 90.43, 0.0, 0.0, 97.64, 0.0, 48.52, 77.53, 0.0, 51.88, 0.0, 0.0, 0.0, 57.89, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 73.12], ["electronic music", 4.75], ["techno", 2.43]], null, null, null, null, null, null, [["fireworks", 20.14], ["speech", 17.02], ["firecracker", 5.29]], null, null, null, null, null, null, null, null, null, null], "duration": [0.54, 1.55, -0.18, 19.64, 0.49, 4.23, -0.38, 0.25, 4.69, 0.67, 4.05, 2.22, 0.97, 3.11, -0.21, 1.01, 0.51, 2.6, 0.21, 0.92, 0.99]} \ No newline at end of file diff --git a/annotations_filtered/uLYYXvBlUgQ_filtered.json b/annotations_filtered/uLYYXvBlUgQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b80c1a142e4071a66062c931ad51143f8b5e65b7 --- /dev/null +++ b/annotations_filtered/uLYYXvBlUgQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.43], [20.0, 20.87], [23.0, 23.85], [29.0, 29.0], [40.0, 47.58], [50.0, 52.02], [54.0, 55.98], [57.0, 59.27], [62.0, 62.78], [66.0, 69.5], [70.0, 71.86], [75.0, 75.86], [76.0, 81.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.94, 95.51, 0.0, 97.11, 0.0, 99.31, 0.0, 0.0, 84.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.43, 0.87, 0.85, 0.0, 7.58, 2.02, 1.98, 2.27, 0.78, 3.5, 1.86, 0.86, 5.46]} \ No newline at end of file diff --git a/annotations_filtered/uLhrOeavvOY_filtered.json b/annotations_filtered/uLhrOeavvOY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db325f29442a9d33ee3d6c634baa42103e30df34 --- /dev/null +++ b/annotations_filtered/uLhrOeavvOY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 26.47], [31.0, 31.56], [32.0, 90.44], [91.0, 91.77], [92.0, 91.84], [92.0, 92.11], [93.0, 94.9], [98.0, 113.68], [115.0, 119.77], [121.0, 123.96], [125.0, 148.74]], "keep_status": [false, false, false, false, false, false, false, true, true, true, true], "silence_prob": [41.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.21, 47.82, 48.52, 42.98], "audiomae_on_audioset": [[["speech", 45.92], ["music", 24.28], ["musical instrument", 3.4]], null, null, null, null, null, null, [["speech", 23.55], ["music", 20.59], ["breaking", 5.37]], [["music", 37.7], ["splinter", 13.58], ["crushing", 8.54]], [["music", 22.83], ["singing bowl", 15.0], ["gong", 6.86]], [["music", 31.93], ["singing bowl", 16.2], ["ambient music", 10.88]]], "duration": [7.47, 0.56, 58.44, 0.77, -0.16, 0.11, 1.9, 15.68, 4.77, 2.96, 23.74]} \ No newline at end of file diff --git a/annotations_filtered/uLquz4Iz-30_filtered.json b/annotations_filtered/uLquz4Iz-30_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f30c84fd903478c17e736c253dfe2305d16e1eb --- /dev/null +++ b/annotations_filtered/uLquz4Iz-30_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 43.46], [50.0, 51.7], [55.0, 62.36], [64.0, 72.15], [75.0, 91.39], [92.0, 91.93], [93.0, 93.09], [94.0, 96.25], [98.0, 109.86], [113.0, 132.31], [141.0, 140.85], [147.0, 148.32]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 36.67, 35.42, 35.86, 0.0, 0.0, 32.23, 33.31, 35.2, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 67.3], ["hum", 7.76], ["mains hum", 6.07]], [["speech", 41.75], ["music", 34.48], ["sidetone", 5.56]], [["music", 60.71], ["whack, thwack", 6.54], ["fart", 2.77]], null, null, [["music", 50.08], ["speech", 17.16], ["sidetone", 4.63]], [["speech", 20.35], ["fly, housefly", 20.04], ["music", 14.9]], [["noise", 23.98], ["frog", 9.84], ["fart", 8.77]], null, null], "duration": [31.46, 1.7, 7.36, 8.15, 16.39, -0.07, 0.09, 2.25, 11.86, 19.31, -0.15, 1.32]} \ No newline at end of file diff --git a/annotations_filtered/uLt7lXDCHQ0_filtered.json b/annotations_filtered/uLt7lXDCHQ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9fbe899663e706a2122a4ae014ba4de318711a37 --- /dev/null +++ b/annotations_filtered/uLt7lXDCHQ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[175.0, 175.31]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.31]} \ No newline at end of file diff --git a/annotations_filtered/uLtUl4pDmOs_filtered.json b/annotations_filtered/uLtUl4pDmOs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..121137365a46f0233d7e4129e01544d574a53889 --- /dev/null +++ b/annotations_filtered/uLtUl4pDmOs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.68], [5.0, 5.68], [10.0, 10.27], [10.0, 10.3], [10.0, 10.34], [10.0, 10.37], [10.0, 13.59], [18.0, 18.72], [24.0, 25.52], [26.0, 31.04], [31.0, 33.27], [42.0, 43.33], [46.0, 49.28], [50.0, 49.94], [50.0, 53.79], [58.0, 59.56], [60.0, 78.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 95.51, 42.11, 0.0, 95.64, 0.0, 49.87, 0.0, 35.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 23.48], ["grunt", 14.54], ["fart", 7.76]], null, null, null, [["roaring cats (lions, tigers)", 16.38], ["wild animals", 14.34], ["speech", 13.99]], null, [["animal", 60.74], ["roaring cats (lions, tigers)", 14.42], ["speech", 11.41]]], "duration": [0.68, 0.68, 0.27, 0.3, 0.34, 0.37, 3.59, 0.72, 1.52, 5.04, 2.27, 1.33, 3.28, -0.06, 3.79, 1.56, 18.9]} \ No newline at end of file diff --git a/annotations_filtered/uMH_Ajdp3E0_filtered.json b/annotations_filtered/uMH_Ajdp3E0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f7f1b00c3fecdc6f31ba49ab399a6e92771be89 --- /dev/null +++ b/annotations_filtered/uMH_Ajdp3E0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.02], [1.0, 7.01], [9.0, 10.81], [15.0, 16.23], [26.0, 27.97], [29.0, 29.42], [31.0, 33.44], [37.0, 38.79], [40.0, 42.6], [46.0, 47.21], [48.0, 48.09], [54.0, 56.27]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 47.74, 0.0, 0.0, 0.0, 0.0, 52.22, 0.0, 40.64, 0.0, 0.0, 37.02], "audiomae_on_audioset": [null, [["fly, housefly", 28.63], ["insect", 14.52], ["hum", 13.13]], null, null, null, null, null, null, [["hum", 14.96], ["hoot", 12.81], ["sidetone", 10.45]], null, null, [["hum", 41.26], ["mains hum", 34.5], ["throbbing", 3.25]]], "duration": [0.02, 6.01, 1.81, 1.23, 1.97, 0.42, 2.44, 1.79, 2.6, 1.21, 0.09, 2.27]} \ No newline at end of file diff --git a/annotations_filtered/uMb3tldMyn0_filtered.json b/annotations_filtered/uMb3tldMyn0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b08f50b9382e8071ab06f019314b1960a7b743e --- /dev/null +++ b/annotations_filtered/uMb3tldMyn0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.64], [12.0, 21.24], [26.0, 26.23], [26.0, 31.08], [36.0, 91.56], [98.0, 100.67], [102.0, 103.42], [107.0, 107.37], [109.0, 110.13], [111.0, 111.7], [115.0, 116.38], [118.0, 118.91], [120.0, 122.39], [123.0, 132.07], [133.0, 135.36], [137.0, 137.0], [139.0, 141.22], [146.0, 148.0], [149.0, 151.39], [153.0, 156.86], [157.0, 159.0], [159.0, 163.11]], "keep_status": [false, true, false, true, false, true, false, false, false, false, false, false, true, true, true, false, true, true, true, true, true, true], "silence_prob": [0.0, 33.54, 0.0, 30.65, 0.0, 32.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.26, 42.91, 42.96, 0.0, 45.33, 44.9, 45.24, 41.76, 39.27, 39.33], "audiomae_on_audioset": [null, [["music", 31.02], ["speech", 23.56], ["throbbing", 9.36]], null, [["music", 21.48], ["mains hum", 20.1], ["speech", 19.39]], null, [["sheep", 30.81], ["bleat", 16.0], ["whale vocalization", 8.13]], null, null, null, null, null, null, [["speech", 30.38], ["hum", 10.81], ["whale vocalization", 10.09]], [["speech", 45.65], ["animal", 6.31], ["howl", 5.99]], [["speech", 27.14], ["hum", 23.23], ["mains hum", 9.96]], null, [["speech", 25.91], ["music", 6.03], ["whale vocalization", 3.62]], [["speech", 17.55], ["hum", 4.25], ["rumble", 3.06]], [["hum", 25.25], ["whale vocalization", 8.42], ["throbbing", 7.29]], [["speech", 54.81], ["hum", 9.43], ["whale vocalization", 5.32]], [["speech", 30.55], ["music", 13.95], ["civil defense siren", 9.5]], [["whale vocalization", 34.43], ["siren", 9.25], ["hum", 7.57]]], "duration": [0.64, 9.24, 0.23, 5.08, 55.56, 2.67, 1.42, 0.37, 1.13, 0.7, 1.38, 0.91, 2.39, 9.07, 2.36, 0.0, 2.22, 2.0, 2.39, 3.86, 2.0, 4.11]} \ No newline at end of file diff --git a/annotations_filtered/uMug9lL1Sgg_filtered.json b/annotations_filtered/uMug9lL1Sgg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec90a32362d32bc4af25765264057578b679a421 --- /dev/null +++ b/annotations_filtered/uMug9lL1Sgg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.39], [25.0, 29.34], [33.0, 32.75], [40.0, 40.81], [41.0, 42.23], [52.0, 52.91], [59.0, 61.97], [65.0, 71.19], [72.0, 75.34]], "keep_status": [false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.89, 0.0, 0.0, 0.0, 0.0, 99.95, 99.78, 87.92], "audiomae_on_audioset": [null, [["speech", 27.6], ["animal", 16.75], ["boing", 5.4]], null, null, null, null, null, null, null], "duration": [1.39, 4.34, -0.25, 0.81, 1.23, 0.91, 2.97, 6.19, 3.34]} \ No newline at end of file diff --git a/annotations_filtered/uNE1lEBsBmM_filtered.json b/annotations_filtered/uNE1lEBsBmM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0bed76393cff930d83fac51a3db8803f0279aaf1 --- /dev/null +++ b/annotations_filtered/uNE1lEBsBmM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.92], [3.0, 3.86], [4.0, 5.24], [5.0, 11.96], [13.0, 13.78], [14.0, 16.95]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 67.13, 0.0, 61.57], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [-0.08, 0.86, 1.24, 6.96, 0.78, 2.95]} \ No newline at end of file diff --git a/annotations_filtered/uNPU0cPPsmA_filtered.json b/annotations_filtered/uNPU0cPPsmA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba196a1749b3e6ab7d883c1d2edfb5495789d00a --- /dev/null +++ b/annotations_filtered/uNPU0cPPsmA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.5], [10.0, 9.93], [10.0, 10.91], [19.0, 19.6], [26.0, 28.0], [32.0, 33.2], [35.0, 34.89], [38.0, 39.39], [45.0, 47.09]], "keep_status": [false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.54, 0.0, 0.0, 0.0, 35.3], "audiomae_on_audioset": [null, null, null, null, [["music", 61.53], ["didgeridoo", 10.4], ["musical instrument", 3.67]], null, null, null, [["music", 31.93], ["speech", 24.09], ["sidetone", 4.0]]], "duration": [0.5, -0.07, 0.91, 0.6, 2.0, 1.2, -0.11, 1.39, 2.09]} \ No newline at end of file diff --git a/annotations_filtered/uNcKTuAqLag_filtered.json b/annotations_filtered/uNcKTuAqLag_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6fdb4186a16a7dd557703758d5b643a5d43c41f --- /dev/null +++ b/annotations_filtered/uNcKTuAqLag_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.48], [8.0, 8.45], [10.0, 11.55], [13.0, 13.9], [17.0, 18.01], [23.0, 25.81], [27.0, 27.62], [29.0, 29.79], [35.0, 37.67], [39.0, 39.38], [40.0, 46.87], [51.0, 52.71], [57.0, 58.43], [61.0, 61.86], [64.0, 64.72], [66.0, 68.32], [73.0, 74.22], [80.0, 81.58], [82.0, 83.74], [87.0, 87.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [90.6, 0.0, 0.0, 0.0, 0.0, 77.7, 0.0, 0.0, 56.4, 0.0, 81.35, 0.0, 0.0, 0.0, 0.0, 55.25, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.48, 0.45, 1.55, 0.9, 1.01, 2.81, 0.62, 0.79, 2.67, 0.38, 6.87, 1.71, 1.43, 0.86, 0.72, 2.32, 1.22, 1.58, 1.74, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/uNjrnjiEEY8_filtered.json b/annotations_filtered/uNjrnjiEEY8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1a29cbff34568141c094ff69ee6cf679892aaa3 --- /dev/null +++ b/annotations_filtered/uNjrnjiEEY8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.19], [13.0, 13.39], [14.0, 15.3], [17.0, 19.04], [21.0, 22.54], [33.0, 32.53], [34.0, 36.63], [41.0, 43.6], [49.0, 48.9], [55.0, 55.71], [56.0, 56.76], [57.0, 56.84], [57.0, 60.76], [64.0, 64.3], [70.0, 74.68], [77.0, 78.97], [87.0, 91.62], [110.0, 110.52], [113.0, 113.39], [116.0, 118.18], [119.0, 119.03], [120.0, 121.26], [123.0, 123.85], [126.0, 126.4], [128.0, 130.2], [135.0, 137.39], [139.0, 140.66], [141.0, 141.86], [144.0, 149.86], [151.0, 151.71], [153.0, 155.36]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 38.46, 0.0, 0.0, 31.46, 33.4, 0.0, 0.0, 0.0, 0.0, 36.02, 0.0, 36.67, 0.0, 97.0, 0.0, 0.0, 69.2, 0.0, 0.0, 0.0, 0.0, 95.37, 94.52, 0.0, 0.0, 64.18, 0.0, 58.64], "audiomae_on_audioset": [null, null, null, [["music", 65.85], ["fart", 7.93], ["mosquito", 1.61]], null, null, [["music", 33.15], ["groan", 13.83], ["bleat", 10.15]], [["boing", 25.48], ["music", 19.1], ["mosquito", 7.66]], null, null, null, null, [["music", 40.99], ["boing", 18.14], ["salsa music", 4.53]], null, [["music", 36.88], ["speech", 11.25], ["boing", 7.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.19, 0.39, 1.3, 2.04, 1.54, -0.47, 2.63, 2.6, -0.1, 0.71, 0.76, -0.16, 3.76, 0.3, 4.68, 1.97, 4.62, 0.52, 0.39, 2.18, 0.03, 1.26, 0.85, 0.4, 2.2, 2.39, 1.66, 0.86, 5.86, 0.71, 2.36]} \ No newline at end of file diff --git a/annotations_filtered/uNsFppO-q3g_filtered.json b/annotations_filtered/uNsFppO-q3g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02056f27360660a09f166dc6699251ba1e00968f --- /dev/null +++ b/annotations_filtered/uNsFppO-q3g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.14], [6.0, 7.91], [8.0, 11.69], [13.0, 13.68], [19.0, 21.9], [22.0, 31.55], [32.0, 36.68], [38.0, 48.69], [50.0, 51.73], [53.0, 61.1], [62.0, 62.19], [62.0, 62.45], [62.0, 62.5], [67.0, 69.96], [72.0, 73.57], [75.0, 78.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [62.78, 0.0, 95.37, 0.0, 78.55, 66.76, 73.97, 75.39, 0.0, 78.72, 0.0, 0.0, 0.0, 49.22, 0.0, 30.33], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["gong", 23.39], ["music", 17.68], ["hum", 6.92]], null, [["music", 60.83], ["didgeridoo", 7.19], ["guitar", 6.6]]], "duration": [2.14, 1.91, 3.69, 0.68, 2.9, 9.55, 4.68, 10.69, 1.73, 8.1, 0.19, 0.45, 0.5, 2.96, 1.57, 3.27]} \ No newline at end of file diff --git a/annotations_filtered/uOHMPcGgInI_filtered.json b/annotations_filtered/uOHMPcGgInI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..038f0d3a7abd5669d92ec4d90b018d2d9deb741e --- /dev/null +++ b/annotations_filtered/uOHMPcGgInI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 23.06], [32.0, 33.34], [33.0, 58.72], [61.0, 77.21], [80.0, 86.66], [88.0, 121.81], [123.0, 123.36], [125.0, 130.05], [131.0, 131.92], [134.0, 135.3], [136.0, 141.12], [144.0, 144.83], [146.0, 155.16], [156.0, 157.47], [158.0, 167.75], [168.0, 177.35]], "keep_status": [true, false, false, true, false, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [29.33, 0.0, 28.62, 28.74, 30.36, 0.0, 0.0, 30.66, 0.0, 0.0, 29.2, 0.0, 30.15, 0.0, 28.86, 29.57], "audiomae_on_audioset": [[["music", 22.56], ["throbbing", 20.9], ["hum", 12.86]], null, [["music", 56.77], ["speech", 20.53], ["buzz", 7.5]], [["music", 32.45], ["speech", 25.13], ["buzz", 4.39]], [["fly, housefly", 66.01], ["insect", 13.67], ["bee, wasp, etc.", 4.21]], null, null, [["speech", 25.51], ["fly, housefly", 16.78], ["insect", 8.94]], null, null, [["music", 10.17], ["insect", 9.41], ["fly, housefly", 8.89]], null, [["music", 50.09], ["speech", 29.74], ["mains hum", 3.46]], null, [["music", 66.96], ["mains hum", 10.27], ["hum", 3.99]], [["speech", 69.78], ["music", 9.77], ["outside, rural or natural", 1.5]]], "duration": [13.06, 1.34, 25.72, 16.21, 6.66, 33.81, 0.36, 5.05, 0.92, 1.3, 5.12, 0.83, 9.16, 1.47, 9.75, 9.35]} \ No newline at end of file diff --git a/annotations_filtered/uONmjd_RGk4_filtered.json b/annotations_filtered/uONmjd_RGk4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abb0a24df820bf6252a5dbcaaf9b5c1ad454a962 --- /dev/null +++ b/annotations_filtered/uONmjd_RGk4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.9], [6.0, 6.17], [11.0, 11.25], [12.0, 12.68], [13.0, 13.49], [18.0, 23.99], [25.0, 25.66], [29.0, 28.93], [30.0, 30.33], [39.0, 38.89], [41.0, 41.2], [44.0, 43.68], [73.0, 73.26], [80.0, 81.89], [100.0, 111.47], [115.0, 123.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 36.28], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["thunk", 29.33], ["thump, thud", 17.5], ["whack, thwack", 11.68]]], "duration": [0.9, 0.17, 0.25, 0.68, 0.49, 5.99, 0.66, -0.07, 0.33, -0.11, 0.2, -0.32, 0.26, 1.89, 11.47, 8.69]} \ No newline at end of file diff --git a/annotations_filtered/uOmPHEVoSa4_filtered.json b/annotations_filtered/uOmPHEVoSa4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d32a763e776ecc28a20921774247fdb275b908a --- /dev/null +++ b/annotations_filtered/uOmPHEVoSa4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.08], [5.0, 5.26], [6.0, 7.48], [8.0, 11.87], [14.0, 15.2], [18.0, 20.22], [22.0, 23.48], [24.0, 25.69], [29.0, 31.36], [33.0, 41.17], [46.0, 46.85], [48.0, 48.47], [50.0, 50.9], [51.0, 51.75], [55.0, 55.39], [56.0, 55.97], [58.0, 58.9], [60.0, 61.32], [64.0, 66.01], [67.0, 69.33], [70.0, 71.76], [83.0, 82.66], [86.0, 86.49], [88.0, 89.19], [92.0, 93.28], [95.0, 95.98], [104.0, 105.44], [106.0, 107.65], [109.0, 110.61], [114.0, 116.02], [117.0, 118.74], [120.0, 120.78], [122.0, 123.11], [123.0, 124.33], [127.0, 127.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 97.0, 0.0, 93.76, 0.0, 0.0, 94.52, 97.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.44, 99.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.31, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.08, 0.26, 1.48, 3.87, 1.2, 2.22, 1.48, 1.69, 2.36, 8.17, 0.85, 0.47, 0.9, 0.75, 0.39, -0.03, 0.9, 1.32, 2.01, 2.33, 1.76, -0.34, 0.49, 1.19, 1.28, 0.98, 1.44, 1.65, 1.61, 2.02, 1.74, 0.78, 1.11, 1.33, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/uOmtVFQ3WF8_filtered.json b/annotations_filtered/uOmtVFQ3WF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9976d8c7da0ecc9c66b0853d6390b43bdaa5f5c6 --- /dev/null +++ b/annotations_filtered/uOmtVFQ3WF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 10.62], [15.0, 15.7], [17.0, 18.35], [21.0, 21.2], [23.0, 24.87], [27.0, 32.46], [36.0, 39.87], [41.0, 42.25], [44.0, 44.78], [47.0, 48.96], [52.0, 53.32], [54.0, 54.48], [55.0, 55.75], [58.0, 58.99], [69.0, 69.35], [70.0, 71.81], [73.0, 74.33], [75.0, 75.79], [77.0, 86.63], [90.0, 90.73], [92.0, 95.13], [97.0, 101.33], [102.0, 102.47], [107.0, 107.15], [107.0, 108.06], [109.0, 110.05], [111.0, 112.31], [113.0, 113.98], [122.0, 124.36], [129.0, 129.56], [132.0, 133.51], [135.0, 138.08], [139.0, 139.29], [142.0, 141.94], [142.0, 141.99], [142.0, 144.49], [146.0, 146.67], [151.0, 152.2], [153.0, 152.96], [154.0, 154.45], [159.0, 159.22], [161.0, 162.46], [163.0, 163.41], [164.0, 164.62], [165.0, 165.32], [166.0, 166.78], [175.0, 177.08], [178.0, 186.17], [187.0, 186.97], [189.0, 190.02], [192.0, 193.14], [194.0, 195.4], [197.0, 198.59], [202.0, 203.25], [207.0, 209.02], [212.0, 213.06], [213.0, 214.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [34.41, 0.0, 0.0, 0.0, 0.0, 51.39, 63.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.13, 0.0, 77.53, 55.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.53, 0.0, 0.0, 41.54, 0.0, 0.0, 0.0, 44.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.9, 34.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.39, 0.0, 0.0], "audiomae_on_audioset": [[["music", 67.97], ["synthesizer", 3.31], ["didgeridoo", 2.92]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 56.11], ["cattle, bovinae", 29.42], ["moo", 11.11]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 38.86], ["carnatic music", 17.91], ["speech", 9.3]], null, null, null, [["music", 48.95], ["didgeridoo", 8.94], ["sidetone", 7.42]], null, null, null, null, null, null, null, null, null, null, [["sidetone", 37.5], ["music", 37.41], ["didgeridoo", 7.07]], [["music", 30.11], ["didgeridoo", 17.5], ["speech", 12.52]], null, null, null, null, null, null, [["whale vocalization", 74.37], ["music", 7.0], ["gurgling", 1.62]], null, null], "duration": [8.62, 0.7, 1.35, 0.2, 1.87, 5.46, 3.87, 1.25, 0.78, 1.96, 1.32, 0.48, 0.75, 0.99, 0.35, 1.81, 1.33, 0.79, 9.63, 0.73, 3.13, 4.33, 0.47, 0.15, 1.06, 1.05, 1.31, 0.98, 2.36, 0.56, 1.51, 3.08, 0.29, -0.06, -0.01, 2.49, 0.67, 1.2, -0.04, 0.45, 0.22, 1.46, 0.41, 0.62, 0.32, 0.78, 2.08, 8.17, -0.03, 1.02, 1.14, 1.4, 1.59, 1.25, 2.02, 1.06, 1.37]} \ No newline at end of file diff --git a/annotations_filtered/uOnIqWuSCIk_filtered.json b/annotations_filtered/uOnIqWuSCIk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e94db07517ceb7777bf4c8cbbf4cca35afa81d2 --- /dev/null +++ b/annotations_filtered/uOnIqWuSCIk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.93], [5.0, 5.44], [7.0, 7.69], [27.0, 28.63], [32.0, 37.67], [55.0, 55.0], [64.0, 79.08], [81.0, 89.28], [89.0, 89.31]], "keep_status": [false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 44.69, 0.0, 30.82, 34.78, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 33.87], ["guitar", 18.31], ["musical instrument", 17.14]], null, [["carnatic music", 44.35], ["music", 33.36], ["speech", 2.42]], [["speech", 67.88], ["insect", 9.56], ["fly, housefly", 6.06]], null], "duration": [0.93, 0.44, 0.69, 1.63, 5.67, 0.0, 15.08, 8.28, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/uPAXLQIxBGY_filtered.json b/annotations_filtered/uPAXLQIxBGY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a0c2c2aa013b5eab1e5ad5cd1116c8c73592c5b --- /dev/null +++ b/annotations_filtered/uPAXLQIxBGY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.3], [8.0, 10.54], [14.0, 16.31], [19.0, 24.73], [26.0, 27.55], [29.0, 36.49], [46.0, 52.02], [53.0, 54.21], [56.0, 56.44], [59.0, 62.53], [66.0, 67.69], [70.0, 71.63], [73.0, 75.24], [77.0, 77.08], [78.0, 78.22], [79.0, 80.82], [84.0, 86.12], [95.0, 94.98]], "keep_status": [false, true, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.07, 30.58, 31.06, 0.0, 35.96, 30.85, 0.0, 0.0, 70.72, 0.0, 0.0, 92.64, 0.0, 0.0, 0.0, 58.22, 0.0], "audiomae_on_audioset": [null, [["speech", 43.51], ["crowd", 6.65], ["outside, urban or manmade", 5.95]], [["cattle, bovinae", 32.45], ["livestock, farm animals, working animals", 31.18], ["moo", 27.96]], [["speech", 34.25], ["music", 27.02], ["boing", 4.33]], null, [["music", 19.12], ["electric shaver, electric razor", 6.72], ["speech", 6.5]], [["music", 30.96], ["bleat", 16.68], ["sheep", 11.9]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.3, 2.54, 2.31, 5.73, 1.55, 7.49, 6.02, 1.21, 0.44, 3.53, 1.69, 1.63, 2.24, 0.08, 0.22, 1.82, 2.12, -0.02]} \ No newline at end of file diff --git a/annotations_filtered/uPFxRUeRfu8_filtered.json b/annotations_filtered/uPFxRUeRfu8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..675e044daa1e4469b1b609eac8a4caf06b9d5f18 --- /dev/null +++ b/annotations_filtered/uPFxRUeRfu8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.05], [8.0, 8.67], [14.0, 32.0], [40.0, 46.43], [47.0, 48.79], [51.0, 55.85], [56.0, 57.55], [58.0, 74.22], [76.0, 102.24]], "keep_status": [false, false, false, true, false, false, false, true, true], "silence_prob": [0.0, 0.0, 29.98, 32.71, 0.0, 42.98, 0.0, 29.78, 29.43], "audiomae_on_audioset": [null, null, [["mains hum", 37.94], ["hum", 28.45], ["music", 12.43]], [["music", 36.72], ["hum", 14.48], ["mains hum", 12.01]], null, [["music", 65.8], ["animal", 4.57], ["speech", 4.51]], null, [["speech", 46.69], ["vehicle", 13.9], ["car", 6.08]], [["fly, housefly", 19.81], ["insect", 10.27], ["music", 9.27]]], "duration": [1.05, 0.67, 18.0, 6.43, 1.79, 4.85, 1.55, 16.22, 26.24]} \ No newline at end of file diff --git a/annotations_filtered/uPQcsSuWlB4_filtered.json b/annotations_filtered/uPQcsSuWlB4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54249ee13160168553f0d841d15424448819cb7b --- /dev/null +++ b/annotations_filtered/uPQcsSuWlB4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 23.43], [24.0, 26.27], [30.0, 82.07], [84.0, 85.51], [87.0, 87.2], [88.0, 120.07]], "keep_status": [true, true, false, false, false, false], "silence_prob": [32.24, 33.4, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 40.79], ["music", 17.28], ["hum", 4.97]], [["hum", 19.18], ["speech", 18.53], ["rumble", 15.05]], null, null, null, null], "duration": [2.43, 2.27, 52.07, 1.51, 0.2, 32.07]} \ No newline at end of file diff --git a/annotations_filtered/uPQlrPGbD6k_filtered.json b/annotations_filtered/uPQlrPGbD6k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e46cac28a8088282c57a75f63d22169a0e18596e --- /dev/null +++ b/annotations_filtered/uPQlrPGbD6k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.7], [8.0, 7.97], [8.0, 9.26], [9.0, 9.61], [10.0, 9.85], [11.0, 10.91], [11.0, 11.92], [13.0, 12.87], [13.0, 20.8], [22.0, 22.35], [23.0, 23.26], [25.0, 30.27], [38.0, 39.01], [44.0, 44.27], [57.0, 57.97], [60.0, 60.98], [62.0, 62.07], [64.0, 65.38], [70.0, 84.16], [90.0, 95.96], [97.0, 97.7], [98.0, 99.84], [100.0, 103.54], [104.0, 106.08], [113.0, 114.35], [115.0, 118.66], [120.0, 122.01], [123.0, 125.32], [126.0, 129.22], [133.0, 133.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.55, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.39, 99.52, 0.0, 0.0, 96.66, 99.99, 0.0, 100.0, 100.0, 99.95, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.7, -0.03, 1.26, 0.61, -0.15, -0.09, 0.92, -0.13, 7.8, 0.35, 0.26, 5.27, 1.01, 0.27, 0.97, 0.98, 0.07, 1.38, 14.16, 5.96, 0.7, 1.84, 3.54, 2.08, 1.35, 3.66, 2.01, 2.32, 3.22, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/uPS3iKFXKR4_filtered.json b/annotations_filtered/uPS3iKFXKR4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8c4c6f1331625f68f466ccfa19dbd16849e23cc --- /dev/null +++ b/annotations_filtered/uPS3iKFXKR4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.88], [12.0, 12.65], [16.0, 22.33], [24.0, 25.91], [29.0, 37.3], [39.0, 40.14], [48.0, 47.83], [48.0, 50.16], [52.0, 54.7], [57.0, 57.92], [62.0, 64.61], [66.0, 67.8], [68.0, 69.82], [74.0, 80.32], [83.0, 84.1], [90.0, 91.67], [92.0, 94.1], [100.0, 100.11], [100.0, 124.29], [129.0, 130.32], [131.0, 131.57], [132.0, 133.64], [135.0, 135.67], [137.0, 136.98], [138.0, 138.5], [142.0, 142.55], [143.0, 144.54], [145.0, 155.41], [157.0, 157.69], [163.0, 165.3], [167.0, 170.55], [172.0, 174.36], [175.0, 177.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.64, 0.0, 87.55, 0.0, 99.95, 0.0, 0.0, 94.07, 100.0, 0.0, 97.0, 0.0, 0.0, 70.02, 0.0, 0.0, 81.53, 0.0, 34.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.02, 0.0, 62.68, 91.13, 83.52, 79.76], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 35.27], ["hum", 21.42], ["synthesizer", 9.68]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.88, 0.65, 6.33, 1.91, 8.3, 1.14, -0.17, 2.16, 2.7, 0.92, 2.61, 1.8, 1.82, 6.32, 1.1, 1.67, 2.1, 0.11, 24.29, 1.32, 0.57, 1.64, 0.67, -0.02, 0.5, 0.55, 1.54, 10.41, 0.69, 2.3, 3.55, 2.36, 2.6]} \ No newline at end of file diff --git a/annotations_filtered/uPqgue3xfPI_filtered.json b/annotations_filtered/uPqgue3xfPI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc434a24c02c789acd1f129d25d9d328c763461d --- /dev/null +++ b/annotations_filtered/uPqgue3xfPI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 22.6], [24.0, 29.3], [31.0, 39.33], [42.0, 42.69], [44.0, 44.27], [52.0, 52.3], [55.0, 55.09], [56.0, 57.08], [59.0, 59.43], [63.0, 62.75], [67.0, 68.96], [71.0, 72.5], [74.0, 74.04], [77.0, 77.63], [79.0, 79.56], [81.0, 80.96], [88.0, 88.42], [90.0, 90.54], [93.0, 93.75], [95.0, 95.52], [97.0, 98.78], [99.0, 99.89], [103.0, 104.16]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.9, 33.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 71.19], ["echo", 2.98], ["outside, rural or natural", 2.27]], [["speech", 60.36], ["echo", 3.94], ["explosion", 3.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.4, 5.3, 8.33, 0.69, 0.27, 0.3, 0.09, 1.08, 0.43, -0.25, 1.96, 1.5, 0.04, 0.63, 0.56, -0.04, 0.42, 0.54, 0.75, 0.52, 1.78, 0.89, 1.16]} \ No newline at end of file diff --git a/annotations_filtered/uPwo-nHWQaM_filtered.json b/annotations_filtered/uPwo-nHWQaM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..708c6c2b6c05a6abd672755013ff8ad4317b8e21 --- /dev/null +++ b/annotations_filtered/uPwo-nHWQaM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.28], [6.0, 6.32], [11.0, 16.77], [19.0, 19.04], [29.0, 29.89], [33.0, 33.72], [38.0, 39.07], [44.0, 43.77], [59.0, 60.05], [61.0, 66.73], [69.0, 69.55], [70.0, 77.28], [81.0, 81.62], [86.0, 85.94], [87.0, 87.08], [90.0, 90.14], [96.0, 96.43], [110.0, 110.74], [114.0, 114.59], [117.0, 117.53], [119.0, 119.13], [119.0, 119.16]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 37.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.7, 0.0, 38.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 15.04], ["speech", 10.02], ["whale vocalization", 9.9]], null, null, null, null, null, null, [["hum", 19.84], ["rumble", 11.31], ["throbbing", 8.08]], null, [["music", 32.19], ["speech", 29.57], ["musical instrument", 6.89]], null, null, null, null, null, null, null, null, null, null], "duration": [0.28, 0.32, 5.77, 0.04, 0.89, 0.72, 1.07, -0.23, 1.05, 5.73, 0.55, 7.28, 0.62, -0.06, 0.08, 0.14, 0.43, 0.74, 0.59, 0.53, 0.13, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/uQ84SYJmHYI_filtered.json b/annotations_filtered/uQ84SYJmHYI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcc931a073bd06b69efe2902386900cdc5a0cfe8 --- /dev/null +++ b/annotations_filtered/uQ84SYJmHYI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.08], [4.0, 4.45], [6.0, 6.17], [8.0, 8.34], [29.0, 29.56], [31.0, 35.28], [36.0, 37.0], [38.0, 38.91], [40.0, 40.24], [41.0, 41.62], [42.0, 43.17], [44.0, 44.47], [45.0, 64.08], [65.0, 65.5], [69.0, 86.86], [88.0, 88.7], [89.0, 90.64], [99.0, 99.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.08, 0.45, 0.17, 0.34, 0.56, 4.28, 1.0, 0.91, 0.24, 0.62, 1.17, 0.47, 19.08, 0.5, 17.86, 0.7, 1.64, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/uQLeZO2Z1YQ_filtered.json b/annotations_filtered/uQLeZO2Z1YQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2485ce721b9a0a1b1cde373edfdff7efeb3e409e --- /dev/null +++ b/annotations_filtered/uQLeZO2Z1YQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.23], [14.0, 16.75], [19.0, 30.4], [33.0, 36.24], [37.0, 38.58], [39.0, 38.7], [41.0, 122.98], [123.0, 123.01], [124.0, 137.44], [139.0, 147.95]], "keep_status": [false, true, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 32.7, 31.58, 32.67, 0.0, 0.0, 0.0, 0.0, 32.87, 33.89], "audiomae_on_audioset": [null, [["hum", 21.19], ["mains hum", 18.31], ["music", 13.96]], [["music", 57.25], ["didgeridoo", 21.94], ["musical instrument", 6.46]], [["music", 65.97], ["theremin", 6.74], ["didgeridoo", 4.18]], null, null, null, null, [["music", 25.44], ["fly, housefly", 22.14], ["mosquito", 10.62]], [["music", 38.81], ["throbbing", 10.73], ["vehicle", 4.14]]], "duration": [0.23, 2.75, 11.4, 3.24, 1.58, -0.3, 81.98, 0.01, 13.44, 8.95]} \ No newline at end of file diff --git a/annotations_filtered/uQR_i0ydJik_filtered.json b/annotations_filtered/uQR_i0ydJik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..893e4b5816f066e6b20d493c86dfdd2dfc834ba2 --- /dev/null +++ b/annotations_filtered/uQR_i0ydJik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 19.2], [22.0, 23.16], [24.0, 25.2], [29.0, 29.81], [31.0, 31.75], [33.0, 34.94], [45.0, 46.06], [48.0, 48.9], [54.0, 54.21], [55.0, 55.46], [57.0, 57.3], [61.0, 61.79], [62.0, 63.27], [69.0, 68.81], [73.0, 73.74], [79.0, 79.79], [84.0, 85.53]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [47.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 36.09], ["tubular bells", 13.64], ["singing bowl", 4.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.2, 1.16, 1.2, 0.81, 0.75, 1.94, 1.06, 0.9, 0.21, 0.46, 0.3, 0.79, 1.27, -0.19, 0.74, 0.79, 1.53]} \ No newline at end of file diff --git a/annotations_filtered/uQ_nGVp6x6U_filtered.json b/annotations_filtered/uQ_nGVp6x6U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d1f4c656c412879f3d17789709945f30be6108f --- /dev/null +++ b/annotations_filtered/uQ_nGVp6x6U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.46], [17.0, 18.69], [21.0, 26.45], [27.0, 28.21], [29.0, 29.22], [32.0, 32.26], [37.0, 37.81], [40.0, 42.04], [46.0, 46.57], [47.0, 73.2], [74.0, 76.11], [90.0, 91.59], [96.0, 96.13], [97.0, 97.92], [102.0, 102.9], [107.0, 107.23], [113.0, 114.61], [126.0, 127.16], [129.0, 129.56], [131.0, 132.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.43, 0.0, 0.0, 0.0, 0.0, 54.43, 0.0, 30.09, 31.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 72.63], ["crushing", 4.7], ["animal", 1.82]], null, null, null, null, null, null, [["music", 72.56], ["drum machine", 5.87], ["electronic music", 3.18]], [["music", 74.8], ["musical instrument", 4.68], ["guitar", 4.04]], null, null, null, null, null, null, null, null, null], "duration": [0.46, 1.69, 5.45, 1.21, 0.22, 0.26, 0.81, 2.04, 0.57, 26.2, 2.11, 1.59, 0.13, 0.92, 0.9, 0.23, 1.61, 1.16, 0.56, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/uQlKjRScXww_filtered.json b/annotations_filtered/uQlKjRScXww_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebf64a9e0a09d8124b9f58726bc85ef2a8fca509 --- /dev/null +++ b/annotations_filtered/uQlKjRScXww_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.54], [4.0, 4.6], [7.0, 7.75], [8.0, 8.94], [19.0, 19.26], [21.0, 22.22], [24.0, 24.54], [26.0, 26.62], [28.0, 28.65], [30.0, 30.01], [36.0, 36.68], [38.0, 38.89], [45.0, 46.75], [51.0, 51.68], [60.0, 61.5], [74.0, 74.88], [76.0, 79.35], [82.0, 81.75], [85.0, 86.53], [91.0, 91.67], [94.0, 94.76], [103.0, 103.86], [111.0, 111.43], [112.0, 113.05], [118.0, 118.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.54, 0.6, 0.75, 0.94, 0.26, 1.22, 0.54, 0.62, 0.65, 0.01, 0.68, 0.89, 1.75, 0.68, 1.5, 0.88, 3.35, -0.25, 1.53, 0.67, 0.76, 0.86, 0.43, 1.05, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/uQpHx3lBGms_filtered.json b/annotations_filtered/uQpHx3lBGms_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b55df901555e1e3b72732101158555aeff4b404c --- /dev/null +++ b/annotations_filtered/uQpHx3lBGms_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.33], [19.0, 20.04], [22.0, 27.3], [31.0, 49.33], [51.0, 53.42], [60.0, 63.09], [64.0, 66.8], [68.0, 89.13]], "keep_status": [false, false, true, true, true, false, true, true], "silence_prob": [0.0, 0.0, 46.61, 36.27, 36.25, 34.13, 32.85, 28.48], "audiomae_on_audioset": [null, null, [["hum", 29.94], ["mains hum", 24.88], ["throbbing", 11.68]], [["speech", 21.67], ["mains hum", 16.87], ["hum", 14.76]], [["microwave oven", 13.34], ["hum", 12.77], ["vehicle", 8.99]], [["music", 39.12], ["mains hum", 25.84], ["hum", 14.46]], [["music", 34.07], ["mains hum", 17.01], ["hum", 10.05]], [["music", 27.81], ["speech", 18.48], ["hum", 16.09]]], "duration": [0.33, 1.04, 5.3, 18.33, 2.42, 3.09, 2.8, 21.13]} \ No newline at end of file diff --git a/annotations_filtered/uR7yS87K1tA_filtered.json b/annotations_filtered/uR7yS87K1tA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33eb59f7fccf5b6db7bf258bead489c24062e6e1 --- /dev/null +++ b/annotations_filtered/uR7yS87K1tA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.45], [1.0, 3.25], [7.0, 9.14], [10.0, 11.23], [15.0, 15.63], [18.0, 19.13], [23.0, 22.91], [26.0, 26.16], [30.0, 30.79], [33.0, 34.53], [35.0, 37.2], [38.0, 39.61], [41.0, 41.52], [47.0, 48.02], [58.0, 58.65], [60.0, 61.99], [64.0, 65.11], [68.0, 67.71], [71.0, 72.42], [73.0, 74.21], [81.0, 81.7], [83.0, 83.54], [86.0, 86.48], [87.0, 88.23], [95.0, 95.28], [101.0, 102.12], [103.0, 104.87], [107.0, 108.78], [114.0, 113.98], [116.0, 116.55], [118.0, 119.74], [120.0, 121.78], [123.0, 123.79], [124.0, 125.41], [126.0, 126.55], [140.0, 140.37], [141.0, 142.47], [144.0, 146.15], [147.0, 147.77], [153.0, 157.27], [158.0, 160.2], [161.0, 162.55], [163.0, 164.86], [166.0, 168.47], [170.0, 171.54], [173.0, 173.74], [174.0, 179.07], [179.0, 181.35], [183.0, 183.41], [187.0, 188.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.96, 97.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.17, 0.0, 99.99, 99.97, 0.0, 0.0, 99.96, 0.0, 0.0, 90.6, 53.22, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 2.25, 2.14, 1.23, 0.63, 1.13, -0.09, 0.16, 0.79, 1.53, 2.2, 1.61, 0.52, 1.02, 0.65, 1.99, 1.11, -0.29, 1.42, 1.21, 0.7, 0.54, 0.48, 1.23, 0.28, 1.12, 1.87, 1.78, -0.02, 0.55, 1.74, 1.78, 0.79, 1.41, 0.55, 0.37, 1.47, 2.15, 0.77, 4.27, 2.2, 1.55, 1.86, 2.47, 1.54, 0.74, 5.07, 2.35, 0.41, 1.52]} \ No newline at end of file diff --git a/annotations_filtered/uRjbDsGz2tc_filtered.json b/annotations_filtered/uRjbDsGz2tc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a62d7272f5431d759fd679c6ffff484782f5554a --- /dev/null +++ b/annotations_filtered/uRjbDsGz2tc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.42], [8.0, 9.78], [12.0, 14.27], [25.0, 27.84], [29.0, 30.72], [32.0, 40.63], [41.0, 59.49], [60.0, 60.37], [61.0, 61.91], [63.0, 63.41], [68.0, 69.21], [72.0, 72.28], [73.0, 76.38], [81.0, 81.55], [87.0, 87.89], [91.0, 91.74], [95.0, 95.74], [99.0, 99.72], [104.0, 103.64], [107.0, 109.38], [113.0, 115.11], [116.0, 117.56], [118.0, 120.85], [122.0, 123.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [94.22, 0.0, 100.0, 97.92, 0.0, 90.95, 60.42, 0.0, 0.0, 0.0, 0.0, 0.0, 89.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 45.72, 0.0, 51.6, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.58], ["guitar", 13.8], ["musical instrument", 11.16]], null, null, null], "duration": [2.42, 1.78, 2.27, 2.84, 1.72, 8.63, 18.49, 0.37, 0.91, 0.41, 1.21, 0.28, 3.38, 0.55, 0.89, 0.74, 0.74, 0.72, -0.36, 2.38, 2.11, 1.56, 2.85, 1.96]} \ No newline at end of file diff --git a/annotations_filtered/uRxCU1MW8B4_filtered.json b/annotations_filtered/uRxCU1MW8B4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca765a96fdec48148d876416ac93a5594fe0f034 --- /dev/null +++ b/annotations_filtered/uRxCU1MW8B4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.01], [4.0, 5.43], [7.0, 7.1], [8.0, 8.83], [11.0, 11.64], [17.0, 17.93], [19.0, 27.6], [28.0, 29.69], [34.0, 36.14], [40.0, 42.01], [50.0, 51.14], [53.0, 54.26], [55.0, 55.75], [59.0, 63.1], [67.0, 67.15], [67.0, 68.89], [70.0, 71.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.57, 0.0, 53.65, 91.13, 0.0, 0.0, 0.0, 59.59, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 59.55], ["mains hum", 13.99], ["hum", 11.86]], null, null, null, null, null, null, null, null, null, null], "duration": [1.01, 1.43, 0.1, 0.83, 0.64, 0.93, 8.6, 1.69, 2.14, 2.01, 1.14, 1.26, 0.75, 4.1, 0.15, 1.89, 1.54]} \ No newline at end of file diff --git a/annotations_filtered/uSCNsJDEf1M_filtered.json b/annotations_filtered/uSCNsJDEf1M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f022e590cd6cdbd32545dc0e228f17059326c697 --- /dev/null +++ b/annotations_filtered/uSCNsJDEf1M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.8], [11.0, 15.18], [17.0, 17.54], [20.0, 34.18], [35.0, 36.9], [37.0, 42.33], [45.0, 51.51], [52.0, 53.52], [59.0, 65.21], [66.0, 66.6], [68.0, 68.88], [70.0, 71.52], [73.0, 73.82], [81.0, 90.24], [91.0, 92.13], [95.0, 99.79], [101.0, 102.54], [103.0, 104.03], [105.0, 106.86], [108.0, 115.35], [117.0, 117.66], [119.0, 119.08], [120.0, 119.77], [120.0, 123.42]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.15, 0.0, 38.95, 0.0, 34.14, 52.39, 0.0, 51.55, 0.0, 0.0, 0.0, 0.0, 51.34, 0.0, 94.22, 0.0, 0.0, 0.0, 46.33, 0.0, 0.0, 0.0, 82.97], "audiomae_on_audioset": [null, [["speech", 57.92], ["sidetone", 29.03], ["music", 2.77]], null, [["crushing", 24.34], ["noise", 18.19], ["music", 10.98]], null, [["speech", 51.88], ["sidetone", 8.5], ["fart", 5.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.4], ["music", 13.78], ["effects unit", 3.86]], null, null, null, null], "duration": [1.8, 4.18, 0.54, 14.18, 1.9, 5.33, 6.51, 1.52, 6.21, 0.6, 0.88, 1.52, 0.82, 9.24, 1.13, 4.79, 1.54, 1.03, 1.86, 7.35, 0.66, 0.08, -0.23, 3.42]} \ No newline at end of file diff --git a/annotations_filtered/uSLscJ2cY04_filtered.json b/annotations_filtered/uSLscJ2cY04_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5a0c425c7ce666dca99ca7cf12269b2eab36fc5 --- /dev/null +++ b/annotations_filtered/uSLscJ2cY04_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.54], [5.0, 10.37], [15.0, 15.55], [25.0, 25.47], [28.0, 28.65], [35.0, 36.07], [44.0, 44.14], [45.0, 46.94], [58.0, 59.64], [61.0, 61.57], [64.0, 65.33], [69.0, 70.39], [74.0, 74.93], [83.0, 83.4], [89.0, 89.07], [90.0, 91.4], [101.0, 102.27], [106.0, 106.59], [111.0, 111.64], [124.0, 124.55], [125.0, 126.74], [129.0, 128.61], [158.0, 159.14], [162.0, 162.33], [168.0, 169.55], [170.0, 170.83], [173.0, 174.02], [178.0, 178.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.54, 5.37, 0.55, 0.47, 0.65, 1.07, 0.14, 1.94, 1.64, 0.57, 1.33, 1.39, 0.93, 0.4, 0.07, 1.4, 1.27, 0.59, 0.64, 0.55, 1.74, -0.39, 1.14, 0.33, 1.55, 0.83, 1.02, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/uSMxnpecSZM_filtered.json b/annotations_filtered/uSMxnpecSZM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ef6fd365fc6852ec3875118fe8761efc9eafc69 --- /dev/null +++ b/annotations_filtered/uSMxnpecSZM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[100.0, 101.22], [103.0, 104.38], [104.0, 120.29], [135.0, 135.65], [140.0, 152.64], [154.0, 155.71]], "keep_status": [false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 31.18, 0.0, 32.91, 0.0], "audiomae_on_audioset": [null, null, [["music", 75.55], ["musical instrument", 4.23], ["trombone", 4.19]], null, [["music", 27.83], ["moo", 13.8], ["cattle, bovinae", 12.49]], null], "duration": [1.22, 1.38, 16.29, 0.65, 12.64, 1.71]} \ No newline at end of file diff --git a/annotations_filtered/uSO45koeLhk_filtered.json b/annotations_filtered/uSO45koeLhk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1599080b8e72c5265eeaa6fbdf162b732a5658ef --- /dev/null +++ b/annotations_filtered/uSO45koeLhk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.53], [11.0, 11.25], [24.0, 26.4], [30.0, 31.01], [33.0, 33.69], [35.0, 40.19], [43.0, 48.91], [49.0, 55.24], [57.0, 57.08], [60.0, 60.74], [62.0, 63.36], [67.0, 67.54], [69.0, 70.01], [75.0, 75.98], [77.0, 77.52], [80.0, 80.35], [94.0, 94.47], [96.0, 96.42], [99.0, 103.23], [106.0, 108.18], [110.0, 121.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 99.52, 0.0, 0.0, 99.94, 100.0, 96.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.7, 37.95, 41.09], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.39], ["speech", 17.92], ["crowd", 4.1]], [["music", 47.61], ["musical instrument", 3.77], ["speech", 3.37]], [["music", 52.85], ["speech", 6.23], ["brass instrument", 3.86]]], "duration": [1.53, 0.25, 2.4, 1.01, 0.69, 5.19, 5.91, 6.24, 0.08, 0.74, 1.36, 0.54, 1.01, 0.98, 0.52, 0.35, 0.47, 0.42, 4.23, 2.18, 11.86]} \ No newline at end of file diff --git a/annotations_filtered/uSZi8oPRUkE_filtered.json b/annotations_filtered/uSZi8oPRUkE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e07f02fec5119eb6d6ebed29b45ce9aac9db1a81 --- /dev/null +++ b/annotations_filtered/uSZi8oPRUkE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 17.78], [19.0, 21.14], [24.0, 32.26], [33.0, 34.11], [35.0, 35.01], [36.0, 38.4], [39.0, 40.36], [42.0, 48.78], [49.0, 48.9], [52.0, 58.7], [67.0, 72.28], [74.0, 76.32], [77.0, 80.81], [87.0, 89.07], [90.0, 91.05], [94.0, 102.68], [107.0, 125.29]], "keep_status": [false, false, true, false, false, true, false, true, false, true, true, true, true, false, false, false, true], "silence_prob": [32.11, 50.76, 29.99, 0.0, 0.0, 29.26, 0.0, 37.61, 0.0, 29.98, 35.87, 48.95, 37.16, 33.34, 0.0, 32.21, 31.32], "audiomae_on_audioset": [[["music", 36.59], ["hum", 32.55], ["mains hum", 13.23]], null, [["music", 47.81], ["hum", 12.34], ["mains hum", 5.84]], null, null, [["whale vocalization", 18.75], ["music", 13.47], ["sound effect", 8.37]], null, [["music", 20.5], ["insect", 9.55], ["animal", 8.07]], null, [["fly, housefly", 17.6], ["music", 13.47], ["buzz", 12.15]], [["music", 37.0], ["throbbing", 12.87], ["hum", 12.21]], [["music", 35.73], ["speech", 12.72], ["theremin", 3.62]], [["music", 58.78], ["speech", 6.18], ["electronic music", 3.85]], [["music", 32.75], ["speech", 26.35], ["sidetone", 22.63]], null, [["music", 44.67], ["speech", 34.75], ["outside, rural or natural", 1.31]], [["music", 35.64], ["hum", 10.46], ["speech", 9.74]]], "duration": [10.78, 2.14, 8.26, 1.11, 0.01, 2.4, 1.36, 6.78, -0.1, 6.7, 5.28, 2.32, 3.81, 2.07, 1.05, 8.68, 18.29]} \ No newline at end of file diff --git a/annotations_filtered/uSkVR8Tbu8c_filtered.json b/annotations_filtered/uSkVR8Tbu8c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b62a3a4f871b72053ce8102a5e9021dad5742579 --- /dev/null +++ b/annotations_filtered/uSkVR8Tbu8c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 23.14]], "keep_status": [true], "silence_prob": [29.51], "audiomae_on_audioset": [[["speech", 53.57], ["music", 10.38], ["hum", 3.97]]], "duration": [11.14]} \ No newline at end of file diff --git a/annotations_filtered/uSsUoxlSADk_filtered.json b/annotations_filtered/uSsUoxlSADk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..524b3ceb105d37dec3041b9274d2af95bb9e1ff9 --- /dev/null +++ b/annotations_filtered/uSsUoxlSADk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.61], [39.0, 39.88], [57.0, 60.18], [66.0, 72.67], [88.0, 88.7], [120.0, 120.97]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 31.62, 30.91, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 52.13], ["musical instrument", 9.25], ["brass instrument", 9.03]], [["music", 50.92], ["theremin", 11.15], ["effects unit", 5.09]], null, null], "duration": [0.61, 0.88, 3.18, 6.67, 0.7, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/uSuoZcrKq0I_filtered.json b/annotations_filtered/uSuoZcrKq0I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7dc1f11e0cb57eeab8682c2cd216f67cd3229cb8 --- /dev/null +++ b/annotations_filtered/uSuoZcrKq0I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 18.62], [20.0, 21.12], [24.0, 24.49], [28.0, 32.34], [34.0, 34.74], [36.0, 45.05], [50.0, 50.7], [51.0, 56.49], [57.0, 60.0], [60.0, 63.27], [64.0, 65.38], [68.0, 68.52], [70.0, 71.44], [73.0, 74.6], [76.0, 76.64], [79.0, 79.37], [80.0, 80.37], [82.0, 82.66], [84.0, 84.72], [85.0, 85.58], [86.0, 86.39], [87.0, 88.13], [90.0, 90.34], [92.0, 93.56], [94.0, 109.27], [115.0, 119.5], [122.0, 124.19]], "keep_status": [true, false, false, true, false, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [33.6, 0.0, 0.0, 33.89, 0.0, 35.03, 0.0, 34.55, 34.26, 39.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.31, 31.67, 38.28], "audiomae_on_audioset": [[["hum", 29.06], ["music", 21.31], ["mains hum", 6.47]], null, null, [["hum", 29.26], ["mains hum", 25.15], ["music", 10.03]], null, [["music", 33.05], ["didgeridoo", 10.14], ["speech", 9.02]], null, [["music", 52.75], ["throbbing", 7.58], ["musical instrument", 7.06]], [["sidetone", 73.57], ["radio", 10.74], ["speech", 8.44]], [["frog", 30.79], ["throbbing", 19.63], ["croak", 12.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 53.38], ["mains hum", 22.19], ["throbbing", 3.04]], [["music", 25.77], ["noise", 24.64], ["synthesizer", 7.82]], [["hum", 27.99], ["throbbing", 23.0], ["noise", 8.26]]], "duration": [15.62, 1.12, 0.49, 4.34, 0.74, 9.05, 0.7, 5.49, 3.0, 3.27, 1.38, 0.52, 1.44, 1.6, 0.64, 0.37, 0.37, 0.66, 0.72, 0.58, 0.39, 1.13, 0.34, 1.56, 15.27, 4.5, 2.19]} \ No newline at end of file diff --git a/annotations_filtered/uSvAfRaxSu4_filtered.json b/annotations_filtered/uSvAfRaxSu4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0713a90ad040a3cf2c0cff1fda11605ffd4bfbf6 --- /dev/null +++ b/annotations_filtered/uSvAfRaxSu4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 14.66], [16.0, 17.74], [18.0, 17.79], [18.0, 18.82], [20.0, 32.41], [36.0, 51.12], [57.0, 65.69], [67.0, 67.74], [68.0, 89.4], [90.0, 91.84], [94.0, 97.65], [98.0, 108.8], [109.0, 109.76], [111.0, 113.81], [114.0, 116.92]], "keep_status": [false, false, false, false, true, true, true, false, true, false, false, false, false, false, false], "silence_prob": [66.76, 0.0, 0.0, 0.0, 36.64, 43.18, 36.15, 0.0, 36.93, 0.0, 79.76, 85.72, 0.0, 79.76, 73.97], "audiomae_on_audioset": [null, null, null, null, [["speech", 53.04], ["electric shaver, electric razor", 4.71], ["mosquito", 4.21]], [["arrow", 19.46], ["speech", 15.12], ["creak", 10.89]], [["creak", 25.38], ["hum", 11.98], ["speech", 11.67]], null, [["speech", 12.94], ["whack, thwack", 11.36], ["hammer", 8.83]], null, null, null, null, null, null], "duration": [10.66, 1.74, -0.21, 0.82, 12.41, 15.12, 8.69, 0.74, 21.4, 1.84, 3.65, 10.8, 0.76, 2.81, 2.92]} \ No newline at end of file diff --git a/annotations_filtered/uTOoWlYv95w_filtered.json b/annotations_filtered/uTOoWlYv95w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4b45d251e7b241eebb74298bcd62fe10e332319 --- /dev/null +++ b/annotations_filtered/uTOoWlYv95w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 57.3], [61.0, 61.26], [63.0, 63.21], [64.0, 66.29], [68.0, 113.49], [117.0, 150.03]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.09, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 19.54], ["fly, housefly", 14.77], ["speech", 11.71]], null, null], "duration": [30.3, 0.26, 0.21, 2.29, 45.49, 33.03]} \ No newline at end of file diff --git a/annotations_filtered/uTUupV0ZfBk_filtered.json b/annotations_filtered/uTUupV0ZfBk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..929b27300bb6dba69182464b2d91bfafc9b7040b --- /dev/null +++ b/annotations_filtered/uTUupV0ZfBk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.71], [11.0, 11.45], [13.0, 14.44], [18.0, 19.58], [22.0, 23.31], [25.0, 26.06], [29.0, 30.5], [32.0, 32.49], [44.0, 45.23], [47.0, 78.22], [81.0, 108.45]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [39.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.82], "audiomae_on_audioset": [[["music", 31.34], ["noise", 8.27], ["fly, housefly", 4.57]], null, null, null, null, null, null, null, null, null, [["noise", 19.58], ["fly, housefly", 17.87], ["mosquito", 11.37]]], "duration": [2.71, 0.45, 1.44, 1.58, 1.31, 1.06, 1.5, 0.49, 1.23, 31.22, 27.45]} \ No newline at end of file diff --git a/annotations_filtered/uU0DNCV22dU_filtered.json b/annotations_filtered/uU0DNCV22dU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74c90a61c16b5cd1888e9d73caefebe82f11184b --- /dev/null +++ b/annotations_filtered/uU0DNCV22dU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 21.74], [23.0, 28.11], [28.0, 28.44], [29.0, 75.88], [79.0, 96.94], [100.0, 99.87]], "keep_status": [true, false, false, false, true, false], "silence_prob": [31.42, 31.02, 0.0, 0.0, 29.92, 0.0], "audiomae_on_audioset": [[["speech", 28.91], ["buzz", 11.39], ["vehicle", 8.66]], [["hum", 30.83], ["mains hum", 21.08], ["breaking", 19.03]], null, null, [["music", 32.18], ["hum", 15.36], ["throbbing", 13.16]], null], "duration": [10.74, 5.11, 0.44, 46.88, 17.94, -0.13]} \ No newline at end of file diff --git a/annotations_filtered/uU59kXuJHhI_filtered.json b/annotations_filtered/uU59kXuJHhI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2eb32efc0b07d59070845cb36ba3842de7fe5ad --- /dev/null +++ b/annotations_filtered/uU59kXuJHhI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 18.59], [22.0, 23.04], [32.0, 33.59], [35.0, 35.13], [52.0, 52.17], [64.0, 64.83], [69.0, 68.96], [76.0, 76.01], [86.0, 90.83], [91.0, 94.04], [95.0, 95.32], [103.0, 104.04], [106.0, 107.57], [109.0, 111.42]], "keep_status": [true, false, false, false, false, false, false, false, true, true, false, false, false, true], "silence_prob": [32.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.57, 38.08, 0.0, 0.0, 0.0, 41.91], "audiomae_on_audioset": [[["music", 40.19], ["speech", 22.46], ["throbbing", 7.32]], null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 31.43], ["cattle, bovinae", 19.8], ["moo", 17.88]], [["music", 39.58], ["throbbing", 13.57], ["speech", 5.95]], null, null, null, [["music", 56.28], ["didgeridoo", 8.49], ["throbbing", 4.78]]], "duration": [8.59, 1.04, 1.59, 0.13, 0.17, 0.83, -0.04, 0.01, 4.83, 3.04, 0.32, 1.04, 1.57, 2.42]} \ No newline at end of file diff --git a/annotations_filtered/uU6LIbi7NZQ_filtered.json b/annotations_filtered/uU6LIbi7NZQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..adba645235fe22fad2b4682e02edf3c457c5428d --- /dev/null +++ b/annotations_filtered/uU6LIbi7NZQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 62.72]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [57.72]} \ No newline at end of file diff --git a/annotations_filtered/uUEpwPiiGco_filtered.json b/annotations_filtered/uUEpwPiiGco_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/uUEpwPiiGco_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/uUPHlAbAf2I_filtered.json b/annotations_filtered/uUPHlAbAf2I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b9bc78be78357b504b9b2f458eea6a726cc2d71 --- /dev/null +++ b/annotations_filtered/uUPHlAbAf2I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.96], [10.0, 10.62], [13.0, 13.39], [15.0, 14.99], [16.0, 19.67], [20.0, 21.32], [23.0, 25.12], [26.0, 30.4], [31.0, 32.24], [40.0, 40.46], [44.0, 47.06], [48.0, 47.76], [49.0, 49.37], [50.0, 51.09], [53.0, 55.02], [56.0, 55.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 33.09, 0.0, 37.78, 33.16, 0.0, 0.0, 37.08, 0.0, 0.0, 0.0, 30.17, 0.0], "audiomae_on_audioset": [null, null, null, null, [["livestock, farm animals, working animals", 41.53], ["cattle, bovinae", 34.37], ["moo", 17.34]], null, [["speech", 34.76], ["busy signal", 28.54], ["sidetone", 17.28]], [["speech", 40.89], ["fart", 22.51], ["sidetone", 9.47]], null, null, [["whale vocalization", 13.32], ["theremin", 7.77], ["stomach rumble", 7.3]], null, null, null, [["howl", 44.05], ["canidae, dogs, wolves", 22.37], ["animal", 11.96]], null], "duration": [-0.04, 0.62, 0.39, -0.01, 3.67, 1.32, 2.12, 4.4, 1.24, 0.46, 3.06, -0.24, 0.37, 1.09, 2.02, -0.3]} \ No newline at end of file diff --git a/annotations_filtered/uU_ftZ6EfX8_filtered.json b/annotations_filtered/uU_ftZ6EfX8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b7b048b84ec67da29314d3e0c876be3003ad838 --- /dev/null +++ b/annotations_filtered/uU_ftZ6EfX8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.84], [4.0, 4.5], [6.0, 6.67], [8.0, 8.61], [17.0, 18.13], [20.0, 19.82], [35.0, 37.25], [39.0, 59.44], [62.0, 77.16], [94.0, 95.18], [103.0, 104.01], [104.0, 106.44], [113.0, 113.56], [114.0, 128.58], [130.0, 130.45], [131.0, 132.44], [135.0, 145.1], [147.0, 148.41], [153.0, 157.92], [161.0, 161.32], [163.0, 162.68], [164.0, 164.13], [167.0, 168.29], [172.0, 176.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 61.87, 63.31, 0.0, 0.0, 62.78, 0.0, 61.27, 0.0, 0.0, 59.51, 0.0, 77.36, 0.0, 0.0, 0.0, 0.0, 84.43], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.84, 0.5, 0.67, 0.61, 1.13, -0.18, 2.25, 20.44, 15.16, 1.18, 1.01, 2.44, 0.56, 14.58, 0.45, 1.44, 10.1, 1.41, 4.92, 0.32, -0.32, 0.13, 1.29, 4.35]} \ No newline at end of file diff --git a/annotations_filtered/uUuTz9Hjc34_filtered.json b/annotations_filtered/uUuTz9Hjc34_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bad7d72aee225bdbdd1b8f6d84dd30c4697b237d --- /dev/null +++ b/annotations_filtered/uUuTz9Hjc34_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 15.77], [16.0, 18.81], [19.0, 18.94], [19.0, 19.08], [20.0, 21.07], [22.0, 38.47], [44.0, 45.55], [46.0, 50.35], [51.0, 71.19], [74.0, 81.58], [83.0, 86.59], [89.0, 90.05], [91.0, 93.18], [94.0, 95.07], [96.0, 106.71], [110.0, 126.82], [127.0, 134.42], [135.0, 139.18], [140.0, 165.18], [166.0, 167.58]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [33.13, 30.99, 0.0, 0.0, 0.0, 38.46, 0.0, 46.97, 40.62, 58.13, 43.98, 0.0, 71.14, 0.0, 36.28, 39.34, 56.4, 77.36, 52.86, 0.0], "audiomae_on_audioset": [[["music", 36.64], ["throbbing", 30.87], ["speech", 5.44]], [["hum", 36.99], ["throbbing", 21.0], ["mains hum", 17.6]], null, null, null, [["music", 55.77], ["hum", 16.69], ["mains hum", 10.93]], null, [["speech", 20.65], ["didgeridoo", 18.54], ["music", 17.58]], [["throbbing", 28.88], ["music", 26.57], ["hum", 21.52]], null, [["cattle, bovinae", 18.69], ["livestock, farm animals, working animals", 14.27], ["moo", 12.07]], null, null, null, [["music", 29.21], ["hum", 19.05], ["mains hum", 18.6]], [["music", 72.16], ["hum", 6.09], ["ambient music", 4.06]], null, null, null, null], "duration": [8.77, 2.81, -0.06, 0.08, 1.07, 16.47, 1.55, 4.35, 20.19, 7.58, 3.59, 1.05, 2.18, 1.07, 10.71, 16.82, 7.42, 4.18, 25.18, 1.58]} \ No newline at end of file diff --git a/annotations_filtered/uV-u-N8RkKs_filtered.json b/annotations_filtered/uV-u-N8RkKs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9619d6b7bf651340347c4473ffe0d4dd48db130 --- /dev/null +++ b/annotations_filtered/uV-u-N8RkKs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.49], [14.0, 51.11], [54.0, 78.34], [79.0, 80.67]], "keep_status": [false, false, false, false], "silence_prob": [100.0, 0.0, 99.91, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [4.49, 37.11, 24.34, 1.67]} \ No newline at end of file diff --git a/annotations_filtered/uW9Q1cm_Tnw_filtered.json b/annotations_filtered/uW9Q1cm_Tnw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81ff365df1ce3cb6be5a58e299affabb661d88ff --- /dev/null +++ b/annotations_filtered/uW9Q1cm_Tnw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 38.2]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.2]} \ No newline at end of file diff --git a/annotations_filtered/uWY60oFlfxs_filtered.json b/annotations_filtered/uWY60oFlfxs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebf423c7785def98a79a6f05d0fb908557d6a8ff --- /dev/null +++ b/annotations_filtered/uWY60oFlfxs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.97], [8.0, 10.64], [14.0, 13.93], [16.0, 17.27], [22.0, 22.74], [23.0, 30.62], [38.0, 38.4], [38.0, 38.5], [39.0, 39.36], [40.0, 40.78], [44.0, 45.15], [49.0, 49.55], [60.0, 61.18], [62.0, 62.28], [64.0, 64.72], [69.0, 69.2], [80.0, 80.52], [85.0, 85.46], [92.0, 94.61], [95.0, 95.49], [96.0, 96.31], [97.0, 97.21], [99.0, 99.87], [100.0, 101.58], [104.0, 106.61], [107.0, 108.75], [112.0, 113.05], [114.0, 116.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.31, 0.0, 0.0, 0.0, 95.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.14, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 0.0, 99.84], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.23], ["wail, moan", 8.92], ["animal", 7.74]], null, null, null, null, null, null, null, null, null], "duration": [0.97, 2.64, -0.07, 1.27, 0.74, 7.62, 0.4, 0.5, 0.36, 0.78, 1.15, 0.55, 1.18, 0.28, 0.72, 0.2, 0.52, 0.46, 2.61, 0.49, 0.31, 0.21, 0.87, 1.58, 2.61, 1.75, 1.05, 2.09]} \ No newline at end of file diff --git a/annotations_filtered/uX7CAoxBNOU_filtered.json b/annotations_filtered/uX7CAoxBNOU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da1cff89f254e3ea0fe41bbdc9ecdea3827cfe03 --- /dev/null +++ b/annotations_filtered/uX7CAoxBNOU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.57], [4.0, 5.93], [10.0, 10.29], [13.0, 14.18], [17.0, 18.49], [23.0, 23.97], [26.0, 31.45], [33.0, 32.91], [34.0, 35.19], [36.0, 44.04], [45.0, 50.13], [51.0, 51.09], [52.0, 53.76], [55.0, 55.75], [57.0, 60.91], [62.0, 63.07], [65.0, 65.21], [67.0, 67.8], [68.0, 68.62], [70.0, 69.96], [74.0, 75.61], [76.0, 83.4], [84.0, 84.79], [86.0, 86.53], [88.0, 88.55], [91.0, 90.8], [92.0, 93.06], [99.0, 99.57], [102.0, 103.37], [104.0, 104.21], [114.0, 113.76], [116.0, 116.58], [121.0, 121.2], [124.0, 124.09], [126.0, 126.25], [127.0, 128.93], [129.0, 129.93], [132.0, 132.68], [134.0, 141.24], [144.0, 144.05], [145.0, 146.06], [151.0, 151.14], [152.0, 153.28], [157.0, 159.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.42, 0.0, 0.0, 33.48, 38.74, 0.0, 0.0, 0.0, 32.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.22, 0.0, 0.0, 0.0, 0.0, 33.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["beatboxing", 45.63], ["speech", 38.85], ["music", 7.33]], [["music", 59.63], ["drum", 7.51], ["musical instrument", 7.12]], null, null, null, [["music", 19.35], ["theremin", 11.56], ["clapping", 10.8]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 26.9], ["synthesizer", 15.21], ["didgeridoo", 6.83]], null, null, null, null, [["speech", 54.13], ["fart", 29.58], ["boing", 4.22]]], "duration": [0.57, 1.93, 0.29, 1.18, 1.49, 0.97, 5.45, -0.09, 1.19, 8.04, 5.13, 0.09, 1.76, 0.75, 3.91, 1.07, 0.21, 0.8, 0.62, -0.04, 1.61, 7.4, 0.79, 0.53, 0.55, -0.2, 1.06, 0.57, 1.37, 0.21, -0.24, 0.58, 0.2, 0.09, 0.25, 1.93, 0.93, 0.68, 7.24, 0.05, 1.06, 0.14, 1.28, 2.14]} \ No newline at end of file diff --git a/annotations_filtered/uXG9v1_X8jc_filtered.json b/annotations_filtered/uXG9v1_X8jc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65a7b1932075fe35f16ff6b6dd7d2465718b2364 --- /dev/null +++ b/annotations_filtered/uXG9v1_X8jc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.97], [9.0, 10.37], [11.0, 12.04], [14.0, 14.23], [15.0, 16.31], [18.0, 19.63], [23.0, 23.73], [27.0, 29.76], [32.0, 34.48], [38.0, 43.28], [46.0, 49.2], [50.0, 56.22], [57.0, 64.96], [67.0, 66.95], [67.0, 71.41], [72.0, 72.69], [74.0, 76.11], [78.0, 87.56], [88.0, 95.5], [97.0, 98.1], [98.0, 100.08], [105.0, 106.15], [108.0, 109.07], [119.0, 120.65], [122.0, 123.04], [124.0, 126.74], [129.0, 164.94], [166.0, 166.55]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.78, 54.36, 49.68, 57.72, 48.39, 56.63, 0.0, 31.62, 0.0, 98.8, 80.46, 51.82, 0.0, 54.43, 0.0, 0.0, 0.0, 0.0, 43.05, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["fly, housefly", 33.25], ["insect", 25.07], ["speech", 12.63]], null, [["music", 55.51], ["musical instrument", 7.15], ["guitar", 5.45]], null, [["hum", 34.75], ["mains hum", 27.91], ["music", 8.61]], null, null, [["music", 29.91], ["throbbing", 5.45], ["hum", 5.33]], null, null, null, null, null, null, null, null, null, null, [["hum", 14.41], ["fly, housefly", 11.3], ["insect", 10.09]], null, null], "duration": [0.97, 1.37, 1.04, 0.23, 1.31, 1.63, 0.73, 2.76, 2.48, 5.28, 3.2, 6.22, 7.96, -0.05, 4.41, 0.69, 2.11, 9.56, 7.5, 1.1, 2.08, 1.15, 1.07, 1.65, 1.04, 2.74, 35.94, 0.55]} \ No newline at end of file diff --git a/annotations_filtered/uXsQ8IIi6YI_filtered.json b/annotations_filtered/uXsQ8IIi6YI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e10367afe1b31e1d7f7d4b140b2225c0726862d4 --- /dev/null +++ b/annotations_filtered/uXsQ8IIi6YI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.06], [12.0, 13.14], [22.0, 22.22], [24.0, 25.41], [26.0, 27.82], [28.0, 30.32], [38.0, 38.74], [43.0, 43.23], [46.0, 51.44], [51.0, 51.61], [52.0, 80.35], [81.0, 86.0], [87.0, 88.92], [91.0, 91.77], [96.0, 97.38], [101.0, 101.95], [103.0, 104.79], [109.0, 111.69], [119.0, 119.16]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 91.98, 0.0, 0.0, 43.05, 0.0, 44.04, 64.97, 0.0, 0.0, 0.0, 0.0, 0.0, 99.84, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 39.1], ["music", 17.76], ["animal", 7.01]], null, [["music", 52.17], ["speech", 20.43], ["tabla", 3.13]], null, null, null, null, null, null, null, null], "duration": [1.06, 1.14, 0.22, 1.41, 1.82, 2.32, 0.74, 0.23, 5.44, 0.61, 28.35, 5.0, 1.92, 0.77, 1.38, 0.95, 1.79, 2.69, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/uXyvjZa6x2o_filtered.json b/annotations_filtered/uXyvjZa6x2o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..121b9c616026e91b2fd2df6ed88a06cef2bec744 --- /dev/null +++ b/annotations_filtered/uXyvjZa6x2o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.76], [8.0, 10.03], [12.0, 13.44], [14.0, 21.05], [22.0, 24.12], [26.0, 26.65], [29.0, 30.27], [32.0, 33.67], [36.0, 36.93], [38.0, 38.5], [40.0, 49.2], [50.0, 53.59], [54.0, 55.26], [57.0, 57.45], [59.0, 60.76], [63.0, 64.02], [66.0, 66.63], [69.0, 69.92], [75.0, 76.13], [80.0, 81.21], [84.0, 84.67], [87.0, 87.99], [88.0, 91.07], [92.0, 94.44], [96.0, 96.18], [98.0, 98.22], [99.0, 99.99], [103.0, 103.55], [105.0, 107.01], [110.0, 111.01], [113.0, 115.05], [117.0, 118.49], [120.0, 123.74], [125.0, 127.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.36, 0.0, 67.0, 96.66, 0.0, 0.0, 0.0, 0.0, 0.0, 47.5, 82.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.22, 96.54, 0.0, 0.0, 0.0, 0.0, 78.72, 0.0, 65.44, 0.0, 54.3, 85.54], "audiomae_on_audioset": [null, [["cattle, bovinae", 27.1], ["livestock, farm animals, working animals", 25.45], ["moo", 19.42]], null, null, null, null, null, null, null, null, [["hum", 42.91], ["speech", 17.74], ["mains hum", 13.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.76, 2.03, 1.44, 7.05, 2.12, 0.65, 1.27, 1.67, 0.93, 0.5, 9.2, 3.59, 1.26, 0.45, 1.76, 1.02, 0.63, 0.92, 1.13, 1.21, 0.67, 0.99, 3.07, 2.44, 0.18, 0.22, 0.99, 0.55, 2.01, 1.01, 2.05, 1.49, 3.74, 2.21]} \ No newline at end of file diff --git a/annotations_filtered/uYV11ZwpaSQ_filtered.json b/annotations_filtered/uYV11ZwpaSQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47fb35b5dc3c9eb84156a6003a75ee61dcce8540 --- /dev/null +++ b/annotations_filtered/uYV11ZwpaSQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.47], [9.0, 10.2], [13.0, 31.29], [32.0, 42.2], [43.0, 48.71], [50.0, 62.95], [68.0, 68.18], [69.0, 76.77], [88.0, 93.97], [97.0, 98.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 86.45, 79.76, 85.54, 69.61, 0.0, 68.15, 88.28, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [1.47, 1.2, 18.29, 10.2, 5.71, 12.95, 0.18, 7.77, 5.97, 1.54]} \ No newline at end of file diff --git a/annotations_filtered/uZ0YGah7MsE_filtered.json b/annotations_filtered/uZ0YGah7MsE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24603ce9f8f519d3170bed053ee1d901da3c37cb --- /dev/null +++ b/annotations_filtered/uZ0YGah7MsE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.13], [0.0, 1.22], [2.0, 1.75], [2.0, 7.05], [8.0, 8.14], [16.0, 16.8], [20.0, 23.01], [29.0, 29.91], [35.0, 37.72], [46.0, 50.79], [51.0, 53.18], [55.0, 56.66], [60.0, 60.86], [63.0, 65.99], [67.0, 67.66], [70.0, 70.6], [71.0, 71.61], [72.0, 75.84], [78.0, 78.61], [79.0, 81.16], [84.0, 85.65], [87.0, 87.2], [89.0, 91.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 52.16, 0.0, 0.0, 65.44, 0.0, 75.72, 94.52, 78.21, 0.0, 0.0, 83.88, 0.0, 0.0, 0.0, 99.98, 0.0, 62.58, 0.0, 0.0, 99.96], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.13, 1.22, -0.25, 5.05, 0.14, 0.8, 3.01, 0.91, 2.72, 4.79, 2.18, 1.66, 0.86, 2.99, 0.66, 0.6, 0.61, 3.84, 0.61, 2.16, 1.65, 0.2, 2.12]} \ No newline at end of file diff --git a/annotations_filtered/uZWDke-bpmc_filtered.json b/annotations_filtered/uZWDke-bpmc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6bf0eacddcd6a33b82262469c80f0e3c7ac7c3c --- /dev/null +++ b/annotations_filtered/uZWDke-bpmc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 66.31], [69.0, 73.53], [79.0, 89.48], [99.0, 99.27], [101.0, 104.89]], "keep_status": [false, false, true, false, false], "silence_prob": [33.68, 30.12, 32.21, 0.0, 31.12], "audiomae_on_audioset": [[["hum", 41.59], ["throbbing", 40.42], ["mains hum", 7.58]], [["music", 42.94], ["speech", 20.74], ["hum", 7.69]], [["music", 31.96], ["speech", 20.13], ["hum", 14.58]], null, [["music", 33.0], ["mains hum", 21.28], ["hum", 15.87]]], "duration": [28.31, 4.53, 10.48, 0.27, 3.89]} \ No newline at end of file diff --git a/annotations_filtered/uZgo9g8v76U_filtered.json b/annotations_filtered/uZgo9g8v76U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0436dfb9db5f567fce5a477eb28a22e9508d211 --- /dev/null +++ b/annotations_filtered/uZgo9g8v76U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 20.88], [25.0, 29.94], [33.0, 34.03], [44.0, 63.0], [67.0, 67.73]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 30.58, 0.0, 29.91, 0.0], "audiomae_on_audioset": [null, [["music", 85.97], ["reggae", 2.03], ["singing", 0.95]], null, [["music", 90.49], ["howl", 0.79], ["rock and roll", 0.71]], null], "duration": [-0.12, 4.94, 1.03, 19.0, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/uZpvHkGMn5k_filtered.json b/annotations_filtered/uZpvHkGMn5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c731ed2545cc0d9e70824ecad087e67408078436 --- /dev/null +++ b/annotations_filtered/uZpvHkGMn5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[131.0, 141.22], [142.0, 141.78], [145.0, 145.74], [146.0, 151.11], [153.0, 155.21], [161.0, 167.44]], "keep_status": [true, false, false, true, true, true], "silence_prob": [32.02, 0.0, 0.0, 30.15, 30.08, 30.01], "audiomae_on_audioset": [[["speech", 35.7], ["music", 18.71], ["electric shaver, electric razor", 9.21]], null, null, [["music", 60.42], ["didgeridoo", 3.44], ["speech", 3.01]], [["music", 37.53], ["zipper (clothing)", 13.84], ["musical instrument", 7.4]], [["music", 41.89], ["speech", 9.94], ["electric shaver, electric razor", 8.41]]], "duration": [10.22, -0.22, 0.74, 5.11, 2.21, 6.44]} \ No newline at end of file diff --git a/annotations_filtered/u_4L7Dx1rIg_filtered.json b/annotations_filtered/u_4L7Dx1rIg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32d7f5177578ed78736ce4523f795d6b0b0a9e30 --- /dev/null +++ b/annotations_filtered/u_4L7Dx1rIg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 15.72], [19.0, 20.78], [24.0, 28.21], [29.0, 30.21], [34.0, 34.03], [34.0, 35.18], [36.0, 38.91], [41.0, 40.93], [43.0, 44.47], [51.0, 51.54], [53.0, 55.46], [59.0, 59.12], [61.0, 61.3], [65.0, 65.5], [66.0, 67.66], [70.0, 70.83], [72.0, 72.64], [74.0, 74.8], [76.0, 76.94], [78.0, 78.58], [88.0, 91.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 98.99, 0.0, 0.0, 0.0, 72.46, 0.0, 0.0, 0.0, 93.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.28, 1.78, 4.21, 1.21, 0.03, 1.18, 2.91, -0.07, 1.47, 0.54, 2.46, 0.12, 0.3, 0.5, 1.66, 0.83, 0.64, 0.8, 0.94, 0.58, 3.1]} \ No newline at end of file diff --git a/annotations_filtered/u_Bfpbz3owc_filtered.json b/annotations_filtered/u_Bfpbz3owc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6d0fc12e4e67e62e8527dadee75285f652669f7 --- /dev/null +++ b/annotations_filtered/u_Bfpbz3owc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.0], [4.0, 4.58], [9.0, 10.22], [11.0, 11.75], [20.0, 20.7], [26.0, 26.37], [31.0, 32.78], [33.0, 33.05], [36.0, 37.62], [39.0, 39.43], [46.0, 46.6], [50.0, 50.38], [56.0, 57.01], [59.0, 59.21], [61.0, 61.7], [63.0, 63.93], [65.0, 65.5], [69.0, 69.15], [82.0, 83.0], [85.0, 86.37], [88.0, 88.57], [90.0, 90.41], [92.0, 92.01], [107.0, 107.65], [108.0, 109.02], [114.0, 114.32], [116.0, 115.94], [118.0, 118.52], [122.0, 123.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 0.58, 1.22, 0.75, 0.7, 0.37, 1.78, 0.05, 1.62, 0.43, 0.6, 0.38, 1.01, 0.21, 0.7, 0.93, 0.5, 0.15, 1.0, 1.37, 0.57, 0.41, 0.01, 0.65, 1.02, 0.32, -0.06, 0.52, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/u_jemmhoj0Q_filtered.json b/annotations_filtered/u_jemmhoj0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db609cdfc0928c455898c87bc4c4d0b45f05a85d --- /dev/null +++ b/annotations_filtered/u_jemmhoj0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.98], [5.0, 6.62], [16.0, 16.55], [35.0, 36.95], [38.0, 42.04], [44.0, 45.0], [46.0, 60.52], [62.0, 64.49], [65.0, 65.64], [70.0, 70.34], [77.0, 77.08], [82.0, 83.15], [99.0, 99.05], [100.0, 102.29], [103.0, 103.4], [104.0, 104.63], [106.0, 106.25]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.25, 0.0, 31.07, 31.72, 0.0, 0.0, 0.0, 0.0, 0.0, 85.35, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 27.23], ["speech", 16.36], ["buzz", 5.99]], null, [["music", 53.27], ["buzz", 39.28], ["electric shaver, electric razor", 1.75]], [["music", 31.27], ["moo", 7.38], ["speech", 6.53]], null, null, null, null, null, null, null, null, null], "duration": [0.98, 1.62, 0.55, 1.95, 4.04, 1.0, 14.52, 2.49, 0.64, 0.34, 0.08, 1.15, 0.05, 2.29, 0.4, 0.63, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/u_n1SEwWmYc_filtered.json b/annotations_filtered/u_n1SEwWmYc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e82657e480aca04f35e90c91d03c55f19fccb77f --- /dev/null +++ b/annotations_filtered/u_n1SEwWmYc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.05], [6.0, 6.35], [8.0, 8.43], [10.0, 10.66], [17.0, 17.74], [23.0, 22.67], [27.0, 28.26], [41.0, 43.38], [44.0, 45.13], [50.0, 53.74], [54.0, 54.4], [57.0, 59.36], [63.0, 62.83], [64.0, 67.8], [69.0, 69.72], [74.0, 73.7], [76.0, 76.35], [78.0, 80.16], [100.0, 104.33], [105.0, 105.24], [105.0, 106.74], [107.0, 125.19], [130.0, 131.28], [132.0, 141.94], [143.0, 148.93], [149.0, 151.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.29, 0.0, 60.79, 0.0, 53.65, 0.0, 33.01, 0.0, 0.0, 0.0, 42.33, 29.93, 0.0, 0.0, 29.45, 0.0, 29.23, 55.25, 62.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 49.65], ["music", 14.05], ["effects unit", 5.23]], null, null, null, [["music", 68.02], ["speech", 6.16], ["musical instrument", 2.82]], [["speech", 46.49], ["music", 22.61], ["explosion", 6.33]], null, null, [["speech", 44.55], ["music", 13.82], ["sound effect", 5.52]], null, [["speech", 23.04], ["music", 20.82], ["explosion", 19.01]], null, null], "duration": [1.05, 0.35, 0.43, 0.66, 0.74, -0.33, 1.26, 2.38, 1.13, 3.74, 0.4, 2.36, -0.17, 3.8, 0.72, -0.3, 0.35, 2.16, 4.33, 0.24, 1.74, 18.19, 1.28, 9.94, 5.93, 2.01]} \ No newline at end of file diff --git a/annotations_filtered/u_z2ttNkL24_filtered.json b/annotations_filtered/u_z2ttNkL24_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4b6b996ace2e0e6881f79a2eb6a3eadf5d1b84a --- /dev/null +++ b/annotations_filtered/u_z2ttNkL24_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.23], [14.0, 14.57], [15.0, 16.11], [21.0, 26.52], [27.0, 31.53], [33.0, 33.67], [38.0, 38.28], [40.0, 40.71], [41.0, 42.94], [46.0, 50.01], [52.0, 52.61], [53.0, 53.89], [54.0, 54.53], [56.0, 57.79], [60.0, 61.13], [63.0, 64.29], [67.0, 68.18], [69.0, 70.19], [71.0, 73.11], [77.0, 77.57], [82.0, 87.51], [92.0, 96.75], [103.0, 103.65], [108.0, 108.06], [108.0, 110.25], [111.0, 112.4], [116.0, 116.19], [118.0, 119.28], [121.0, 122.0], [122.0, 123.23], [128.0, 135.51], [136.0, 143.73]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 48.44, 75.23, 0.0, 0.0, 0.0, 0.0, 49.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.04, 0.0, 54.7, 47.5, 0.0, 0.0, 49.87, 0.0, 0.0, 0.0, 0.0, 0.0, 59.42, 82.43], "audiomae_on_audioset": [null, null, null, [["mains hum", 54.5], ["hum", 23.21], ["door", 5.72]], null, null, null, null, null, [["mains hum", 28.24], ["speech", 20.75], ["hum", 19.72]], null, null, null, null, null, null, null, null, null, null, null, [["music", 64.79], ["effects unit", 4.1], ["musical instrument", 3.4]], null, null, [["tuning fork", 33.13], ["singing bowl", 17.31], ["speech", 14.56]], null, null, null, null, null, null, null], "duration": [0.23, 0.57, 1.11, 5.52, 4.53, 0.67, 0.28, 0.71, 1.94, 4.01, 0.61, 0.89, 0.53, 1.79, 1.13, 1.29, 1.18, 1.19, 2.11, 0.57, 5.51, 4.75, 0.65, 0.06, 2.25, 1.4, 0.19, 1.28, 1.0, 1.23, 7.51, 7.73]} \ No newline at end of file diff --git a/annotations_filtered/uaDgwjVu8ik_filtered.json b/annotations_filtered/uaDgwjVu8ik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cbcfbd96684abecae7559e909c03e690faab452f --- /dev/null +++ b/annotations_filtered/uaDgwjVu8ik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 77.04], [80.0, 139.16], [140.0, 140.76]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [61.04, 59.16, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/uaLxw2PDnmk_filtered.json b/annotations_filtered/uaLxw2PDnmk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e9bbdd42cb2f833d558ee38bbfad0c7cfb7f8da --- /dev/null +++ b/annotations_filtered/uaLxw2PDnmk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 34.18], [36.0, 78.88], [80.0, 79.95], [89.0, 119.25], [132.0, 132.14], [137.0, 137.57], [139.0, 139.62], [141.0, 141.62], [143.0, 145.96], [150.0, 150.79], [159.0, 164.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [66.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.06, 0.0, 37.35], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 66.3], ["musical instrument", 3.7], ["grunt", 3.11]], null, [["music", 23.23], ["speech", 20.38], ["animal", 6.22]]], "duration": [24.18, 42.88, -0.05, 30.25, 0.14, 0.57, 0.62, 0.62, 2.96, 0.79, 5.61]} \ No newline at end of file diff --git a/annotations_filtered/uabEMv5Sr68_filtered.json b/annotations_filtered/uabEMv5Sr68_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b97298edd6aa3667e42350a56cf0f004d78edf7 --- /dev/null +++ b/annotations_filtered/uabEMv5Sr68_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.83], [16.0, 18.17], [20.0, 21.69], [22.0, 24.07], [25.0, 26.28], [27.0, 27.31], [29.0, 29.3], [30.0, 30.16], [34.0, 34.37], [41.0, 45.05], [45.0, 51.51], [53.0, 53.64], [55.0, 55.66], [58.0, 59.61], [60.0, 60.44], [61.0, 61.3], [62.0, 62.85], [63.0, 63.76], [64.0, 64.56], [65.0, 67.64], [68.0, 68.67], [71.0, 71.49], [72.0, 72.1], [73.0, 74.17], [77.0, 80.13], [81.0, 82.66], [84.0, 85.08], [87.0, 89.73], [91.0, 91.2], [92.0, 92.65], [93.0, 94.74], [95.0, 95.66], [97.0, 97.68], [98.0, 99.96], [101.0, 105.46], [106.0, 107.87], [109.0, 114.83], [115.0, 116.72], [118.0, 120.06], [122.0, 122.59], [124.0, 124.58], [128.0, 129.12], [130.0, 131.43], [133.0, 134.82], [137.0, 138.33], [140.0, 143.36], [144.0, 145.93], [146.0, 147.93], [149.0, 150.08], [151.0, 151.85], [153.0, 155.78], [157.0, 164.19], [165.0, 166.36], [167.0, 169.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.76, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0, 0.0, 78.38, 64.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.11, 0.0, 99.87, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.65, 67.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.83, 2.17, 1.69, 2.07, 1.28, 0.31, 0.3, 0.16, 0.37, 4.05, 6.51, 0.64, 0.66, 1.61, 0.44, 0.3, 0.85, 0.76, 0.56, 2.64, 0.67, 0.49, 0.1, 1.17, 3.13, 1.66, 1.08, 2.73, 0.2, 0.65, 1.74, 0.66, 0.68, 1.96, 4.46, 1.87, 5.83, 1.72, 2.06, 0.59, 0.58, 1.12, 1.43, 1.82, 1.33, 3.36, 1.93, 1.93, 1.08, 0.85, 2.78, 7.19, 1.36, 2.15]} \ No newline at end of file diff --git a/annotations_filtered/uat-LZ3t7i4_filtered.json b/annotations_filtered/uat-LZ3t7i4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da6289a0ae96b8e170bc8b7633910e296e2a5543 --- /dev/null +++ b/annotations_filtered/uat-LZ3t7i4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 13.59], [14.0, 14.05], [15.0, 17.95], [19.0, 30.89], [32.0, 46.08], [47.0, 47.66], [48.0, 65.94], [67.0, 85.38], [86.0, 115.87], [117.0, 116.83], [118.0, 118.59]], "keep_status": [false, false, true, true, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 39.27, 36.34, 37.21, 0.0, 37.67, 37.93, 35.62, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["dog", 24.68], ["animal", 20.71], ["domestic animals, pets", 11.78]], [["music", 27.88], ["hum", 14.19], ["whack, thwack", 6.69]], [["music", 58.3], ["speech", 10.01], ["fart", 7.78]], null, [["music", 53.41], ["hum", 17.4], ["speech", 9.33]], [["music", 38.58], ["didgeridoo", 11.9], ["musical instrument", 6.72]], [["hum", 35.95], ["throbbing", 17.57], ["music", 15.34]], null, null], "duration": [-0.41, 0.05, 2.95, 11.89, 14.08, 0.66, 17.94, 18.38, 29.87, -0.17, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/ubgR8CKyzYw_filtered.json b/annotations_filtered/ubgR8CKyzYw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a7eb9d6817b48ca308826931a59df956d844e0d --- /dev/null +++ b/annotations_filtered/ubgR8CKyzYw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.72], [18.0, 19.65], [25.0, 28.19], [29.0, 29.98], [31.0, 40.19], [42.0, 72.45], [73.0, 76.17], [76.0, 80.67], [81.0, 83.51], [88.0, 89.09], [92.0, 92.28], [93.0, 93.85], [94.0, 94.73], [97.0, 99.67], [100.0, 100.92], [104.0, 104.4], [105.0, 105.54], [106.0, 106.74], [108.0, 108.04], [108.0, 110.2], [111.0, 111.62], [113.0, 113.34], [116.0, 116.99]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 88.83, 0.0, 30.06, 0.0, 98.1, 99.73, 48.65, 0.0, 0.0, 0.0, 0.0, 95.91, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 73.02], ["didgeridoo", 5.48], ["cacophony", 3.5]], null, null, null, [["sidetone", 10.79], ["music", 10.09], ["busy signal", 4.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, 1.65, 3.19, 0.98, 9.19, 30.45, 3.17, 4.67, 2.51, 1.09, 0.28, 0.85, 0.73, 2.67, 0.92, 0.4, 0.54, 0.74, 0.04, 2.2, 0.62, 0.34, 0.99]} \ No newline at end of file diff --git a/annotations_filtered/uc0l3djxQ5Y_filtered.json b/annotations_filtered/uc0l3djxQ5Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e644d21154efaa3727ff258255ac9465b03af01 --- /dev/null +++ b/annotations_filtered/uc0l3djxQ5Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[96.0, 96.99], [100.0, 103.99], [106.0, 108.24], [116.0, 116.46]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 40.09, 55.89, 0.0], "audiomae_on_audioset": [null, [["music", 44.36], ["speech", 12.55], ["throbbing", 8.21]], null, null], "duration": [0.99, 3.99, 2.24, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/ucBnN5N2fn8_filtered.json b/annotations_filtered/ucBnN5N2fn8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac4b4d6d72eb6769198fadeb671ec12dd408c11c --- /dev/null +++ b/annotations_filtered/ucBnN5N2fn8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.78], [15.0, 20.83], [21.0, 23.19], [26.0, 30.59], [32.0, 38.03], [42.0, 42.52], [44.0, 43.97], [45.0, 53.62], [57.0, 57.35], [59.0, 59.81], [62.0, 63.29], [64.0, 63.98], [65.0, 66.51], [67.0, 68.25], [70.0, 70.7], [71.0, 76.23], [77.0, 78.7], [80.0, 80.49], [82.0, 82.31], [83.0, 84.35], [85.0, 87.42], [88.0, 88.97], [92.0, 92.48], [94.0, 94.37], [95.0, 96.13], [97.0, 98.34], [102.0, 102.66], [105.0, 105.95], [109.0, 109.16], [110.0, 113.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [86.64, 100.0, 91.13, 100.0, 99.52, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.55, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.78, 5.83, 2.19, 4.59, 6.03, 0.52, -0.03, 8.62, 0.35, 0.81, 1.29, -0.02, 1.51, 1.25, 0.7, 5.23, 1.7, 0.49, 0.31, 1.35, 2.42, 0.97, 0.48, 0.37, 1.13, 1.34, 0.66, 0.95, 0.16, 3.12]} \ No newline at end of file diff --git a/annotations_filtered/ucQmXLgGIVA_filtered.json b/annotations_filtered/ucQmXLgGIVA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37d8e38691e2cfda4aabd9bbcb5acf2ed899439a --- /dev/null +++ b/annotations_filtered/ucQmXLgGIVA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.61], [13.0, 14.49], [15.0, 18.59], [25.0, 25.57], [29.0, 29.42], [31.0, 31.18], [32.0, 32.59], [34.0, 34.01], [35.0, 35.29], [36.0, 36.41], [51.0, 55.27], [56.0, 60.25], [62.0, 70.29], [75.0, 75.34], [78.0, 78.95], [86.0, 89.28], [95.0, 97.58], [99.0, 102.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [99.21, 0.0, 96.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.44, 100.0, 44.81, 0.0, 0.0, 99.91, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["arrow", 19.95], ["thump, thud", 12.27], ["hum", 9.09]], null, null, null, null, null], "duration": [4.61, 1.49, 3.59, 0.57, 0.42, 0.18, 0.59, 0.01, 0.29, 0.41, 4.27, 4.25, 8.29, 0.34, 0.95, 3.28, 2.58, 3.24]} \ No newline at end of file diff --git a/annotations_filtered/ucYwV7EWIRU_filtered.json b/annotations_filtered/ucYwV7EWIRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce796ac3a49628f773ddbbec27b1ae602dc75efb --- /dev/null +++ b/annotations_filtered/ucYwV7EWIRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 22.84], [25.0, 27.5], [31.0, 60.51], [61.0, 76.0], [80.0, 81.57]], "keep_status": [false, true, false, true, false], "silence_prob": [0.0, 48.39, 30.22, 30.74, 0.0], "audiomae_on_audioset": [null, [["music", 35.41], ["fly, housefly", 8.54], ["musical instrument", 7.76]], [["music", 34.81], ["speech", 33.92], ["explosion", 4.18]], [["music", 34.44], ["speech", 10.23], ["electric shaver, electric razor", 6.4]], null], "duration": [-0.16, 2.5, 29.51, 15.0, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/ucgU2DJlBiw_filtered.json b/annotations_filtered/ucgU2DJlBiw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6253495186e120eff1e3ce344bdeedb7289acc4f --- /dev/null +++ b/annotations_filtered/ucgU2DJlBiw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.64], [23.0, 27.48], [32.0, 32.32], [41.0, 41.61], [42.0, 43.88], [50.0, 51.93], [54.0, 56.79], [60.0, 60.05], [61.0, 61.7], [66.0, 67.39], [69.0, 69.55], [70.0, 71.37], [73.0, 73.08], [74.0, 75.0], [86.0, 87.59], [89.0, 89.4], [98.0, 98.36], [99.0, 99.99], [101.0, 102.22], [104.0, 105.88], [109.0, 109.56], [117.0, 117.64], [119.0, 121.83], [123.0, 124.61], [128.0, 130.92], [132.0, 133.24]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 31.09, 0.0, 0.0, 0.0, 0.0, 69.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.62, 0.0, 41.24, 0.0], "audiomae_on_audioset": [null, [["music", 36.33], ["musical instrument", 13.09], ["synthesizer", 3.95]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 21.24], ["heart sounds, heartbeat", 14.65], ["speech", 7.16]], null, [["whale vocalization", 31.78], ["speech", 11.48], ["hum", 10.23]], null], "duration": [0.64, 4.48, 0.32, 0.61, 1.88, 1.93, 2.79, 0.05, 0.7, 1.39, 0.55, 1.37, 0.08, 1.0, 1.59, 0.4, 0.36, 0.99, 1.22, 1.88, 0.56, 0.64, 2.83, 1.61, 2.92, 1.24]} \ No newline at end of file diff --git a/annotations_filtered/uciRaLsFmfM_filtered.json b/annotations_filtered/uciRaLsFmfM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddee2025c8673fca6ebf31df98d9973dd0077b6e --- /dev/null +++ b/annotations_filtered/uciRaLsFmfM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.05], [32.0, 35.4], [36.0, 39.99], [40.0, 43.43], [44.0, 46.18], [47.0, 60.12], [60.0, 60.49], [61.0, 61.96], [66.0, 66.88], [74.0, 75.19], [78.0, 78.58], [87.0, 88.26], [96.0, 96.33], [112.0, 117.42], [118.0, 119.2], [124.0, 130.84], [133.0, 134.27], [135.0, 135.82]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 71.43, 67.13, 63.96, 84.07, 35.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.45, 0.0, 28.22, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 56.53], ["synthesizer", 4.72], ["hum", 4.55]], null, null, null, null, null, null, null, [["music", 57.75], ["hum", 13.8], ["mains hum", 8.72]], null, [["music", 19.62], ["hum", 17.25], ["throbbing", 11.9]], null, null], "duration": [0.05, 3.4, 3.99, 3.43, 2.18, 13.12, 0.49, 0.96, 0.88, 1.19, 0.58, 1.26, 0.33, 5.42, 1.2, 6.84, 1.27, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/ucikAqewZL4_filtered.json b/annotations_filtered/ucikAqewZL4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8bc2490b55605e20aee3cfa4f6ef405c9ca00be --- /dev/null +++ b/annotations_filtered/ucikAqewZL4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.07]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [1.07]} \ No newline at end of file diff --git a/annotations_filtered/uckdiNJ10LE_filtered.json b/annotations_filtered/uckdiNJ10LE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/uckdiNJ10LE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/ud1tMFmSp2I_filtered.json b/annotations_filtered/ud1tMFmSp2I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a5a118dbcfc0616920cdabfdf44791909ddb2fa --- /dev/null +++ b/annotations_filtered/ud1tMFmSp2I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.08], [5.0, 5.09], [9.0, 9.22], [10.0, 10.61], [13.0, 13.64], [15.0, 15.87], [17.0, 17.37], [19.0, 19.14], [20.0, 20.04], [21.0, 21.34], [22.0, 22.96], [24.0, 24.98], [27.0, 28.31], [30.0, 31.14], [33.0, 34.43], [37.0, 37.23], [42.0, 43.46], [46.0, 46.68], [50.0, 49.99], [51.0, 51.68], [52.0, 52.2], [53.0, 53.65], [55.0, 55.93], [57.0, 58.53], [60.0, 59.8], [61.0, 62.28], [65.0, 65.77], [72.0, 72.52], [73.0, 74.38], [77.0, 77.67], [78.0, 78.73], [80.0, 80.5], [88.0, 88.08], [96.0, 96.3], [98.0, 98.39], [100.0, 100.21], [103.0, 104.08], [105.0, 105.14], [106.0, 106.54], [109.0, 110.69], [115.0, 115.21], [116.0, 116.51], [124.0, 124.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.08, 0.09, 0.22, 0.61, 0.64, 0.87, 0.37, 0.14, 0.04, 0.34, 0.96, 0.98, 1.31, 1.14, 1.43, 0.23, 1.46, 0.68, -0.01, 0.68, 0.2, 0.65, 0.93, 1.53, -0.2, 1.28, 0.77, 0.52, 1.38, 0.67, 0.73, 0.5, 0.08, 0.3, 0.39, 0.21, 1.08, 0.14, 0.54, 1.69, 0.21, 0.51, 0.09]} \ No newline at end of file diff --git a/annotations_filtered/ud1zpHW3ito_filtered.json b/annotations_filtered/ud1zpHW3ito_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66475ec141d783e070b1735307230e3df91e2d50 --- /dev/null +++ b/annotations_filtered/ud1zpHW3ito_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[61.0, 73.31], [74.0, 116.18], [117.0, 118.1], [119.0, 120.9], [121.0, 124.85], [126.0, 127.94], [129.0, 130.49]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [89.9, 0.0, 0.0, 0.0, 55.67, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [12.31, 42.18, 1.1, 1.9, 3.85, 1.94, 1.49]} \ No newline at end of file diff --git a/annotations_filtered/ud421fnpmYs_filtered.json b/annotations_filtered/ud421fnpmYs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..794b307a68e3a29cd9ebe2248df66f01802c0a18 --- /dev/null +++ b/annotations_filtered/ud421fnpmYs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.33], [8.0, 8.67], [11.0, 10.72], [20.0, 21.07], [24.0, 24.39], [24.0, 25.14], [28.0, 29.03], [31.0, 32.78], [33.0, 35.68], [36.0, 36.44], [37.0, 38.38], [46.0, 46.74], [48.0, 48.74], [52.0, 52.62], [53.0, 54.73], [60.0, 60.67], [64.0, 64.05], [68.0, 68.27], [73.0, 73.75], [78.0, 79.3], [80.0, 83.24], [85.0, 84.74], [91.0, 91.89], [94.0, 94.58], [97.0, 97.04], [98.0, 100.38], [106.0, 106.47], [108.0, 107.99], [109.0, 109.56], [112.0, 113.22], [114.0, 115.35], [116.0, 116.6], [118.0, 118.86], [124.0, 127.14], [128.0, 131.45], [132.0, 134.4], [136.0, 136.29], [138.0, 141.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.7, 0.0, 0.0, 0.0, 0.0, 33.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.05, 79.76, 60.6, 0.0, 52.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 32.37], ["explosion", 28.08], ["gunshot, gunfire", 17.47]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 68.51], ["thunk", 9.54], ["explosion", 6.59]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.33, 0.67, -0.28, 1.07, 0.39, 1.14, 1.03, 1.78, 2.68, 0.44, 1.38, 0.74, 0.74, 0.62, 1.73, 0.67, 0.05, 0.27, 0.75, 1.3, 3.24, -0.26, 0.89, 0.58, 0.04, 2.38, 0.47, -0.01, 0.56, 1.22, 1.35, 0.6, 0.86, 3.14, 3.45, 2.4, 0.29, 3.49]} \ No newline at end of file diff --git a/annotations_filtered/udHB3tftPz4_filtered.json b/annotations_filtered/udHB3tftPz4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f489dbda8c72c82bff33a8d146e178795d3aff06 --- /dev/null +++ b/annotations_filtered/udHB3tftPz4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.24], [6.0, 6.27], [9.0, 8.94], [13.0, 13.63], [15.0, 21.63], [34.0, 34.82], [35.0, 36.19], [45.0, 45.84], [48.0, 49.49], [57.0, 57.06], [57.0, 60.69], [61.0, 61.79], [70.0, 73.8], [76.0, 76.55], [80.0, 82.85], [83.0, 84.99], [86.0, 86.02], [87.0, 87.93], [89.0, 90.04], [91.0, 91.86], [93.0, 96.38], [100.0, 110.1], [110.0, 110.96], [113.0, 114.49], [117.0, 117.81], [119.0, 119.67], [122.0, 122.89], [125.0, 128.85]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 39.69, 0.0, 0.0, 0.0, 0.0, 0.0, 31.91, 0.0, 34.08, 0.0, 46.43, 0.0, 0.0, 0.0, 0.0, 0.0, 45.78, 33.08, 0.0, 0.0, 0.0, 0.0, 0.0, 30.43], "audiomae_on_audioset": [null, null, null, null, [["fart", 28.92], ["hum", 12.6], ["hands", 12.02]], null, null, null, null, null, [["speech", 69.61], ["synthesizer", 9.2], ["music", 6.03]], null, [["speech", 77.59], ["radio", 5.56], ["sidetone", 3.65]], null, [["printer", 25.3], ["speech", 12.95], ["sliding door", 3.41]], null, null, null, null, null, [["music", 22.3], ["sidetone", 8.93], ["hum", 8.46]], [["hum", 33.08], ["mains hum", 17.69], ["music", 5.0]], null, null, null, null, null, [["hum", 20.06], ["mains hum", 15.1], ["eruption", 11.73]]], "duration": [0.24, 0.27, -0.06, 0.63, 6.63, 0.82, 1.19, 0.84, 1.49, 0.06, 3.69, 0.79, 3.8, 0.55, 2.85, 1.99, 0.02, 0.93, 1.04, 0.86, 3.38, 10.1, 0.96, 1.49, 0.81, 0.67, 0.89, 3.85]} \ No newline at end of file diff --git a/annotations_filtered/udHPeemZ8zE_filtered.json b/annotations_filtered/udHPeemZ8zE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72a63ce815bb57e2a42e7bfdd884b37041296ed5 --- /dev/null +++ b/annotations_filtered/udHPeemZ8zE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.69], [5.0, 5.95], [9.0, 9.83], [13.0, 13.1], [28.0, 27.67], [43.0, 43.66], [53.0, 53.22], [54.0, 55.85], [57.0, 58.04], [59.0, 60.1], [62.0, 62.41], [67.0, 67.91], [75.0, 75.07], [78.0, 80.74], [82.0, 83.19], [84.0, 85.19], [86.0, 87.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.69, 0.95, 0.83, 0.1, -0.33, 0.66, 0.22, 1.85, 1.04, 1.1, 0.41, 0.91, 0.07, 2.74, 1.19, 1.19, 1.78]} \ No newline at end of file diff --git a/annotations_filtered/udn4UB_EZ1E_filtered.json b/annotations_filtered/udn4UB_EZ1E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48e59429220f916d4f31c123e39d0fbf0265c287 --- /dev/null +++ b/annotations_filtered/udn4UB_EZ1E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.93], [6.0, 6.99], [12.0, 14.05], [23.0, 25.39], [26.0, 27.3], [29.0, 30.25], [40.0, 40.15], [45.0, 47.55], [51.0, 52.51]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 83.34, 58.89, 0.0, 0.0, 0.0, 82.97, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.93, 0.99, 2.05, 2.39, 1.3, 1.25, 0.15, 2.55, 1.51]} \ No newline at end of file diff --git a/annotations_filtered/udwKI7oFT6Y_filtered.json b/annotations_filtered/udwKI7oFT6Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06798a97146d5a58c619795d113dfecb03d7f13b --- /dev/null +++ b/annotations_filtered/udwKI7oFT6Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.94], [11.0, 23.18], [24.0, 24.6], [28.0, 29.83], [32.0, 31.89], [32.0, 36.64], [38.0, 77.03], [79.0, 102.24], [107.0, 111.86]], "keep_status": [false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 35.51, 0.0, 0.0, 0.0, 36.0, 0.0, 31.37, 37.35], "audiomae_on_audioset": [null, [["music", 58.57], ["emergency vehicle", 8.67], ["siren", 6.72]], null, null, null, [["speech", 21.41], ["music", 18.69], ["siren", 17.33]], null, [["speech", 40.82], ["music", 12.92], ["gunshot, gunfire", 5.33]], [["speech", 39.59], ["music", 33.91], ["hum", 4.76]]], "duration": [1.94, 12.18, 0.6, 1.83, -0.11, 4.64, 39.03, 23.24, 4.86]} \ No newline at end of file diff --git a/annotations_filtered/ue0MJQmrIlg_filtered.json b/annotations_filtered/ue0MJQmrIlg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9121d1c4cc02409583a1ba895066bda41670e81e --- /dev/null +++ b/annotations_filtered/ue0MJQmrIlg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 21.74], [27.0, 31.26], [31.0, 32.46], [35.0, 34.97], [36.0, 38.03], [39.0, 39.36], [41.0, 40.91], [42.0, 45.15], [46.0, 59.37], [59.0, 63.46], [64.0, 65.64], [66.0, 66.38], [68.0, 68.86], [73.0, 74.71], [77.0, 85.09], [86.0, 87.66], [89.0, 95.82]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [63.21, 65.2, 0.0, 0.0, 37.47, 0.0, 0.0, 86.27, 51.66, 97.73, 0.0, 0.0, 0.0, 0.0, 65.67, 0.0, 33.79], "audiomae_on_audioset": [null, null, null, null, [["music", 37.02], ["fart", 12.42], ["fly, housefly", 8.42]], null, null, null, null, null, null, null, null, null, null, null, [["music", 46.35], ["speech", 21.86], ["fart", 8.79]]], "duration": [17.74, 4.26, 1.46, -0.03, 2.03, 0.36, -0.09, 3.15, 13.37, 4.46, 1.64, 0.38, 0.86, 1.71, 8.09, 1.66, 6.82]} \ No newline at end of file diff --git a/annotations_filtered/ueAsO0Gq8vI_filtered.json b/annotations_filtered/ueAsO0Gq8vI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1558ec5bb68569a89a41f7da6253394847c8bb1f --- /dev/null +++ b/annotations_filtered/ueAsO0Gq8vI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.39], [8.0, 9.41], [10.0, 11.55], [12.0, 13.47], [14.0, 14.49], [17.0, 17.42], [20.0, 21.12], [22.0, 22.82], [23.0, 24.34], [25.0, 26.11], [27.0, 27.95], [28.0, 30.99], [32.0, 33.44], [34.0, 34.53], [38.0, 41.45], [42.0, 42.69], [43.0, 43.48], [44.0, 47.29], [48.0, 50.82], [55.0, 59.8], [61.0, 63.07], [64.0, 63.88], [72.0, 72.96], [74.0, 74.71], [76.0, 76.6], [77.0, 79.37], [81.0, 89.43], [93.0, 93.7], [95.0, 96.45], [102.0, 116.56], [118.0, 119.97], [122.0, 122.3], [123.0, 125.0], [126.0, 126.33], [127.0, 128.24], [128.0, 129.86], [144.0, 145.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [72.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.9, 0.0, 0.0, 83.34, 0.0, 0.0, 67.25, 72.75, 38.12, 48.95, 0.0, 0.0, 0.0, 0.0, 38.42, 46.33, 0.0, 0.0, 36.72, 0.0, 0.0, 60.42, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 82.4], ["musical instrument", 1.51], ["guitar", 1.18]], [["music", 52.59], ["throbbing", 10.11], ["techno", 4.7]], null, null, null, null, [["music", 39.36], ["speech", 7.8], ["carnatic music", 2.87]], [["music", 41.06], ["bleat", 5.39], ["sheep", 5.3]], null, null, [["music", 50.27], ["bowed string instrument", 7.25], ["musical instrument", 6.78]], null, null, null, null, null, null, null], "duration": [2.39, 1.41, 1.55, 1.47, 0.49, 0.42, 1.12, 0.82, 1.34, 1.11, 0.95, 2.99, 1.44, 0.53, 3.45, 0.69, 0.48, 3.29, 2.82, 4.8, 2.07, -0.12, 0.96, 0.71, 0.6, 2.37, 8.43, 0.7, 1.45, 14.56, 1.97, 0.3, 2.0, 0.33, 1.24, 1.86, 1.69]} \ No newline at end of file diff --git a/annotations_filtered/ueMuCbXkDhw_filtered.json b/annotations_filtered/ueMuCbXkDhw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c63f85aa61055358fef3594b1a2d67b0e0a09ea6 --- /dev/null +++ b/annotations_filtered/ueMuCbXkDhw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.49], [22.0, 22.32], [26.0, 26.45], [32.0, 45.59], [51.0, 53.0], [58.0, 62.92], [67.0, 89.56]], "keep_status": [false, false, false, true, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 31.5, 32.59, 33.58, 45.52], "audiomae_on_audioset": [null, null, null, [["music", 52.83], ["dog", 8.88], ["animal", 7.57]], [["music", 40.12], ["grunt", 11.04], ["musical instrument", 7.68]], [["music", 56.78], ["musical instrument", 7.06], ["synthesizer", 5.9]], [["hum", 34.28], ["music", 26.08], ["throbbing", 11.14]]], "duration": [0.49, 0.32, 0.45, 13.59, 2.0, 4.92, 22.56]} \ No newline at end of file diff --git a/annotations_filtered/ueNjp9QfQFM_filtered.json b/annotations_filtered/ueNjp9QfQFM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5effdc4db58f305da5a3d9f0c7f97b8ee0fcbe17 --- /dev/null +++ b/annotations_filtered/ueNjp9QfQFM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.36], [6.0, 10.98], [13.0, 26.69], [28.0, 30.7], [34.0, 34.2], [36.0, 36.86], [38.0, 38.53], [41.0, 42.65], [43.0, 47.01], [50.0, 55.29], [59.0, 58.97], [65.0, 65.25], [68.0, 67.86], [69.0, 72.67], [79.0, 100.9], [104.0, 117.9], [120.0, 120.53], [124.0, 124.19], [125.0, 125.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [65.55, 74.13, 85.72, 95.51, 0.0, 0.0, 0.0, 0.0, 81.71, 56.4, 0.0, 0.0, 0.0, 81.17, 87.19, 58.64, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.36, 4.98, 13.69, 2.7, 0.2, 0.86, 0.53, 1.65, 4.01, 5.29, -0.03, 0.25, -0.14, 3.67, 21.9, 13.9, 0.53, 0.19, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/ueR0lJzIxWo_filtered.json b/annotations_filtered/ueR0lJzIxWo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a66fef2240f3ad25d37da70df04dc08ff2d8cb5e --- /dev/null +++ b/annotations_filtered/ueR0lJzIxWo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 32.04], [34.0, 35.09], [37.0, 38.33], [40.0, 43.44], [45.0, 58.46], [61.0, 67.14]], "keep_status": [false, false, false, false, false, false], "silence_prob": [91.3, 0.0, 0.0, 100.0, 84.62, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [3.04, 1.09, 1.33, 3.44, 13.46, 6.14]} \ No newline at end of file diff --git a/annotations_filtered/ue_EAEC12X0_filtered.json b/annotations_filtered/ue_EAEC12X0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6c2932f3c2eef459a51a70a056f1cc6cce7d0a9 --- /dev/null +++ b/annotations_filtered/ue_EAEC12X0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.8], [12.0, 13.1], [15.0, 15.55], [19.0, 18.79], [26.0, 27.72], [36.0, 37.05], [43.0, 45.1], [55.0, 54.85], [60.0, 60.37], [74.0, 75.24], [79.0, 91.02], [102.0, 112.16], [113.0, 114.42], [125.0, 125.86], [140.0, 141.45], [143.0, 143.26], [146.0, 145.93], [155.0, 155.83], [157.0, 157.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.63, 0.0, 0.0, 0.0, 47.98, 57.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 81.45], ["bass guitar", 3.89], ["guitar", 3.26]], null, null, null, null, null, null, null, null], "duration": [0.8, 1.1, 0.55, -0.21, 1.72, 1.05, 2.1, -0.15, 0.37, 1.24, 12.02, 10.16, 1.42, 0.86, 1.45, 0.26, -0.07, 0.83, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/uen_1bL_TXc_filtered.json b/annotations_filtered/uen_1bL_TXc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3dfabc411e319448c8a50bf0747f47d6aecd5ef --- /dev/null +++ b/annotations_filtered/uen_1bL_TXc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 16.09], [17.0, 19.7], [21.0, 92.55], [93.0, 105.93], [112.0, 124.23], [128.0, 140.24], [146.0, 146.67], [149.0, 153.76], [155.0, 159.58], [161.0, 163.76], [165.0, 166.65]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [36.25, 46.29, 0.0, 29.89, 29.03, 28.85, 0.0, 92.64, 82.79, 97.0, 0.0], "audiomae_on_audioset": [[["music", 45.95], ["didgeridoo", 24.24], ["speech", 4.64]], [["sidetone", 90.34], ["speech", 1.77], ["radio", 1.41]], null, [["music", 62.47], ["synthetic singing", 7.1], ["boing", 4.4]], [["music", 46.4], ["speech", 44.33], ["throbbing", 0.73]], [["music", 44.03], ["throbbing", 9.35], ["speech", 4.95]], null, null, null, null, null], "duration": [8.09, 2.7, 71.55, 12.93, 12.23, 12.24, 0.67, 4.76, 4.58, 2.76, 1.65]} \ No newline at end of file diff --git a/annotations_filtered/uf-v_lzbcp0_filtered.json b/annotations_filtered/uf-v_lzbcp0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b48c032bdcdbea621e920886f2903066e447aba5 --- /dev/null +++ b/annotations_filtered/uf-v_lzbcp0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 34.38], [37.0, 52.81], [54.0, 59.09], [61.0, 61.15], [62.0, 62.36], [64.0, 86.34], [88.0, 89.28], [93.0, 97.43], [98.0, 104.87], [107.0, 107.72], [110.0, 131.73], [135.0, 157.28]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 31.51, 30.89, 0.0, 0.0, 31.66, 0.0, 29.9, 41.42, 0.0, 72.6, 47.54], "audiomae_on_audioset": [null, [["music", 41.81], ["speech", 28.07], ["throbbing", 7.25]], [["music", 53.03], ["hum", 20.07], ["throbbing", 9.68]], null, null, [["speech", 40.03], ["music", 33.55], ["didgeridoo", 4.14]], null, [["music", 24.23], ["speech", 19.37], ["noise", 10.23]], [["hum", 36.57], ["speech", 18.73], ["throbbing", 15.11]], null, null, [["music", 71.07], ["hum", 4.59], ["echo", 3.14]]], "duration": [33.38, 15.81, 5.09, 0.15, 0.36, 22.34, 1.28, 4.43, 6.87, 0.72, 21.73, 22.28]} \ No newline at end of file diff --git a/annotations_filtered/ufF5p8VBsVk_filtered.json b/annotations_filtered/ufF5p8VBsVk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a414a50192698f84970dc03cfaf424f3960de61a --- /dev/null +++ b/annotations_filtered/ufF5p8VBsVk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 95.07], [95.0, 99.17], [99.0, 102.47], [103.0, 109.29], [110.0, 112.16], [116.0, 118.72]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 75.39, 78.72, 90.6, 87.19, 72.16], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [66.07, 4.17, 3.47, 6.29, 2.16, 2.72]} \ No newline at end of file diff --git a/annotations_filtered/ufllQr0ClXg_filtered.json b/annotations_filtered/ufllQr0ClXg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e85e3b74335ee3d5e95c754db5834f1e1d23d7a7 --- /dev/null +++ b/annotations_filtered/ufllQr0ClXg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 36.02], [40.0, 51.36], [53.0, 54.84], [55.0, 56.12], [59.0, 59.8], [62.0, 62.82], [66.0, 73.21], [73.0, 73.97], [75.0, 84.74], [90.0, 93.46], [95.0, 99.91], [103.0, 103.2], [106.0, 106.44], [115.0, 116.6], [118.0, 127.14], [135.0, 138.81], [139.0, 140.8], [143.0, 143.45], [145.0, 146.47], [148.0, 150.13], [153.0, 159.68], [161.0, 163.49], [169.0, 169.6], [173.0, 174.33], [176.0, 179.85], [186.0, 189.63], [190.0, 191.76], [198.0, 198.61], [203.0, 203.89], [205.0, 205.82], [208.0, 208.5], [209.0, 210.22]], "keep_status": [true, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [42.93, 40.33, 0.0, 0.0, 0.0, 0.0, 73.67, 0.0, 41.7, 49.54, 43.85, 0.0, 0.0, 0.0, 80.29, 51.71, 0.0, 0.0, 0.0, 55.53, 53.28, 76.86, 0.0, 0.0, 52.98, 45.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 45.18], ["synthesizer", 11.49], ["hum", 11.41]], [["fart", 43.07], ["music", 32.18], ["guitar", 3.34]], null, null, null, null, null, null, [["music", 52.21], ["speech", 12.27], ["cattle, bovinae", 4.77]], [["cattle, bovinae", 28.9], ["moo", 21.52], ["livestock, farm animals, working animals", 13.48]], [["music", 28.98], ["speech", 21.65], ["fly, housefly", 5.13]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.06], ["musical instrument", 5.4], ["synthesizer", 5.28]], null, null, null, null, null, null], "duration": [19.02, 11.36, 1.84, 1.12, 0.8, 0.82, 7.21, 0.97, 9.74, 3.46, 4.91, 0.2, 0.44, 1.6, 9.14, 3.81, 1.8, 0.45, 1.47, 2.13, 6.68, 2.49, 0.6, 1.33, 3.85, 3.63, 1.76, 0.61, 0.89, 0.82, 0.5, 1.22]} \ No newline at end of file diff --git a/annotations_filtered/ugXeKGSjvKw_filtered.json b/annotations_filtered/ugXeKGSjvKw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..14e01094992bc7b3ccca1b11f930745907bd322d --- /dev/null +++ b/annotations_filtered/ugXeKGSjvKw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.49], [10.0, 10.66], [11.0, 55.36], [57.0, 62.82], [65.0, 65.47], [65.0, 65.5], [66.0, 71.1]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 35.57, 0.0, 0.0, 33.09], "audiomae_on_audioset": [null, null, null, [["music", 42.49], ["mains hum", 24.91], ["hum", 12.11]], null, null, [["theremin", 34.7], ["music", 21.58], ["noise", 6.74]]], "duration": [0.49, 0.66, 44.36, 5.82, 0.47, 0.5, 5.1]} \ No newline at end of file diff --git a/annotations_filtered/ugm8RMqRSxs_filtered.json b/annotations_filtered/ugm8RMqRSxs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9232a66649842d270a899969404e8271b353c8de --- /dev/null +++ b/annotations_filtered/ugm8RMqRSxs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 27.9], [28.0, 28.17], [28.0, 29.13], [29.0, 34.91], [39.0, 38.55], [39.0, 38.85], [39.0, 47.49], [60.0, 66.77], [68.0, 69.15], [70.0, 71.51], [72.0, 73.57], [75.0, 75.76], [76.0, 75.96], [76.0, 81.65], [91.0, 91.71], [92.0, 93.66], [95.0, 95.66], [119.0, 119.37], [124.0, 124.9], [126.0, 126.59], [127.0, 128.26], [129.0, 130.3], [131.0, 132.19]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.35, 0.0, 0.0, 32.77, 0.0, 0.0, 33.59, 32.68, 0.0, 0.0, 0.0, 0.0, 0.0, 32.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 56.91], ["speech", 15.02], ["throbbing", 4.84]], null, null, [["music", 33.61], ["speech", 21.58], ["hum", 10.58]], null, null, [["music", 39.11], ["theremin", 13.91], ["speech", 10.89]], [["music", 39.48], ["speech", 28.97], ["hum", 4.47]], null, null, null, null, null, [["foghorn", 35.78], ["speech", 26.92], ["music", 19.45]], null, null, null, null, null, null, null, null, null], "duration": [7.9, 0.17, 1.13, 5.91, -0.45, -0.15, 8.49, 6.77, 1.15, 1.51, 1.57, 0.76, -0.04, 5.65, 0.71, 1.66, 0.66, 0.37, 0.9, 0.59, 1.26, 1.3, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/uh677-ClXCY_filtered.json b/annotations_filtered/uh677-ClXCY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb16237a2977cde77c007921050adde83ce2b1d8 --- /dev/null +++ b/annotations_filtered/uh677-ClXCY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.68], [16.0, 16.6], [19.0, 26.43], [28.0, 28.32], [29.0, 35.11], [36.0, 36.53], [38.0, 38.38], [39.0, 39.72], [41.0, 41.72], [43.0, 43.78], [45.0, 45.52], [47.0, 47.78], [49.0, 51.46], [55.0, 55.36], [57.0, 60.61], [62.0, 63.78], [66.0, 67.8], [68.0, 68.96], [70.0, 70.9], [71.0, 71.76], [74.0, 74.26], [76.0, 75.9], [79.0, 84.77], [87.0, 87.07], [88.0, 88.6], [91.0, 91.23], [92.0, 93.07], [95.0, 95.52], [97.0, 98.93], [99.0, 99.42], [100.0, 102.78], [106.0, 106.71], [110.0, 111.32], [118.0, 122.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 50.76, 0.0, 48.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.29, 0.0, 40.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.12, 0.0, 0.0, 30.29], "audiomae_on_audioset": [null, null, null, null, [["music", 61.9], ["hum", 6.45], ["electronic music", 3.92]], null, null, null, null, null, null, null, null, null, [["music", 70.93], ["electronic music", 3.59], ["synthesizer", 3.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 40.32], ["throbbing", 20.55], ["hum", 7.49]]], "duration": [0.68, 0.6, 7.43, 0.32, 6.11, 0.53, 0.38, 0.72, 0.72, 0.78, 0.52, 0.78, 2.46, 0.36, 3.61, 1.78, 1.8, 0.96, 0.9, 0.76, 0.26, -0.1, 5.77, 0.07, 0.6, 0.23, 1.07, 0.52, 1.93, 0.42, 2.78, 0.71, 1.32, 4.67]} \ No newline at end of file diff --git a/annotations_filtered/uhBhYnRrOg4_filtered.json b/annotations_filtered/uhBhYnRrOg4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..679d4a0a7e0a37e62f2cac2e8d25a8e6b861166c --- /dev/null +++ b/annotations_filtered/uhBhYnRrOg4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.07], [17.0, 17.37], [31.0, 39.45], [48.0, 49.84], [51.0, 58.82], [63.0, 70.24], [77.0, 79.89], [88.0, 89.02], [91.0, 92.89], [95.0, 96.03], [98.0, 98.59], [99.0, 120.85]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 35.58, 0.0, 33.05, 35.15, 36.32, 0.0, 0.0, 0.0, 0.0, 32.0], "audiomae_on_audioset": [null, null, [["music", 77.15], ["didgeridoo", 5.04], ["timpani", 1.91]], null, [["music", 47.0], ["synthesizer", 9.34], ["noise", 4.29]], [["cattle, bovinae", 44.84], ["livestock, farm animals, working animals", 29.24], ["moo", 25.88]], [["hum", 24.62], ["throbbing", 19.54], ["music", 8.49]], null, null, null, null, [["speech", 32.85], ["music", 23.47], ["hum", 12.05]]], "duration": [1.07, 0.37, 8.45, 1.84, 7.82, 7.24, 2.89, 1.02, 1.89, 1.03, 0.59, 21.85]} \ No newline at end of file diff --git a/annotations_filtered/uhDhzHrffBQ_filtered.json b/annotations_filtered/uhDhzHrffBQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f571c35ed2df36c4af44b9d71761eafdb038ea2 --- /dev/null +++ b/annotations_filtered/uhDhzHrffBQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.76], [22.0, 26.55], [33.0, 37.57], [42.0, 43.07], [46.0, 46.2], [59.0, 60.91], [62.0, 63.22], [67.0, 71.51], [72.0, 72.79], [75.0, 76.62], [77.0, 77.79], [81.0, 84.57], [85.0, 112.43], [119.0, 145.54], [150.0, 150.63], [151.0, 152.39], [153.0, 154.03], [155.0, 156.09], [165.0, 166.31], [169.0, 169.92], [171.0, 171.91], [173.0, 173.53], [188.0, 188.79], [190.0, 190.46], [193.0, 194.53], [201.0, 202.0], [204.0, 204.26], [205.0, 205.38], [206.0, 206.95], [208.0, 208.6], [211.0, 211.3], [214.0, 214.76], [216.0, 216.21], [218.0, 218.19], [222.0, 222.37], [223.0, 223.67], [224.0, 228.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 29.48, 31.47, 0.0, 0.0, 0.0, 0.0, 36.45, 0.0, 0.0, 0.0, 38.41, 30.43, 29.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.02], "audiomae_on_audioset": [null, [["whip", 52.98], ["speech", 16.73], ["meow", 2.89]], [["speech", 48.8], ["boing", 28.62], ["cacophony", 2.74]], null, null, null, null, [["music", 61.85], ["speech", 5.71], ["foghorn", 3.57]], null, null, null, [["music", 51.98], ["hum", 7.82], ["throbbing", 7.23]], [["music", 78.2], ["speech", 4.55], ["drum machine", 3.46]], [["music", 30.02], ["speech", 16.33], ["smash, crash", 7.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 27.3], ["whale vocalization", 10.85], ["animal", 8.31]]], "duration": [0.76, 4.55, 4.57, 1.07, 0.2, 1.91, 1.22, 4.51, 0.79, 1.62, 0.79, 3.57, 27.43, 26.54, 0.63, 1.39, 1.03, 1.09, 1.31, 0.92, 0.91, 0.53, 0.79, 0.46, 1.53, 1.0, 0.26, 0.38, 0.95, 0.6, 0.3, 0.76, 0.21, 0.19, 0.37, 0.67, 4.53]} \ No newline at end of file diff --git a/annotations_filtered/uhH9ewIEbnU_filtered.json b/annotations_filtered/uhH9ewIEbnU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be41d53b94f7dbf6ed1724c12a2126156d3cd479 --- /dev/null +++ b/annotations_filtered/uhH9ewIEbnU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.47], [20.0, 21.46], [37.0, 37.37], [47.0, 47.83], [59.0, 60.51], [72.0, 75.17], [77.0, 77.23], [82.0, 82.43], [87.0, 89.36], [93.0, 94.31], [95.0, 95.99], [100.0, 101.76], [102.0, 102.54], [104.0, 107.05], [108.0, 109.02], [111.0, 113.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 81.89, 0.0, 0.0, 89.19, 0.0, 0.0, 0.0, 0.0, 94.95, 0.0, 80.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 1.46, 0.37, 0.83, 1.51, 3.17, 0.23, 0.43, 2.36, 1.31, 0.99, 1.76, 0.54, 3.05, 1.02, 2.43]} \ No newline at end of file diff --git a/annotations_filtered/uhkfz535fR8_filtered.json b/annotations_filtered/uhkfz535fR8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cccd5f7956540169ffb16c697acffa59d9b9f408 --- /dev/null +++ b/annotations_filtered/uhkfz535fR8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.57], [4.0, 4.78], [6.0, 16.56], [18.0, 20.44], [23.0, 23.84], [26.0, 72.67], [75.0, 75.36], [78.0, 79.42], [81.0, 81.11], [82.0, 83.03], [84.0, 83.86], [87.0, 87.37], [89.0, 91.37], [92.0, 109.48], [111.0, 110.74], [112.0, 114.08], [115.0, 115.25], [116.0, 130.54], [136.0, 145.18], [147.0, 147.36], [151.0, 180.54]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 35.71, 40.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.14, 34.22, 0.0, 55.96, 0.0, 33.35, 32.42, 0.0, 33.52], "audiomae_on_audioset": [null, null, [["music", 20.23], ["hum", 12.72], ["vehicle", 8.52]], [["speech", 66.03], ["vehicle", 4.75], ["hum", 4.23]], null, null, null, null, null, null, null, null, [["music", 31.23], ["buzz", 13.23], ["hum", 6.63]], [["throbbing", 23.25], ["music", 19.22], ["hum", 17.84]], null, null, null, [["speech", 45.28], ["music", 31.89], ["didgeridoo", 14.71]], [["music", 49.53], ["throbbing", 7.92], ["drum and bass", 4.51]], null, [["music", 20.37], ["throbbing", 13.07], ["speech", 12.91]]], "duration": [1.57, 0.78, 10.56, 2.44, 0.84, 46.67, 0.36, 1.42, 0.11, 1.03, -0.14, 0.37, 2.37, 17.48, -0.26, 2.08, 0.25, 14.54, 9.18, 0.36, 29.54]} \ No newline at end of file diff --git a/annotations_filtered/uhpknFQJ7G0_filtered.json b/annotations_filtered/uhpknFQJ7G0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d02de13337b4085c6b9352581c44ce69a0857963 --- /dev/null +++ b/annotations_filtered/uhpknFQJ7G0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.75], [2.0, 3.67], [4.0, 5.07], [15.0, 15.4], [18.0, 18.64], [39.0, 39.5], [41.0, 42.62], [44.0, 46.36], [48.0, 49.92], [51.0, 53.37], [57.0, 57.89], [59.0, 61.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.09, 0.0, 53.1, 0.0, 77.87], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.75, 1.67, 1.07, 0.4, 0.64, 0.5, 1.62, 2.36, 1.92, 2.37, 0.89, 2.03]} \ No newline at end of file diff --git a/annotations_filtered/ui3pnIeA_HM_filtered.json b/annotations_filtered/ui3pnIeA_HM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a8f047c1182535886f779474e60815415fd767d --- /dev/null +++ b/annotations_filtered/ui3pnIeA_HM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 24.31], [25.0, 24.97], [25.0, 36.85], [38.0, 38.67], [40.0, 43.51], [45.0, 45.13], [47.0, 48.02], [51.0, 58.36], [60.0, 61.1], [62.0, 63.88], [77.0, 77.11], [77.0, 77.55], [78.0, 77.67], [78.0, 77.95], [79.0, 79.96], [82.0, 83.22], [84.0, 86.24], [88.0, 88.99], [90.0, 91.02], [98.0, 101.04], [102.0, 103.01], [104.0, 104.67], [108.0, 108.51], [111.0, 112.08], [114.0, 115.91], [119.0, 120.65], [121.0, 122.07], [123.0, 127.67], [129.0, 129.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.31, 0.0, 87.55, 0.0, 53.53, 0.0, 0.0, 53.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.24, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.83, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.31, -0.03, 11.85, 0.67, 3.51, 0.13, 1.02, 7.36, 1.1, 1.88, 0.11, 0.55, -0.33, -0.05, 0.96, 1.22, 2.24, 0.99, 1.02, 3.04, 1.01, 0.67, 0.51, 1.08, 1.91, 1.65, 1.07, 4.67, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/uifDWAJ6rBY_filtered.json b/annotations_filtered/uifDWAJ6rBY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/uifDWAJ6rBY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/uiik3zS4y4I_filtered.json b/annotations_filtered/uiik3zS4y4I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e69b4befdddd4530d4a4b46114ad5b8eca223db --- /dev/null +++ b/annotations_filtered/uiik3zS4y4I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.5], [4.0, 3.64], [17.0, 20.53], [24.0, 26.27], [29.0, 30.28], [31.0, 31.14], [32.0, 32.21], [34.0, 34.21], [35.0, 36.17], [40.0, 40.58], [41.0, 43.58], [46.0, 46.65], [53.0, 53.86], [56.0, 55.95], [63.0, 64.2], [71.0, 71.31], [75.0, 76.49], [80.0, 79.68], [84.0, 88.79], [91.0, 91.17], [93.0, 96.65], [102.0, 103.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 50.31, 54.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.64, 0.0, 38.23, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 39.88], ["baby laughter", 10.78], ["bleat", 3.98]], null], "duration": [0.5, -0.36, 3.53, 2.27, 1.28, 0.14, 0.21, 0.21, 1.17, 0.58, 2.58, 0.65, 0.86, -0.05, 1.2, 0.31, 1.49, -0.32, 4.79, 0.17, 3.65, 1.54]} \ No newline at end of file diff --git a/annotations_filtered/uioT_3dqzXc_filtered.json b/annotations_filtered/uioT_3dqzXc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b100f32339e89a162d98af56091b99747d93d7d7 --- /dev/null +++ b/annotations_filtered/uioT_3dqzXc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.26], [12.0, 31.35], [31.0, 33.72], [35.0, 60.02], [63.0, 89.88], [92.0, 104.67], [107.0, 109.05], [109.0, 109.63]], "keep_status": [true, false, true, true, true, false, true, false], "silence_prob": [30.5, 29.77, 29.73, 30.44, 29.92, 30.26, 30.15, 0.0], "audiomae_on_audioset": [[["music", 35.28], ["mains hum", 17.17], ["musical instrument", 10.04]], [["speech", 79.54], ["vehicle", 7.05], ["music", 3.18]], [["speech", 27.78], ["music", 10.51], ["didgeridoo", 5.97]], [["explosion", 23.35], ["music", 20.66], ["burst, pop", 8.47]], [["music", 47.06], ["hum", 12.6], ["throbbing", 6.13]], [["hum", 46.63], ["mains hum", 39.95], ["throbbing", 5.11]], [["music", 41.82], ["synthesizer", 7.8], ["musical instrument", 7.72]], null], "duration": [2.26, 19.35, 2.72, 25.02, 26.88, 12.67, 2.05, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/uirBWk-qd9A_filtered.json b/annotations_filtered/uirBWk-qd9A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f6c20ab32470074de2e444006df3a96433ea0d3 --- /dev/null +++ b/annotations_filtered/uirBWk-qd9A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.59], [18.0, 20.66], [21.0, 26.57], [29.0, 30.11], [30.0, 31.7], [33.0, 34.26], [35.0, 36.32], [40.0, 40.93], [42.0, 42.82], [44.0, 50.5], [51.0, 51.78], [54.0, 54.3], [55.0, 56.29], [62.0, 63.26], [65.0, 65.6], [67.0, 66.92], [67.0, 77.03], [79.0, 84.37], [85.0, 85.09], [85.0, 86.78], [91.0, 92.3]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.81, 35.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.83, 30.36, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 27.72], ["musical instrument", 10.86], ["guitar", 6.49]], [["music", 52.5], ["guitar", 8.1], ["plucked string instrument", 7.01]], null, null, null, null, null, null, [["music", 54.31], ["effects unit", 11.67], ["guitar", 6.1]], null, null, null, null, null, null, [["music", 74.29], ["theremin", 4.28], ["didgeridoo", 4.27]], [["music", 77.44], ["synthesizer", 7.53], ["chorus effect", 1.58]], null, null, null], "duration": [0.59, 2.66, 5.57, 1.11, 1.7, 1.26, 1.32, 0.93, 0.82, 6.5, 0.78, 0.3, 1.29, 1.26, 0.6, -0.08, 10.03, 5.37, 0.09, 1.78, 1.3]} \ No newline at end of file diff --git a/annotations_filtered/uiy-sT9JgRo_filtered.json b/annotations_filtered/uiy-sT9JgRo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..176ae75bf552e31a6505dd8e895d581b5ca7f911 --- /dev/null +++ b/annotations_filtered/uiy-sT9JgRo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.71], [11.0, 11.08], [15.0, 17.02], [18.0, 20.43], [22.0, 27.33], [29.0, 29.91], [31.0, 32.51], [33.0, 39.26], [42.0, 44.25], [45.0, 46.63], [49.0, 49.89], [51.0, 61.1], [63.0, 64.2], [66.0, 66.43], [68.0, 68.71], [69.0, 69.87], [71.0, 74.43], [76.0, 82.83], [85.0, 85.83], [87.0, 87.79], [90.0, 90.85], [92.0, 93.88], [95.0, 96.04], [101.0, 101.92], [105.0, 105.87], [109.0, 110.2], [114.0, 114.86], [117.0, 118.17]], "keep_status": [true, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.09, 0.0, 45.72, 46.05, 42.86, 0.0, 0.0, 44.04, 59.96, 0.0, 0.0, 37.55, 0.0, 0.0, 0.0, 0.0, 39.77, 34.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["whale vocalization", 30.01], ["speech", 18.9], ["music", 8.63]], null, [["music", 28.69], ["frog", 11.83], ["speech", 3.51]], [["cough", 15.22], ["music", 14.65], ["singing bowl", 13.61]], [["music", 43.46], ["effects unit", 8.79], ["guitar", 7.58]], null, null, [["music", 36.35], ["speech", 22.99], ["hum", 11.96]], null, null, null, [["music", 70.61], ["guitar", 2.45], ["plucked string instrument", 2.2]], null, null, null, null, [["music", 54.57], ["harp", 5.23], ["musical instrument", 3.87]], [["music", 44.6], ["hum", 17.6], ["speech", 13.1]], null, null, null, null, null, null, null, null, null, null], "duration": [3.71, 0.08, 2.02, 2.43, 5.33, 0.91, 1.51, 6.26, 2.25, 1.63, 0.89, 10.1, 1.2, 0.43, 0.71, 0.87, 3.43, 6.83, 0.83, 0.79, 0.85, 1.88, 1.04, 0.92, 0.87, 1.2, 0.86, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/uj8ftsuP8T4_filtered.json b/annotations_filtered/uj8ftsuP8T4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e835b0304ca5ed7a7c8a2ccad087d5fbf47ccf0 --- /dev/null +++ b/annotations_filtered/uj8ftsuP8T4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.11], [6.0, 15.33]], "keep_status": [false, true], "silence_prob": [36.6, 39.58], "audiomae_on_audioset": [[["music", 54.62], ["speech", 32.2], ["thunk", 1.71]], [["music", 41.34], ["speech", 9.73], ["synthesizer", 8.75]]], "duration": [3.11, 9.33]} \ No newline at end of file diff --git a/annotations_filtered/ujA70PK6E7U_filtered.json b/annotations_filtered/ujA70PK6E7U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88ea73b7346adc368fc7f60ff8c6b76933616df1 --- /dev/null +++ b/annotations_filtered/ujA70PK6E7U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 34.38], [36.0, 45.94], [47.0, 53.16], [57.0, 58.9], [64.0, 123.08], [126.0, 152.91], [156.0, 156.47]], "keep_status": [false, true, true, false, false, true, false], "silence_prob": [31.18, 30.85, 32.23, 0.0, 0.0, 30.0, 0.0], "audiomae_on_audioset": [[["speech", 67.57], ["whale vocalization", 19.21], ["music", 7.58]], [["whale vocalization", 30.79], ["vehicle", 11.63], ["music", 11.51]], [["whale vocalization", 23.94], ["music", 20.2], ["speech", 14.29]], null, null, [["speech", 51.95], ["music", 11.4], ["hum", 3.84]], null], "duration": [29.38, 9.94, 6.16, 1.9, 59.08, 26.91, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/ujEbejephNM_filtered.json b/annotations_filtered/ujEbejephNM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebad34aeb3acb5f0b114a9191dcdb5dc23d67dab --- /dev/null +++ b/annotations_filtered/ujEbejephNM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.48], [12.0, 12.53], [13.0, 13.78], [16.0, 16.6], [17.0, 17.79], [21.0, 21.32], [22.0, 22.1], [28.0, 28.02], [39.0, 39.26], [43.0, 46.38], [49.0, 54.75], [57.0, 57.75], [59.0, 61.16], [64.0, 64.94], [67.0, 67.71], [75.0, 77.33], [82.0, 82.54], [85.0, 85.56], [101.0, 103.01], [103.0, 103.72], [107.0, 108.26], [110.0, 110.88], [115.0, 114.96], [115.0, 117.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 100.0, 0.0, 0.0, 67.25, 0.0, 0.0, 78.21, 0.0, 0.0, 0.0, 0.0, 84.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.48, 0.53, 0.78, 0.6, 0.79, 0.32, 0.1, 0.02, 0.26, 3.38, 5.75, 0.75, 2.16, 0.94, 0.71, 2.33, 0.54, 0.56, 2.01, 0.72, 1.26, 0.88, -0.04, 2.56]} \ No newline at end of file diff --git a/annotations_filtered/ujFOaYo5QME_filtered.json b/annotations_filtered/ujFOaYo5QME_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae66a4e076bd52964c073a6ec64a4d579f3d0a76 --- /dev/null +++ b/annotations_filtered/ujFOaYo5QME_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.51], [11.0, 12.39], [20.0, 20.58], [23.0, 23.9], [24.0, 24.02], [29.0, 29.54], [37.0, 37.64], [40.0, 40.36], [48.0, 48.88], [59.0, 59.75], [69.0, 69.16], [71.0, 71.9], [74.0, 74.46], [77.0, 77.67], [80.0, 80.43], [89.0, 89.23], [93.0, 93.77], [98.0, 98.41], [102.0, 102.47], [106.0, 106.05], [109.0, 109.05], [110.0, 110.52], [124.0, 124.56], [126.0, 126.69], [130.0, 130.47], [133.0, 134.23], [145.0, 145.35], [153.0, 153.54], [159.0, 159.7], [165.0, 165.4], [167.0, 167.63], [169.0, 168.89], [171.0, 171.17], [173.0, 173.72], [181.0, 181.28], [185.0, 185.95], [189.0, 189.67], [191.0, 191.81], [195.0, 195.1], [196.0, 196.82], [201.0, 202.15], [203.0, 202.88], [204.0, 204.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.51, 1.39, 0.58, 0.9, 0.02, 0.54, 0.64, 0.36, 0.88, 0.75, 0.16, 0.9, 0.46, 0.67, 0.43, 0.23, 0.77, 0.41, 0.47, 0.05, 0.05, 0.52, 0.56, 0.69, 0.47, 1.23, 0.35, 0.54, 0.7, 0.4, 0.63, -0.11, 0.17, 0.72, 0.28, 0.95, 0.67, 0.81, 0.1, 0.82, 1.15, -0.12, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/ujFUQwcAQ7w_filtered.json b/annotations_filtered/ujFUQwcAQ7w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6625bd202bd3400e98fe0a31303d926eaebf102 --- /dev/null +++ b/annotations_filtered/ujFUQwcAQ7w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.69], [15.0, 15.57], [17.0, 18.44], [20.0, 21.17], [23.0, 24.26], [27.0, 31.83], [33.0, 34.6], [35.0, 38.33], [40.0, 44.1], [45.0, 58.51], [59.0, 62.99], [63.0, 67.81], [68.0, 72.08], [73.0, 79.34], [80.0, 84.11], [85.0, 93.92], [94.0, 97.58], [100.0, 100.5], [102.0, 105.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 90.78, 0.0, 99.21, 100.0, 85.35, 72.46, 70.02, 68.28, 62.68, 97.73, 97.54, 90.25, 0.0, 76.2], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.69, 0.57, 1.44, 1.17, 1.26, 4.83, 1.6, 3.33, 4.1, 13.51, 3.99, 4.81, 4.08, 6.34, 4.11, 8.92, 3.58, 0.5, 3.27]} \ No newline at end of file diff --git a/annotations_filtered/ujX0y3zcvP8_filtered.json b/annotations_filtered/ujX0y3zcvP8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e783c56cbbba764d4527340fc475d3e770036567 --- /dev/null +++ b/annotations_filtered/ujX0y3zcvP8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.89], [9.0, 23.26], [24.0, 24.93], [29.0, 35.68]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 54.04, 0.0, 37.24], "audiomae_on_audioset": [null, null, null, [["speech", 31.82], ["music", 29.78], ["throbbing", 11.21]]], "duration": [0.89, 14.26, 0.93, 6.68]} \ No newline at end of file diff --git a/annotations_filtered/ujcglOdwI1E_filtered.json b/annotations_filtered/ujcglOdwI1E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c61a3604f6c7f58ca08c67e14cc9e426685ee451 --- /dev/null +++ b/annotations_filtered/ujcglOdwI1E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 29.05], [29.0, 30.23], [33.0, 36.56], [38.0, 38.47], [45.0, 45.47], [46.0, 50.3], [51.0, 51.88], [53.0, 53.69], [65.0, 66.82], [68.0, 75.57], [79.0, 84.18], [85.0, 97.97]], "keep_status": [false, false, false, false, false, true, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 57.25, 0.0, 0.0, 37.66, 0.0, 0.0, 0.0, 33.97, 29.08, 29.22], "audiomae_on_audioset": [null, null, null, null, null, [["mains hum", 18.29], ["hum", 12.95], ["whale vocalization", 11.62]], null, null, null, [["music", 40.21], ["hum", 12.46], ["static", 7.34]], [["music", 27.35], ["didgeridoo", 15.53], ["mains hum", 12.71]], [["music", 72.39], ["throbbing", 4.59], ["skateboard", 2.9]]], "duration": [0.05, 1.23, 3.56, 0.47, 0.47, 4.3, 0.88, 0.69, 1.82, 7.57, 5.18, 12.97]} \ No newline at end of file diff --git a/annotations_filtered/ujgbo-_khSM_filtered.json b/annotations_filtered/ujgbo-_khSM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e585bc48ac1a08ca6f2f02ee3cc046e4cbff20c4 --- /dev/null +++ b/annotations_filtered/ujgbo-_khSM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 11.89], [12.0, 13.05], [14.0, 16.46], [27.0, 27.28], [31.0, 31.65], [32.0, 37.61], [43.0, 44.15], [46.0, 45.81], [49.0, 49.94], [56.0, 56.15], [76.0, 76.54], [82.0, 82.05], [88.0, 88.7], [91.0, 91.0], [92.0, 92.79], [97.0, 97.24], [100.0, 103.03], [104.0, 105.44], [107.0, 113.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [63.53, 0.0, 90.95, 0.0, 0.0, 54.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 38.06], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.93], ["fart", 38.79], ["inside, small room", 2.14]]], "duration": [9.89, 1.05, 2.46, 0.28, 0.65, 5.61, 1.15, -0.19, 0.94, 0.15, 0.54, 0.05, 0.7, 0.0, 0.79, 0.24, 3.03, 1.44, 6.98]} \ No newline at end of file diff --git a/annotations_filtered/ujhXgFBjcZA_filtered.json b/annotations_filtered/ujhXgFBjcZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5e3b2687c3b0542f1b9696915731abffad857fb --- /dev/null +++ b/annotations_filtered/ujhXgFBjcZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.83], [10.0, 42.5], [43.0, 44.27], [51.0, 54.5], [57.0, 57.82], [61.0, 62.28], [65.0, 65.7], [69.0, 69.58], [71.0, 71.46], [74.0, 74.93], [76.0, 79.0], [81.0, 82.29], [83.0, 84.27], [85.0, 85.85], [87.0, 93.56], [95.0, 101.02], [102.0, 102.63], [104.0, 107.28], [108.0, 111.38], [112.0, 112.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [47.16, 0.0, 0.0, 97.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.57, 0.0, 0.0, 0.0, 36.0, 87.0, 0.0, 57.64, 38.97, 0.0], "audiomae_on_audioset": [[["music", 57.54], ["throbbing", 16.97], ["hum", 7.17]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 49.89], ["throbbing", 6.95], ["hum", 6.28]], null, null, null, [["music", 44.54], ["speech", 16.76], ["synthesizer", 7.49]], null], "duration": [4.83, 32.5, 1.27, 3.5, 0.82, 1.28, 0.7, 0.58, 0.46, 0.93, 3.0, 1.29, 1.27, 0.85, 6.56, 6.02, 0.63, 3.28, 3.38, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/ujxDA9VsQG4_filtered.json b/annotations_filtered/ujxDA9VsQG4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ce2828141af6cecdd0552125d27c031625d1898 --- /dev/null +++ b/annotations_filtered/ujxDA9VsQG4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.71], [7.0, 8.09], [9.0, 9.53], [10.0, 27.24], [30.0, 30.69], [32.0, 46.6], [50.0, 51.26], [53.0, 54.28], [56.0, 57.3], [60.0, 61.79], [63.0, 64.2], [68.0, 68.79], [70.0, 70.9], [72.0, 73.08], [74.0, 74.87], [76.0, 77.63], [84.0, 84.13], [87.0, 90.27], [91.0, 92.38], [94.0, 96.38], [98.0, 100.08], [101.0, 101.75], [102.0, 103.55], [106.0, 105.95], [106.0, 107.06], [114.0, 113.98], [119.0, 119.28], [119.0, 144.56], [147.0, 147.39], [150.0, 150.55], [165.0, 166.06], [167.0, 167.75], [169.0, 170.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 97.64, 0.0, 45.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.55, 0.0, 32.19, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.12, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["sidetone", 55.11], ["speech", 29.21], ["radio", 2.54]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 17.52], ["speech", 14.63], ["fart", 7.55]], null, null, null, null, null, null, null, [["speech", 59.19], ["beatboxing", 13.98], ["wail, moan", 5.12]], null, null, null, null, null], "duration": [1.71, 1.09, 0.53, 17.24, 0.69, 14.6, 1.26, 1.28, 1.3, 1.79, 1.2, 0.79, 0.9, 1.08, 0.87, 1.63, 0.13, 3.27, 1.38, 2.38, 2.08, 0.75, 1.55, -0.05, 1.06, -0.02, 0.28, 25.56, 0.39, 0.55, 1.06, 0.75, 1.24]} \ No newline at end of file diff --git a/annotations_filtered/uk04S-0HOXY_filtered.json b/annotations_filtered/uk04S-0HOXY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd67f50437c39ed28b2e442d51e846f6dfd6fea3 --- /dev/null +++ b/annotations_filtered/uk04S-0HOXY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 46.53], [49.0, 103.62]], "keep_status": [false, false], "silence_prob": [67.38, 0.0], "audiomae_on_audioset": [null, null], "duration": [20.53, 54.62]} \ No newline at end of file diff --git a/annotations_filtered/ukNsgDQKqfY_filtered.json b/annotations_filtered/ukNsgDQKqfY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..619b0d6e206fe10fe2269b316bcb25f671a62327 --- /dev/null +++ b/annotations_filtered/ukNsgDQKqfY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 44.74], [47.0, 52.22], [53.0, 90.26], [91.0, 91.96], [93.0, 94.07]], "keep_status": [true, false, false, false, false], "silence_prob": [32.13, 41.58, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 38.72], ["quack", 12.22], ["trombone", 3.73]], [["music", 59.62], ["didgeridoo", 11.51], ["musical instrument", 4.55]], null, null, null], "duration": [14.74, 5.22, 37.26, 0.96, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/ukOx2hZvXkE_filtered.json b/annotations_filtered/ukOx2hZvXkE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5faf15604807958f07b43155c70eb357f8efa8eb --- /dev/null +++ b/annotations_filtered/ukOx2hZvXkE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.28], [6.0, 8.5], [11.0, 11.03], [14.0, 14.44], [19.0, 19.26], [21.0, 21.2], [28.0, 29.71], [33.0, 34.89], [36.0, 36.8], [39.0, 42.5], [43.0, 47.43], [48.0, 54.21], [56.0, 56.62], [58.0, 62.04], [67.0, 67.8], [70.0, 72.35], [77.0, 77.72], [79.0, 79.52], [82.0, 82.9], [85.0, 86.37], [88.0, 89.09], [91.0, 91.32], [93.0, 93.97], [96.0, 96.87], [99.0, 103.06], [104.0, 106.37], [110.0, 110.59], [115.0, 116.55], [117.0, 118.39], [119.0, 121.86], [122.0, 123.31], [126.0, 127.58], [129.0, 128.9], [131.0, 131.55], [132.0, 133.27], [136.0, 135.75], [138.0, 137.76], [141.0, 141.0], [142.0, 142.3], [143.0, 145.83], [147.0, 147.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.8, 100.0, 100.0, 0.0, 87.19, 0.0, 95.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.68, 99.59, 0.0, 0.0, 0.0, 92.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.28, 2.5, 0.03, 0.44, 0.26, 0.2, 1.71, 1.89, 0.8, 3.5, 4.43, 6.21, 0.62, 4.04, 0.8, 2.35, 0.72, 0.52, 0.9, 1.37, 1.09, 0.32, 0.97, 0.87, 4.06, 2.37, 0.59, 1.55, 1.39, 2.86, 1.31, 1.58, -0.1, 0.55, 1.27, -0.25, -0.24, 0.0, 0.3, 2.83, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/uki4lrLzRaU_filtered.json b/annotations_filtered/uki4lrLzRaU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d69f4a6683489821cacd6bde8c2b92f1a71089cd --- /dev/null +++ b/annotations_filtered/uki4lrLzRaU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.23], [8.0, 20.21], [22.0, 23.82], [26.0, 26.79], [28.0, 29.67], [30.0, 57.96], [59.0, 61.86], [64.0, 69.38], [71.0, 72.5], [74.0, 74.56], [76.0, 83.83], [86.0, 87.44], [89.0, 90.14], [91.0, 92.74], [94.0, 112.18], [118.0, 123.69], [127.0, 138.94], [144.0, 150.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [53.84, 95.51, 0.0, 0.0, 0.0, 99.56, 99.78, 95.23, 0.0, 0.0, 73.21, 0.0, 0.0, 0.0, 63.74, 39.12, 54.36, 93.76], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["vehicle", 19.93], ["buzz", 18.07], ["hum", 8.35]], null, null], "duration": [2.23, 12.21, 1.82, 0.79, 1.67, 27.96, 2.86, 5.38, 1.5, 0.56, 7.83, 1.44, 1.14, 1.74, 18.18, 5.69, 11.94, 6.11]} \ No newline at end of file diff --git a/annotations_filtered/ukl9qBvRXfc_filtered.json b/annotations_filtered/ukl9qBvRXfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bbd14d2ddec900c794c374b7e753d8d97d99caf5 --- /dev/null +++ b/annotations_filtered/ukl9qBvRXfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.33], [4.0, 4.09], [8.0, 9.04], [20.0, 27.06], [28.0, 28.14], [33.0, 33.35], [45.0, 46.06], [50.0, 53.94], [55.0, 54.94], [59.0, 61.15], [62.0, 62.01], [102.0, 102.24], [112.0, 112.92], [118.0, 119.48], [121.0, 121.51], [122.0, 123.4], [128.0, 128.71], [130.0, 131.95], [137.0, 140.68], [142.0, 145.93], [148.0, 149.3], [150.0, 150.3], [155.0, 159.92], [161.0, 161.92], [162.0, 167.68]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.32, 0.0, 0.0, 0.0, 42.93, 0.0, 36.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.54, 34.4, 0.0, 0.0, 41.87, 0.0, 45.27], "audiomae_on_audioset": [null, null, null, [["music", 47.57], ["speech", 28.52], ["electronic music", 3.06]], null, null, null, [["speech", 42.82], ["music", 22.25], ["wood", 2.14]], null, [["music", 54.42], ["synthesizer", 3.23], ["hum", 1.81]], null, null, null, null, null, null, null, null, null, [["music", 46.51], ["speech", 32.22], ["musical instrument", 2.09]], null, null, [["moo", 25.69], ["music", 19.6], ["cattle, bovinae", 18.95]], null, [["music", 50.11], ["ambient music", 29.17], ["electronic music", 4.41]]], "duration": [0.33, 0.09, 1.04, 7.06, 0.14, 0.35, 1.06, 3.94, -0.06, 2.15, 0.01, 0.24, 0.92, 1.48, 0.51, 1.4, 0.71, 1.95, 3.68, 3.93, 1.3, 0.3, 4.92, 0.92, 5.68]} \ No newline at end of file diff --git a/annotations_filtered/ukmrk8JdGxk_filtered.json b/annotations_filtered/ukmrk8JdGxk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..607fa6a718c27b3bafd4b54af7d9399c4baf38d8 --- /dev/null +++ b/annotations_filtered/ukmrk8JdGxk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.43], [6.0, 7.77], [18.0, 19.26], [23.0, 22.96], [24.0, 26.4], [30.0, 31.06], [34.0, 34.21], [37.0, 38.03], [39.0, 40.91], [42.0, 42.84], [48.0, 48.71], [50.0, 50.41], [52.0, 58.14], [60.0, 62.82], [65.0, 66.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 97.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.43, 1.77, 1.26, -0.04, 2.4, 1.06, 0.21, 1.03, 1.91, 0.84, 0.71, 0.41, 6.14, 2.82, 1.53]} \ No newline at end of file diff --git a/annotations_filtered/ukzIFp4Kj90_filtered.json b/annotations_filtered/ukzIFp4Kj90_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b05156457522f86101d3237fac1e6bf7a17b7da1 --- /dev/null +++ b/annotations_filtered/ukzIFp4Kj90_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 16.33], [17.0, 18.76], [26.0, 26.77], [28.0, 29.96], [30.0, 30.84], [32.0, 33.03], [36.0, 39.55], [41.0, 42.6], [44.0, 46.28], [48.0, 48.46], [50.0, 50.4], [52.0, 54.13], [57.0, 58.73], [60.0, 60.22], [62.0, 66.73], [68.0, 69.74], [70.0, 70.9], [72.0, 72.86], [74.0, 76.11], [80.0, 80.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.71, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 98.93, 0.0, 0.0, 59.42, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [[["speech", 80.63], ["bouncing", 6.37], ["fart", 1.83]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [12.33, 1.76, 0.77, 1.96, 0.84, 1.03, 3.55, 1.6, 2.28, 0.46, 0.4, 2.13, 1.73, 0.22, 4.73, 1.74, 0.9, 0.86, 2.11, 0.0]} \ No newline at end of file diff --git a/annotations_filtered/ulFxMs35-P0_filtered.json b/annotations_filtered/ulFxMs35-P0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2d4177677fbb7e4d70a86ef725aafcfea5c1eb3 --- /dev/null +++ b/annotations_filtered/ulFxMs35-P0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 28.92], [30.0, 30.74], [35.0, 47.9], [50.0, 49.64], [50.0, 53.4], [55.0, 80.13], [81.0, 81.45], [82.0, 92.21]], "keep_status": [false, false, false, false, true, true, false, true], "silence_prob": [0.0, 0.0, 30.02, 0.0, 31.16, 32.09, 0.0, 29.36], "audiomae_on_audioset": [null, null, [["music", 49.51], ["smash, crash", 12.59], ["thump, thud", 11.66]], null, [["music", 38.72], ["hum", 18.29], ["throbbing", 10.35]], [["speech", 21.97], ["hum", 18.1], ["mains hum", 16.36]], null, [["speech", 27.4], ["music", 26.17], ["hum", 11.78]]], "duration": [0.92, 0.74, 12.9, -0.36, 3.4, 25.13, 0.45, 10.21]} \ No newline at end of file diff --git a/annotations_filtered/ulGMlIZNr6M_filtered.json b/annotations_filtered/ulGMlIZNr6M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e14e3bc95cbb0054777483e9caa32ca1d151ebb5 --- /dev/null +++ b/annotations_filtered/ulGMlIZNr6M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.32], [11.0, 11.43], [12.0, 14.0], [24.0, 23.94], [25.0, 25.83], [27.0, 30.06], [31.0, 35.78], [39.0, 39.12], [45.0, 47.88]], "keep_status": [true, false, true, false, false, false, true, false, true], "silence_prob": [32.13, 0.0, 33.94, 0.0, 0.0, 34.36, 31.72, 0.0, 36.58], "audiomae_on_audioset": [[["music", 53.7], ["musical instrument", 4.94], ["ice cream truck, ice cream van", 3.56]], null, [["music", 35.98], ["foghorn", 7.47], ["speech", 4.58]], null, null, [["music", 34.92], ["didgeridoo", 32.85], ["grunt", 5.78]], [["music", 33.13], ["whale vocalization", 15.66], ["speech", 14.33]], null, [["music", 48.32], ["stomach rumble", 9.99], ["brass instrument", 3.31]]], "duration": [2.32, 0.43, 2.0, -0.06, 0.83, 3.06, 4.78, 0.12, 2.88]} \ No newline at end of file diff --git a/annotations_filtered/ulJXiB5i_q0_filtered.json b/annotations_filtered/ulJXiB5i_q0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07695e22074e15a3fffb6b164d15fe0c64cad8a0 --- /dev/null +++ b/annotations_filtered/ulJXiB5i_q0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.56], [7.0, 10.18], [12.0, 14.71], [18.0, 18.89], [21.0, 23.52], [26.0, 28.41], [30.0, 37.23], [41.0, 56.19], [61.0, 63.69], [68.0, 68.74], [70.0, 71.2], [73.0, 73.53], [76.0, 79.37], [83.0, 86.98], [90.0, 94.2], [96.0, 96.74], [97.0, 99.27], [100.0, 102.71], [107.0, 107.0], [107.0, 107.13], [107.0, 108.33], [114.0, 118.44], [124.0, 126.4], [130.0, 134.03], [135.0, 137.52], [139.0, 141.98], [146.0, 159.04], [164.0, 165.97], [170.0, 172.64], [184.0, 188.43], [192.0, 197.19], [201.0, 202.69], [214.0, 216.31], [232.0, 239.97], [241.0, 242.91], [243.0, 244.76], [246.0, 247.18], [248.0, 259.31], [261.0, 265.06], [266.0, 273.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, true, false, false, false, false, false, false, true, false, false], "silence_prob": [100.0, 100.0, 100.0, 0.0, 99.98, 95.23, 100.0, 79.59, 60.6, 0.0, 0.0, 0.0, 38.55, 82.25, 40.54, 0.0, 67.13, 89.9, 0.0, 0.0, 0.0, 64.18, 73.67, 30.43, 48.56, 89.36, 30.33, 0.0, 39.7, 32.7, 34.51, 0.0, 32.34, 36.52, 0.0, 0.0, 0.0, 43.08, 50.97, 99.71], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.65], ["humming", 4.71], ["lullaby", 4.02]], null, [["music", 57.45], ["theremin", 5.99], ["humming", 4.69]], null, null, null, null, null, null, null, null, [["music", 35.6], ["musical instrument", 4.76], ["effects unit", 4.58]], [["fly, housefly", 24.55], ["insect", 15.67], ["music", 13.03]], null, [["music", 51.64], ["theremin", 34.98], ["synthesizer", 1.9]], null, [["music", 72.55], ["musical instrument", 4.35], ["cello", 1.92]], [["music", 38.5], ["brass instrument", 16.58], ["trombone", 12.36]], [["music", 44.58], ["cello", 9.06], ["theremin", 8.57]], null, [["music", 53.27], ["didgeridoo", 17.73], ["theremin", 14.61]], [["theremin", 65.51], ["music", 26.52], ["singing", 0.65]], null, null, null, [["music", 35.08], ["effects unit", 10.06], ["singing", 6.43]], null, null], "duration": [2.56, 3.18, 2.71, 0.89, 2.52, 2.41, 7.23, 15.19, 2.69, 0.74, 1.2, 0.53, 3.37, 3.98, 4.2, 0.74, 2.27, 2.71, 0.0, 0.13, 1.33, 4.44, 2.4, 4.03, 2.52, 2.98, 13.04, 1.97, 2.64, 4.43, 5.19, 1.69, 2.31, 7.97, 1.91, 1.76, 1.18, 11.31, 4.06, 7.67]} \ No newline at end of file diff --git a/annotations_filtered/ulLxPcOmDmU_filtered.json b/annotations_filtered/ulLxPcOmDmU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edacdde3f8e5a0a82b79f24e616b49b4eaf65914 --- /dev/null +++ b/annotations_filtered/ulLxPcOmDmU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 132.7], [134.0, 133.64], [134.0, 144.69]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 84.98], "audiomae_on_audioset": [null, null, null], "duration": [118.7, -0.36, 10.69]} \ No newline at end of file diff --git a/annotations_filtered/ulMNuwN1C-8_filtered.json b/annotations_filtered/ulMNuwN1C-8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f85350a5aba056ab6f03f2458990e62c1848a74 --- /dev/null +++ b/annotations_filtered/ulMNuwN1C-8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.83], [20.0, 19.92], [30.0, 30.82], [33.0, 33.37], [41.0, 42.45], [46.0, 46.21], [54.0, 55.76], [58.0, 58.46], [60.0, 61.6], [62.0, 63.15], [65.0, 65.47], [67.0, 69.53], [70.0, 72.06], [73.0, 74.28], [81.0, 81.63], [85.0, 87.52], [91.0, 92.06], [93.0, 94.74], [96.0, 98.96], [99.0, 99.0], [99.0, 101.22], [103.0, 104.48], [105.0, 105.93], [108.0, 109.05], [117.0, 123.89], [127.0, 128.21], [128.0, 128.31], [128.0, 128.98], [131.0, 133.79], [135.0, 135.45], [136.0, 137.57], [140.0, 143.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [71.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 57.64, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 84.98, 0.0, 0.0, 0.0, 37.45, 0.0, 0.0, 0.0, 34.88, 0.0, 0.0, 66.76], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cowbell", 72.29], ["music", 11.62], ["didgeridoo", 2.1]], null, null, null, [["fly, housefly", 26.16], ["mosquito", 14.36], ["insect", 10.53]], null, null, null], "duration": [2.83, -0.08, 0.82, 0.37, 1.45, 0.21, 1.76, 0.46, 1.6, 1.15, 0.47, 2.53, 2.06, 1.28, 0.63, 2.52, 1.06, 1.74, 2.96, 0.0, 2.22, 1.48, 0.93, 1.05, 6.89, 1.21, 0.31, 0.98, 2.79, 0.45, 1.57, 3.09]} \ No newline at end of file diff --git a/annotations_filtered/ul_HuCZxxNU_filtered.json b/annotations_filtered/ul_HuCZxxNU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94d2f22eaba863084db363e0d70434cf76d8a409 --- /dev/null +++ b/annotations_filtered/ul_HuCZxxNU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 36.44], [39.0, 40.17], [49.0, 53.23], [53.0, 53.27]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 32.39, 0.0], "audiomae_on_audioset": [null, null, [["speech", 55.2], ["music", 17.68], ["breaking", 17.0]], null], "duration": [0.44, 1.17, 4.23, 0.27]} \ No newline at end of file diff --git a/annotations_filtered/ulwUkaKjgY0_filtered.json b/annotations_filtered/ulwUkaKjgY0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..978d70369d03276ebd9ace3769fc7835143e279d --- /dev/null +++ b/annotations_filtered/ulwUkaKjgY0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.61], [21.0, 23.09], [25.0, 25.44], [33.0, 36.51], [38.0, 39.18], [40.0, 39.88], [40.0, 40.88], [42.0, 41.79], [53.0, 61.96], [66.0, 66.02], [68.0, 69.52], [71.0, 72.32], [74.0, 74.76], [77.0, 77.3], [85.0, 85.43], [89.0, 89.41], [94.0, 95.74], [104.0, 107.37], [109.0, 109.93], [118.0, 118.22], [119.0, 119.92], [121.0, 124.97], [125.0, 125.93], [127.0, 128.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 62.37, 0.0, 0.0, 0.0, 0.0, 39.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.14, 0.0, 0.0, 0.0, 72.75, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 76.78], ["knock", 5.45], ["hammer", 3.05]], null, null, null, null, null, null, null, null, [["speech", 57.53], ["thunk", 17.91], ["whack, thwack", 5.95]], null, null, null, null, null, null], "duration": [0.61, 2.09, 0.44, 3.51, 1.18, -0.12, 0.88, -0.21, 8.96, 0.02, 1.52, 1.32, 0.76, 0.3, 0.43, 0.41, 1.74, 3.37, 0.93, 0.22, 0.92, 3.97, 0.93, 1.61]} \ No newline at end of file diff --git a/annotations_filtered/um3tlxmK7Cg_filtered.json b/annotations_filtered/um3tlxmK7Cg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80aa6104025c63690cd4bf6bc3dacf8082d27093 --- /dev/null +++ b/annotations_filtered/um3tlxmK7Cg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.38], [8.0, 12.99], [20.0, 19.62], [25.0, 24.88], [32.0, 49.28], [50.0, 51.04], [52.0, 58.78], [59.0, 59.56], [62.0, 67.14], [68.0, 68.55], [70.0, 70.98], [74.0, 75.42], [76.0, 75.52], [76.0, 77.99], [86.0, 90.26], [91.0, 91.12], [91.0, 91.32], [96.0, 103.59], [105.0, 110.96]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true, true], "silence_prob": [36.61, 44.49, 0.0, 0.0, 30.07, 0.0, 31.35, 0.0, 31.21, 0.0, 0.0, 0.0, 0.0, 0.0, 35.81, 0.0, 0.0, 37.93, 34.19], "audiomae_on_audioset": [[["speech", 61.94], ["music", 6.32], ["splash, splatter", 3.85]], [["music", 38.77], ["speech", 18.09], ["sidetone", 4.83]], null, null, [["speech", 44.18], ["buzz", 14.56], ["didgeridoo", 14.39]], null, [["livestock, farm animals, working animals", 58.32], ["cattle, bovinae", 20.33], ["moo", 12.91]], null, [["roaring cats (lions, tigers)", 18.05], ["moo", 13.87], ["cattle, bovinae", 13.48]], null, null, null, null, null, [["speech", 20.96], ["music", 18.05], ["noise", 12.44]], null, null, [["music", 47.64], ["livestock, farm animals, working animals", 16.26], ["cattle, bovinae", 4.29]], [["music", 30.64], ["synthesizer", 11.7], ["whale vocalization", 10.52]]], "duration": [2.38, 4.99, -0.38, -0.12, 17.28, 1.04, 6.78, 0.56, 5.14, 0.55, 0.98, 1.42, -0.48, 1.99, 4.26, 0.12, 0.32, 7.59, 5.96]} \ No newline at end of file diff --git a/annotations_filtered/umIBbT6uwZI_filtered.json b/annotations_filtered/umIBbT6uwZI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1427f30bbba344f00b6f00325aee6f77e36dfd8f --- /dev/null +++ b/annotations_filtered/umIBbT6uwZI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.33], [19.0, 19.75], [21.0, 26.65], [28.0, 32.0], [34.0, 34.82], [35.0, 43.63], [44.0, 48.32], [51.0, 60.2], [62.0, 71.74], [84.0, 93.6], [98.0, 102.37], [104.0, 106.2], [114.0, 122.79], [125.0, 131.03], [132.0, 133.27], [135.0, 137.98], [139.0, 142.48], [145.0, 147.21], [148.0, 158.21]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 61.08, 91.81, 0.0, 40.97, 39.99, 38.25, 35.16, 36.17, 35.77, 73.21, 34.23, 49.36, 0.0, 92.15, 63.21, 84.25, 35.76], "audiomae_on_audioset": [null, null, null, null, null, [["music", 41.98], ["speech", 33.28], ["didgeridoo", 3.62]], [["music", 40.55], ["quack", 20.78], ["whip", 6.3]], [["music", 55.64], ["fart", 26.35], ["didgeridoo", 5.91]], [["music", 60.61], ["synthesizer", 7.58], ["didgeridoo", 6.81]], [["music", 69.24], ["didgeridoo", 8.26], ["musical instrument", 5.14]], [["music", 49.72], ["speech", 16.38], ["quack", 6.91]], null, [["music", 55.82], ["didgeridoo", 18.05], ["speech", 3.65]], [["music", 57.87], ["brass instrument", 7.64], ["didgeridoo", 5.54]], null, null, null, null, [["music", 75.38], ["didgeridoo", 9.48], ["quack", 2.52]]], "duration": [0.33, 0.75, 5.65, 4.0, 0.82, 8.63, 4.32, 9.2, 9.74, 9.6, 4.37, 2.2, 8.79, 6.03, 1.27, 2.98, 3.48, 2.21, 10.21]} \ No newline at end of file diff --git a/annotations_filtered/umKFAbLoUxQ_filtered.json b/annotations_filtered/umKFAbLoUxQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe4b9f97b37521ae8f21162a57e5d931a8e8fb0a --- /dev/null +++ b/annotations_filtered/umKFAbLoUxQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 19.43], [25.0, 30.37], [32.0, 33.89], [34.0, 33.94], [34.0, 34.16], [35.0, 35.9], [37.0, 38.2], [41.0, 41.22], [44.0, 51.06], [52.0, 55.0], [57.0, 60.96], [64.0, 65.5], [67.0, 68.18], [69.0, 72.01], [73.0, 76.99], [78.0, 78.6], [80.0, 81.87], [84.0, 84.77], [87.0, 88.05], [89.0, 89.85], [90.0, 90.46], [92.0, 95.39], [97.0, 98.85], [101.0, 101.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [90.6, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.63, 42.02, 63.21, 0.0, 0.0, 89.01, 61.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.46, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 44.7], ["didgeridoo", 24.26], ["theremin", 3.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.43, 5.37, 1.89, -0.06, 0.16, 0.9, 1.2, 0.22, 7.06, 3.0, 3.96, 1.5, 1.18, 3.01, 3.99, 0.6, 1.87, 0.77, 1.05, 0.85, 0.46, 3.39, 1.85, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/umOy9nT4Wpw_filtered.json b/annotations_filtered/umOy9nT4Wpw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..345a4db4b53b75a25066483fecda4cce19b5abda --- /dev/null +++ b/annotations_filtered/umOy9nT4Wpw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.46], [27.0, 28.63], [30.0, 30.5], [31.0, 32.09], [33.0, 34.3]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.46, 1.63, 0.5, 1.09, 1.3]} \ No newline at end of file diff --git a/annotations_filtered/umcyzRBeJtE_filtered.json b/annotations_filtered/umcyzRBeJtE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7ba94562f2d505c8cda466ca6715be9badd5618 --- /dev/null +++ b/annotations_filtered/umcyzRBeJtE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.53], [20.0, 21.03], [38.0, 41.34], [43.0, 43.21], [45.0, 47.36], [49.0, 48.88], [63.0, 65.47], [71.0, 71.9], [73.0, 73.41], [76.0, 78.19], [81.0, 81.5], [86.0, 88.94], [90.0, 91.62], [92.0, 92.67], [96.0, 96.23], [98.0, 99.47], [101.0, 101.09], [103.0, 103.5], [106.0, 106.37], [107.0, 107.82], [108.0, 108.73], [113.0, 113.1], [114.0, 114.99], [116.0, 116.28], [119.0, 119.64], [123.0, 123.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.98, 0.0, 51.55, 0.0, 83.7, 0.0, 0.0, 77.53, 0.0, 46.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 63.88], ["timpani", 3.54], ["inside, small room", 3.07]], null, null, null, null, null, null, null, null, [["music", 23.0], ["hum", 14.14], ["gong", 11.38]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 1.03, 3.34, 0.21, 2.36, -0.12, 2.47, 0.9, 0.41, 2.19, 0.5, 2.94, 1.62, 0.67, 0.23, 1.47, 0.09, 0.5, 0.37, 0.82, 0.73, 0.1, 0.99, 0.28, 0.64, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/umjmV3SwDjw_filtered.json b/annotations_filtered/umjmV3SwDjw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37f2f31e5fb6697f7669eccffe99e2b1b080150d --- /dev/null +++ b/annotations_filtered/umjmV3SwDjw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.72], [21.0, 22.08], [22.0, 25.68], [26.0, 26.64], [28.0, 28.85], [33.0, 38.13], [40.0, 40.32], [49.0, 49.1], [57.0, 57.42], [62.0, 63.34], [68.0, 67.78], [74.0, 74.46], [75.0, 75.66], [80.0, 87.91], [93.0, 94.2], [107.0, 107.59], [111.0, 112.68], [116.0, 116.38], [117.0, 122.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 50.36, 0.0, 0.0, 51.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.85, 0.0, 0.0, 0.0, 0.0, 30.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["whack, thwack", 30.84], ["speech", 16.28], ["livestock, farm animals, working animals", 6.43]], null, null, null, null, [["speech", 25.98], ["explosion", 23.71], ["burst, pop", 8.0]]], "duration": [0.72, 1.08, 3.68, 0.64, 0.85, 5.13, 0.32, 0.1, 0.42, 1.34, -0.22, 0.46, 0.66, 7.91, 1.2, 0.59, 1.68, 0.38, 5.22]} \ No newline at end of file diff --git a/annotations_filtered/unWr90pLIvc_filtered.json b/annotations_filtered/unWr90pLIvc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8e67f0313b1866e6a2c403b6d444582fa1884db --- /dev/null +++ b/annotations_filtered/unWr90pLIvc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 33.94], [35.0, 37.3], [38.0, 41.27], [43.0, 44.86], [47.0, 49.6], [50.0, 63.88], [70.0, 85.99], [87.0, 90.0], [91.0, 93.21], [97.0, 99.22], [101.0, 102.44], [110.0, 112.65], [114.0, 116.07], [130.0, 136.61], [137.0, 137.96], [140.0, 144.49], [156.0, 156.39], [159.0, 160.05], [171.0, 174.6], [187.0, 188.0], [188.0, 188.69], [189.0, 195.57], [197.0, 199.77], [200.0, 203.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 100.0, 84.43, 0.0, 78.21, 66.15, 71.0, 67.25, 69.2, 77.7, 0.0, 86.27, 73.36, 76.7, 0.0, 78.72, 0.0, 0.0, 61.87, 0.0, 0.0, 81.71, 68.54, 53.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.94, 2.3, 3.27, 1.86, 2.6, 13.88, 15.99, 3.0, 2.21, 2.22, 1.44, 2.65, 2.07, 6.61, 0.96, 4.49, 0.39, 1.05, 3.6, 1.0, 0.69, 6.57, 2.77, 3.13]} \ No newline at end of file diff --git a/annotations_filtered/undTPa_iq1Y_filtered.json b/annotations_filtered/undTPa_iq1Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fdc4384c642194c4e59906b2b59789120754bfa --- /dev/null +++ b/annotations_filtered/undTPa_iq1Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.43], [9.0, 15.97], [18.0, 18.6], [19.0, 21.84], [23.0, 24.54], [26.0, 27.55], [29.0, 32.12], [34.0, 36.91], [39.0, 53.45], [55.0, 56.05], [56.0, 57.11], [59.0, 60.05], [61.0, 63.19], [64.0, 65.77], [67.0, 68.4], [70.0, 70.97], [74.0, 74.92], [76.0, 77.31], [79.0, 82.26], [83.0, 86.04], [87.0, 89.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [74.6, 65.09, 0.0, 94.95, 0.0, 0.0, 99.91, 54.76, 60.23, 0.0, 0.0, 0.0, 47.82, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82, 99.87, 99.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 75.08], ["inside, small room", 2.67], ["stomach rumble", 2.51]], null, null, null, null, null, null, null, null], "duration": [2.43, 6.97, 0.6, 2.84, 1.54, 1.55, 3.12, 2.91, 14.45, 1.05, 1.11, 1.05, 2.19, 1.77, 1.4, 0.97, 0.92, 1.31, 3.26, 3.04, 2.23]} \ No newline at end of file diff --git a/annotations_filtered/unl0GXfJRLA_filtered.json b/annotations_filtered/unl0GXfJRLA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..170ee45c2ab2948fe615e841fc93758b74386c45 --- /dev/null +++ b/annotations_filtered/unl0GXfJRLA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.49], [2.0, 3.35], [40.0, 39.83], [41.0, 41.77], [44.0, 44.17], [49.0, 49.62]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.49, 1.35, -0.17, 0.77, 0.17, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/uopLUlluf-I_filtered.json b/annotations_filtered/uopLUlluf-I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1f4948a88b0e18e54402fb009d0df39c1da56b5 --- /dev/null +++ b/annotations_filtered/uopLUlluf-I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.52], [11.0, 13.95], [23.0, 25.83], [27.0, 29.2], [33.0, 35.13], [39.0, 39.63], [42.0, 43.87], [48.0, 51.21], [57.0, 57.33], [61.0, 64.37], [65.0, 67.26], [70.0, 71.19], [72.0, 72.99], [73.0, 77.25], [79.0, 82.59], [88.0, 91.91], [92.0, 91.99], [92.0, 95.5], [96.0, 99.96], [103.0, 107.89], [111.0, 118.88], [121.0, 122.37], [123.0, 124.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.1, 100.0, 71.87, 63.96, 100.0, 0.0, 0.0, 87.37, 0.0, 100.0, 95.64, 0.0, 0.0, 100.0, 100.0, 98.93, 0.0, 96.42, 91.81, 99.87, 71.14, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.52, 2.95, 2.83, 2.2, 2.13, 0.63, 1.87, 3.21, 0.33, 3.37, 2.26, 1.19, 0.99, 4.25, 3.59, 3.91, -0.01, 3.5, 3.96, 4.89, 7.88, 1.37, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/uopoXtR0Kjk_filtered.json b/annotations_filtered/uopoXtR0Kjk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d396725052b810a55077022a492c6407b8cb57ff --- /dev/null +++ b/annotations_filtered/uopoXtR0Kjk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.91], [5.0, 10.45], [13.0, 14.44], [15.0, 16.29], [17.0, 18.6], [20.0, 22.76], [36.0, 37.94], [41.0, 42.52], [44.0, 45.89], [54.0, 60.44], [62.0, 64.29], [66.0, 65.99], [67.0, 68.35], [69.0, 69.74], [70.0, 82.38], [86.0, 86.17], [88.0, 92.94], [106.0, 107.65], [108.0, 108.43], [111.0, 111.65], [112.0, 112.9], [117.0, 117.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 89.54, 0.0, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 92.64, 81.71, 0.0, 0.0, 0.0, 35.8, 0.0, 39.78, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.04], ["foghorn", 15.96], ["speech", 9.88]], null, [["music", 33.22], ["didgeridoo", 28.84], ["mains hum", 5.97]], null, null, null, null, null], "duration": [0.91, 5.45, 1.44, 1.29, 1.6, 2.76, 1.94, 1.52, 1.89, 6.44, 2.29, -0.01, 1.35, 0.74, 12.38, 0.17, 4.94, 1.65, 0.43, 0.65, 0.9, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/up1wTd5shfc_filtered.json b/annotations_filtered/up1wTd5shfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd562b5fd2aab93ddd399bb588ed8bffa0931ece --- /dev/null +++ b/annotations_filtered/up1wTd5shfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 9.93], [11.0, 41.47], [42.0, 42.67], [44.0, 48.46], [50.0, 51.17], [52.0, 53.57], [55.0, 57.23], [63.0, 64.67], [75.0, 74.85], [79.0, 80.54], [89.0, 91.29], [94.0, 109.17], [112.0, 116.31], [117.0, 126.98], [128.0, 130.23], [132.0, 132.54], [135.0, 136.86], [138.0, 138.38], [141.0, 158.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [54.5, 0.0, 0.0, 97.54, 0.0, 0.0, 98.44, 0.0, 0.0, 0.0, 99.16, 47.2, 57.17, 50.86, 53.78, 0.0, 0.0, 0.0, 34.24], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 53.47], ["musical instrument", 4.15], ["didgeridoo", 3.98]], null, null, null, null, null, null, [["music", 44.66], ["throbbing", 8.24], ["synthesizer", 6.25]]], "duration": [7.93, 30.47, 0.67, 4.46, 1.17, 1.57, 2.23, 1.67, -0.15, 1.54, 2.29, 15.17, 4.31, 9.98, 2.23, 0.54, 1.86, 0.38, 17.21]} \ No newline at end of file diff --git a/annotations_filtered/up5GI3Sp7Lo_filtered.json b/annotations_filtered/up5GI3Sp7Lo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8fc1b4b2464d2120b41b39ea2b30b6c5732181e1 --- /dev/null +++ b/annotations_filtered/up5GI3Sp7Lo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 40.24], [42.0, 42.6], [44.0, 57.23], [58.0, 61.62], [62.0, 65.89], [67.0, 67.47], [71.0, 72.54], [74.0, 86.95], [89.0, 103.25]], "keep_status": [true, false, false, false, false, false, false, false, true], "silence_prob": [32.3, 0.0, 33.43, 95.23, 50.36, 0.0, 0.0, 68.15, 31.8], "audiomae_on_audioset": [[["music", 45.39], ["boing", 9.51], ["whack, thwack", 6.96]], null, [["music", 68.88], ["throbbing", 8.46], ["hum", 5.33]], null, null, null, null, null, [["music", 31.34], ["cowbell", 14.74], ["livestock, farm animals, working animals", 7.61]]], "duration": [5.24, 0.6, 13.23, 3.62, 3.89, 0.47, 1.54, 12.95, 14.25]} \ No newline at end of file diff --git a/annotations_filtered/up7I_0JGTgQ_filtered.json b/annotations_filtered/up7I_0JGTgQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1bdb5bc53759d985f22d80c0f0372d92982420de --- /dev/null +++ b/annotations_filtered/up7I_0JGTgQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 48.02], [51.0, 61.08], [62.0, 62.09], [63.0, 66.68], [67.0, 70.17], [72.0, 72.77], [75.0, 79.83], [83.0, 105.48], [106.0, 106.83], [108.0, 114.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.87, 0.0, 35.89, 35.53, 0.0, 35.59, 35.39, 0.0, 36.72], "audiomae_on_audioset": [null, [["music", 48.18], ["brass instrument", 16.27], ["musical instrument", 7.99]], null, [["music", 65.18], ["boing", 3.29], ["music of latin america", 2.3]], [["music", 53.47], ["harmonica", 13.98], ["carnatic music", 3.53]], null, [["music", 72.33], ["didgeridoo", 4.79], ["trombone", 2.95]], [["music", 73.58], ["swing music", 5.13], ["musical instrument", 4.99]], null, [["music", 73.16], ["swing music", 4.92], ["musical instrument", 4.12]]], "duration": [0.02, 10.08, 0.09, 3.68, 3.17, 0.77, 4.83, 22.48, 0.83, 6.47]} \ No newline at end of file diff --git a/annotations_filtered/upPFFVaVSY4_filtered.json b/annotations_filtered/upPFFVaVSY4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48dd8a864caaa34876d7140a3352d04617503bf9 --- /dev/null +++ b/annotations_filtered/upPFFVaVSY4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 20.21], [29.0, 29.32], [31.0, 33.4], [36.0, 37.17], [45.0, 48.41], [52.0, 59.1], [63.0, 64.57], [66.0, 67.68], [68.0, 69.47], [74.0, 75.03], [82.0, 86.32], [90.0, 91.05]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [38.52, 0.0, 40.7, 0.0, 52.1, 93.45, 0.0, 0.0, 0.0, 0.0, 42.3, 0.0], "audiomae_on_audioset": [[["mains hum", 32.4], ["hum", 26.43], ["music", 9.95]], null, [["frog", 26.73], ["sidetone", 25.13], ["speech", 21.95]], null, null, null, null, null, null, null, [["noise", 24.25], ["music", 14.5], ["effects unit", 12.38]], null], "duration": [4.21, 0.32, 2.4, 1.17, 3.41, 7.1, 1.57, 1.68, 1.47, 1.03, 4.32, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/upoh7LbKZR0_filtered.json b/annotations_filtered/upoh7LbKZR0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c1b1b0a0cec6ccf000245b8116af66c25d12794 --- /dev/null +++ b/annotations_filtered/upoh7LbKZR0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.09], [6.0, 5.97], [6.0, 6.88], [8.0, 8.95], [10.0, 10.57], [12.0, 13.31], [14.0, 30.4], [37.0, 37.45], [38.0, 42.69], [43.0, 43.73], [45.0, 45.62], [46.0, 46.95], [47.0, 47.95], [49.0, 50.14], [51.0, 51.9], [53.0, 53.0], [55.0, 54.9], [55.0, 55.9], [57.0, 57.2], [58.0, 58.75], [60.0, 60.4], [62.0, 62.56], [63.0, 63.15], [65.0, 66.28], [72.0, 72.59], [73.0, 74.41], [76.0, 76.71], [79.0, 79.59], [84.0, 84.23], [86.0, 86.19], [87.0, 87.59], [89.0, 89.53], [92.0, 101.7], [102.0, 102.91], [104.0, 104.46], [106.0, 106.44], [112.0, 112.13], [113.0, 113.73], [115.0, 118.76], [126.0, 145.56], [147.0, 147.01], [147.0, 152.49]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.75, 0.0, 35.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.46, 0.0, 0.0, 0.0, 0.0, 0.0, 32.2, 64.63, 0.0, 99.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 28.59], ["ambient music", 11.11], ["didgeridoo", 6.29]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["throbbing", 22.59], ["hum", 18.95], ["heart murmur", 10.94]], null, null, null, null, null, [["music", 32.71], ["synthesizer", 9.45], ["sidetone", 9.16]], null, null, null], "duration": [1.09, -0.03, 0.88, 0.95, 0.57, 1.31, 16.4, 0.45, 4.69, 0.73, 0.62, 0.95, 0.95, 1.14, 0.9, 0.0, -0.1, 0.9, 0.2, 0.75, 0.4, 0.56, 0.15, 1.28, 0.59, 1.41, 0.71, 0.59, 0.23, 0.19, 0.59, 0.53, 9.7, 0.91, 0.46, 0.44, 0.13, 0.73, 3.76, 19.56, 0.01, 5.49]} \ No newline at end of file diff --git a/annotations_filtered/upwUN92OAQU_filtered.json b/annotations_filtered/upwUN92OAQU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..736c5c095baa0bb6415089987eb9cea4d6a711e4 --- /dev/null +++ b/annotations_filtered/upwUN92OAQU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.42]], "keep_status": [false], "silence_prob": [94.37], "audiomae_on_audioset": [null], "duration": [2.42]} \ No newline at end of file diff --git a/annotations_filtered/upyAJ-kEgNY_filtered.json b/annotations_filtered/upyAJ-kEgNY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e605ef8a59497b0811ea172431843c3ccc711041 --- /dev/null +++ b/annotations_filtered/upyAJ-kEgNY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 75.52], [85.0, 126.69]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [36.52, 41.69]} \ No newline at end of file diff --git a/annotations_filtered/uq1JHKlUtOU_filtered.json b/annotations_filtered/uq1JHKlUtOU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24892beaa400486317fe10371fffdaa8c4b35ab0 --- /dev/null +++ b/annotations_filtered/uq1JHKlUtOU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.95], [17.0, 17.81], [27.0, 32.27], [36.0, 41.81], [43.0, 45.37], [53.0, 52.78], [58.0, 60.72], [62.0, 61.86], [70.0, 70.53], [72.0, 73.55], [76.0, 79.61], [81.0, 81.24], [82.0, 83.73], [89.0, 89.53]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.49, 63.96, 54.7, 0.0, 99.62, 0.0, 0.0, 0.0, 99.87, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 30.93], ["sidetone", 23.76], ["sine wave", 11.83]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.95, 0.81, 5.27, 5.81, 2.37, -0.22, 2.72, -0.14, 0.53, 1.55, 3.61, 0.24, 1.73, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/uqS2-v7iZr8_filtered.json b/annotations_filtered/uqS2-v7iZr8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3d1d92b9de394bf55fe8e1dad255aa8124b48c7 --- /dev/null +++ b/annotations_filtered/uqS2-v7iZr8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.18], [15.0, 14.94], [15.0, 16.04], [18.0, 50.72], [52.0, 58.11], [60.0, 61.05], [63.0, 64.05], [69.0, 69.48], [73.0, 74.65], [76.0, 78.21], [82.0, 86.46], [88.0, 98.56], [100.0, 114.32], [116.0, 115.99], [117.0, 120.51], [121.0, 122.44]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [28.51, 0.0, 0.0, 0.0, 57.01, 0.0, 0.0, 0.0, 0.0, 45.56, 41.46, 35.82, 34.14, 0.0, 62.17, 0.0], "audiomae_on_audioset": [[["music", 57.39], ["didgeridoo", 6.55], ["musical instrument", 4.94]], null, null, null, null, null, null, null, null, [["music", 52.26], ["theremin", 18.01], ["musical instrument", 8.12]], [["music", 39.35], ["cello", 32.76], ["double bass", 10.67]], [["music", 32.47], ["hum", 20.09], ["mains hum", 14.14]], [["theremin", 87.37], ["music", 8.2], ["musical instrument", 1.1]], null, null, null], "duration": [3.18, -0.06, 1.04, 32.72, 6.11, 1.05, 1.05, 0.48, 1.65, 2.21, 4.46, 10.56, 14.32, -0.01, 3.51, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/uqVEYJGg3J0_filtered.json b/annotations_filtered/uqVEYJGg3J0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8fee5add04e5cca4820bcfcaec27c797cbdb0f5e --- /dev/null +++ b/annotations_filtered/uqVEYJGg3J0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.39], [8.0, 9.39], [10.0, 10.37], [13.0, 13.61], [18.0, 19.68], [22.0, 23.35], [25.0, 25.95], [40.0, 40.71], [42.0, 43.43], [46.0, 47.36], [50.0, 52.02], [52.0, 58.19], [63.0, 67.15], [69.0, 69.43], [73.0, 73.63], [76.0, 77.01], [83.0, 84.77], [87.0, 87.98], [91.0, 93.65], [100.0, 101.92], [103.0, 104.23], [106.0, 107.42], [109.0, 109.22], [111.0, 111.42], [112.0, 112.58], [116.0, 118.25], [121.0, 122.07], [124.0, 126.35], [135.0, 136.0], [138.0, 139.18], [141.0, 141.08], [146.0, 145.67], [150.0, 150.53], [153.0, 155.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.96, 58.89, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 32.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 91.64, 0.0, 0.0, 0.0, 0.0, 0.0, 65.67], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 69.06], ["radio", 25.01], ["sidetone", 2.02]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.39, 1.39, 0.37, 0.61, 1.68, 1.35, 0.95, 0.71, 1.43, 1.36, 2.02, 6.19, 4.15, 0.43, 0.63, 1.01, 1.77, 0.98, 2.65, 1.92, 1.23, 1.42, 0.22, 0.42, 0.58, 2.25, 1.07, 2.35, 1.0, 1.18, 0.08, -0.33, 0.53, 2.04]} \ No newline at end of file diff --git a/annotations_filtered/uqeGxkIdBiY_filtered.json b/annotations_filtered/uqeGxkIdBiY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9717a985fd109cb45904b986940241544242041b --- /dev/null +++ b/annotations_filtered/uqeGxkIdBiY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[57.0, 67.51], [71.0, 73.6], [77.0, 77.19], [82.0, 110.83]], "keep_status": [false, false, false, false], "silence_prob": [73.67, 80.46, 0.0, 49.22], "audiomae_on_audioset": [null, null, null, [["whale vocalization", 96.36], ["gurgling", 0.71], ["speech", 0.37]]], "duration": [10.51, 2.6, 0.19, 28.83]} \ No newline at end of file diff --git a/annotations_filtered/ur0U4xN0d_A_filtered.json b/annotations_filtered/ur0U4xN0d_A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7766626bb2260d20927f798a0d0ee9a8e16c76a0 --- /dev/null +++ b/annotations_filtered/ur0U4xN0d_A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.73], [15.0, 16.23], [18.0, 22.54], [23.0, 24.19], [32.0, 33.02], [33.0, 36.1], [36.0, 36.88], [51.0, 51.75], [53.0, 53.7], [54.0, 58.67], [60.0, 62.13], [68.0, 72.82], [74.0, 74.7], [106.0, 108.82], [111.0, 112.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 92.64, 0.0, 0.0, 0.0, 77.87, 97.54, 99.59, 0.0, 62.78, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.73, 1.23, 4.54, 1.19, 1.02, 3.1, 0.88, 0.75, 0.7, 4.67, 2.13, 4.82, 0.7, 2.82, 1.21]} \ No newline at end of file diff --git a/annotations_filtered/urWMTYuDxME_filtered.json b/annotations_filtered/urWMTYuDxME_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13be9be192b0a7837257ecbcfb842aa6137486e4 --- /dev/null +++ b/annotations_filtered/urWMTYuDxME_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 13.83], [16.0, 16.82], [18.0, 19.4], [20.0, 23.68], [24.0, 25.86], [27.0, 28.31], [30.0, 32.63], [35.0, 37.69], [39.0, 39.04], [41.0, 42.99], [44.0, 44.66], [45.0, 45.23], [46.0, 51.8], [52.0, 53.42], [55.0, 55.46], [57.0, 57.86], [59.0, 59.49], [61.0, 61.99], [67.0, 67.37], [69.0, 71.86], [73.0, 106.74], [108.0, 108.7], [110.0, 111.28], [112.0, 112.28], [113.0, 114.34], [116.0, 118.08], [119.0, 125.49], [126.0, 127.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.94, 0.0, 0.0, 99.1, 0.0, 0.0, 56.18, 98.19, 0.0, 0.0, 0.0, 0.0, 54.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.11, 0.0, 0.0, 0.0, 0.0, 0.0, 56.18, 83.34, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.83, 0.82, 1.4, 3.68, 1.86, 1.31, 2.63, 2.69, 0.04, 1.99, 0.66, 0.23, 5.8, 1.42, 0.46, 0.86, 0.49, 0.99, 0.37, 2.86, 33.74, 0.7, 1.28, 0.28, 1.34, 2.08, 6.49, 1.79]} \ No newline at end of file diff --git a/annotations_filtered/urbo6F_qD5k_filtered.json b/annotations_filtered/urbo6F_qD5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d1a7f1a06048e87d18356031baf5b0c8ab9b84b --- /dev/null +++ b/annotations_filtered/urbo6F_qD5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.29], [5.0, 5.37], [8.0, 8.65], [10.0, 10.45], [15.0, 16.07], [17.0, 24.12], [25.0, 26.2], [29.0, 29.0], [31.0, 31.01], [35.0, 37.02], [42.0, 71.32], [72.0, 112.45], [117.0, 119.72], [122.0, 122.39], [128.0, 135.01], [137.0, 143.43], [147.0, 148.76], [149.0, 149.17], [149.0, 150.3], [152.0, 153.15]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, true, false, false, false, false], "silence_prob": [76.2, 0.0, 0.0, 0.0, 0.0, 79.94, 0.0, 0.0, 0.0, 29.44, 55.04, 0.0, 33.63, 0.0, 30.02, 29.98, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 11.72], ["vehicle", 8.82], ["buzz", 6.26]], null, null, [["fly, housefly", 28.12], ["insect", 10.88], ["music", 9.39]], null, [["music", 77.91], ["groan", 3.37], ["speech", 1.54]], [["livestock, farm animals, working animals", 34.27], ["cattle, bovinae", 20.66], ["moo", 8.34]], null, null, null, null], "duration": [2.29, 0.37, 0.65, 0.45, 1.07, 7.12, 1.2, 0.0, 0.01, 2.02, 29.32, 40.45, 2.72, 0.39, 7.01, 6.43, 1.76, 0.17, 1.3, 1.15]} \ No newline at end of file diff --git a/annotations_filtered/urdf4g-LXk4_filtered.json b/annotations_filtered/urdf4g-LXk4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84d1b1f08e19e2ec1aa0455fea4947579c0f47db --- /dev/null +++ b/annotations_filtered/urdf4g-LXk4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.64], [11.0, 13.15], [14.0, 14.23], [15.0, 14.82], [19.0, 21.37], [25.0, 25.78], [32.0, 33.69], [36.0, 35.83], [39.0, 41.4], [47.0, 47.75], [53.0, 55.24], [61.0, 61.74], [68.0, 67.71], [68.0, 68.34], [68.0, 68.64], [73.0, 74.58], [76.0, 76.38], [79.0, 80.67], [81.0, 83.22], [88.0, 89.21], [95.0, 95.91], [100.0, 101.93], [103.0, 104.28], [106.0, 110.32], [114.0, 117.78], [119.0, 118.91], [125.0, 124.82], [125.0, 126.25], [127.0, 127.53]], "keep_status": [false, true, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 33.06, 0.0, 0.0, 32.17, 0.0, 0.0, 0.0, 33.11, 0.0, 32.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.32, 0.0, 0.0, 0.0, 0.0, 31.52, 31.64, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["fly, housefly", 27.85], ["insect", 24.59], ["bee, wasp, etc.", 8.1]], null, null, [["livestock, farm animals, working animals", 29.94], ["moo", 28.52], ["cattle, bovinae", 23.65]], null, null, null, [["speech", 42.41], ["vehicle", 7.08], ["hubbub, speech noise, speech babble", 5.53]], null, [["livestock, farm animals, working animals", 35.02], ["insect", 18.51], ["cattle, bovinae", 14.83]], null, null, null, null, null, null, null, [["fly, housefly", 55.85], ["insect", 19.88], ["mosquito", 16.19]], null, null, null, null, [["speech", 52.27], ["radio", 13.12], ["sidetone", 3.15]], [["livestock, farm animals, working animals", 28.19], ["speech", 22.22], ["cattle, bovinae", 8.85]], null, null, null, null], "duration": [1.64, 2.15, 0.23, -0.18, 2.37, 0.78, 1.69, -0.17, 2.4, 0.75, 2.24, 0.74, -0.29, 0.34, 0.64, 1.58, 0.38, 1.67, 2.22, 1.21, 0.91, 1.93, 1.28, 4.32, 3.78, -0.09, -0.18, 1.25, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/urnRVr1P2bc_filtered.json b/annotations_filtered/urnRVr1P2bc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3e1e5924537cf54436df756c02a4554d82422dc --- /dev/null +++ b/annotations_filtered/urnRVr1P2bc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.03], [13.0, 12.9], [13.0, 13.36], [13.0, 13.39], [13.0, 31.26], [32.0, 37.64], [42.0, 62.51], [64.0, 73.04]], "keep_status": [false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 47.23, 44.26, 44.81, 43.15], "audiomae_on_audioset": [null, null, null, null, [["music", 45.03], ["livestock, farm animals, working animals", 7.46], ["cattle, bovinae", 6.73]], [["music", 50.27], ["wind instrument, woodwind instrument", 6.18], ["synthesizer", 6.06]], [["music", 64.99], ["musical instrument", 3.43], ["brass instrument", 3.11]], [["music", 66.68], ["bleat", 5.04], ["sheep", 4.54]]], "duration": [0.03, -0.1, 0.36, 0.39, 18.26, 5.64, 20.51, 9.04]} \ No newline at end of file diff --git a/annotations_filtered/us54vk5--jM_filtered.json b/annotations_filtered/us54vk5--jM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f37b9ae87972bcc4216719a20e6ccceb83700be --- /dev/null +++ b/annotations_filtered/us54vk5--jM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 25.69], [36.0, 38.1], [47.0, 49.71], [51.0, 51.44], [61.0, 61.86], [67.0, 67.26], [68.0, 69.18], [74.0, 75.2], [77.0, 77.18], [79.0, 79.57], [81.0, 82.22], [88.0, 90.85], [95.0, 95.01], [96.0, 96.57], [100.0, 100.38], [102.0, 102.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 51.44, 53.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.69, 2.1, 2.71, 0.44, 0.86, 0.26, 1.18, 1.2, 0.18, 0.57, 1.22, 2.85, 0.01, 0.57, 0.38, 0.81]} \ No newline at end of file diff --git a/annotations_filtered/usWA4j2ED_Q_filtered.json b/annotations_filtered/usWA4j2ED_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72713c4698f601d7e488b4d8138aa4fd88854af1 --- /dev/null +++ b/annotations_filtered/usWA4j2ED_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.53], [13.0, 14.66], [32.0, 32.97], [42.0, 43.14], [81.0, 82.39], [95.0, 95.15], [115.0, 116.61]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.53, 1.66, 0.97, 1.14, 1.39, 0.15, 1.61]} \ No newline at end of file diff --git a/annotations_filtered/us_GLuu2SAc_filtered.json b/annotations_filtered/us_GLuu2SAc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8dcc0fbac6e3b71ae3c7690282fb8f544b3ae162 --- /dev/null +++ b/annotations_filtered/us_GLuu2SAc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.25], [25.0, 46.85], [63.0, 63.29]], "keep_status": [false, false, false], "silence_prob": [0.0, 31.3, 0.0], "audiomae_on_audioset": [null, [["music", 73.16], ["trance music", 3.64], ["electronic music", 2.94]], null], "duration": [0.25, 21.85, 0.29]} \ No newline at end of file diff --git a/annotations_filtered/usmBCn2WxYU_filtered.json b/annotations_filtered/usmBCn2WxYU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f18c93ec816edfa7c320353bd5fb429e2ddae5a --- /dev/null +++ b/annotations_filtered/usmBCn2WxYU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 19.33], [22.0, 26.3], [29.0, 31.21], [32.0, 55.49], [59.0, 79.39], [82.0, 110.67], [112.0, 118.61], [121.0, 156.78]], "keep_status": [true, true, true, false, false, false, true, false], "silence_prob": [29.03, 30.02, 30.78, 31.57, 29.86, 29.98, 30.27, 0.0], "audiomae_on_audioset": [[["music", 51.0], ["cacophony", 11.87], ["theremin", 3.93]], [["music", 13.05], ["motorcycle", 10.17], ["vehicle", 9.16]], [["speech", 28.68], ["music", 25.87], ["hum", 11.95]], [["hum", 48.31], ["throbbing", 37.93], ["music", 7.27]], [["music", 44.41], ["throbbing", 32.6], ["hum", 11.17]], [["hum", 58.97], ["mains hum", 10.24], ["music", 9.4]], [["music", 40.34], ["speech", 9.33], ["groan", 3.74]], null], "duration": [4.33, 4.3, 2.21, 23.49, 20.39, 28.67, 6.61, 35.78]} \ No newline at end of file diff --git a/annotations_filtered/utFeHmJ1iUw_filtered.json b/annotations_filtered/utFeHmJ1iUw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/utFeHmJ1iUw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/utS5IxGpAPI_filtered.json b/annotations_filtered/utS5IxGpAPI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09dfdcbc710d06ce03616b333fe8307ca9c3c56a --- /dev/null +++ b/annotations_filtered/utS5IxGpAPI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.18], [13.0, 13.31], [16.0, 15.99], [25.0, 28.38], [37.0, 38.03], [42.0, 42.67], [49.0, 50.57], [52.0, 52.52], [55.0, 55.49], [58.0, 58.18], [68.0, 68.1], [73.0, 73.2], [74.0, 75.78], [82.0, 83.88], [85.0, 86.83], [91.0, 92.97], [94.0, 95.71], [98.0, 99.35], [106.0, 108.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.36, 0.0, 0.0, 80.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.18, 0.31, -0.01, 3.38, 1.03, 0.67, 1.57, 0.52, 0.49, 0.18, 0.1, 0.2, 1.78, 1.88, 1.83, 1.97, 1.71, 1.35, 2.58]} \ No newline at end of file diff --git a/annotations_filtered/utYsQTUae5w_filtered.json b/annotations_filtered/utYsQTUae5w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9cc11580a9c96ce088ed9c89795e701f7f550e8 --- /dev/null +++ b/annotations_filtered/utYsQTUae5w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 20.92], [29.0, 29.05], [43.0, 44.69], [52.0, 53.97], [56.0, 56.32], [63.0, 63.24], [70.0, 72.37], [75.0, 75.22], [80.0, 87.05], [88.0, 88.38], [90.0, 90.56], [93.0, 94.54]], "keep_status": [true, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [31.07, 0.0, 0.0, 0.0, 0.0, 0.0, 32.72, 0.0, 32.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 30.91], ["whip", 9.61], ["explosion", 7.58]], null, null, null, null, null, [["fart", 32.03], ["speech", 17.77], ["sidetone", 5.2]], null, [["speech", 20.59], ["gunshot, gunfire", 15.64], ["artillery fire", 10.64]], null, null, null], "duration": [2.92, 0.05, 1.69, 1.97, 0.32, 0.24, 2.37, 0.22, 7.05, 0.38, 0.56, 1.54]} \ No newline at end of file diff --git a/annotations_filtered/ut_z2-96X0o_filtered.json b/annotations_filtered/ut_z2-96X0o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b422d84f9a6a1662a4383ef7da5c307f623afd0e --- /dev/null +++ b/annotations_filtered/ut_z2-96X0o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 16.01], [17.0, 21.19], [22.0, 28.97], [30.0, 30.45], [31.0, 32.64], [33.0, 36.48], [38.0, 40.34], [41.0, 41.08], [43.0, 42.92], [44.0, 51.0], [52.0, 52.47], [54.0, 53.55], [54.0, 54.33], [55.0, 55.65], [56.0, 57.42], [58.0, 59.73], [61.0, 61.08], [62.0, 63.81], [65.0, 66.93], [68.0, 68.08], [69.0, 69.53], [71.0, 71.31], [72.0, 78.87], [79.0, 79.47], [80.0, 81.31], [82.0, 82.27], [83.0, 83.4], [84.0, 84.59], [85.0, 86.76], [87.0, 90.32], [91.0, 91.71], [93.0, 93.82], [95.0, 96.72], [98.0, 99.4], [101.0, 102.15], [103.0, 103.64], [104.0, 104.62], [105.0, 114.34], [117.0, 118.94], [119.0, 120.33], [121.0, 122.18], [123.0, 125.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.99, 47.58, 100.0, 0.0, 0.0, 81.17, 50.97, 0.0, 0.0, 95.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.9, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, [["sidetone", 44.79], ["speech", 15.65], ["mains hum", 11.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.01, 4.19, 6.97, 0.45, 1.64, 3.48, 2.34, 0.08, -0.08, 7.0, 0.47, -0.45, 0.33, 0.65, 1.42, 1.73, 0.08, 1.81, 1.93, 0.08, 0.53, 0.31, 6.87, 0.47, 1.31, 0.27, 0.4, 0.59, 1.76, 3.32, 0.71, 0.82, 1.72, 1.4, 1.15, 0.64, 0.62, 9.34, 1.94, 1.33, 1.18, 2.83]} \ No newline at end of file diff --git a/annotations_filtered/uta8BACjLNk_filtered.json b/annotations_filtered/uta8BACjLNk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dcd0f08813a6f03bde74578fb4740dfe90abaf6b --- /dev/null +++ b/annotations_filtered/uta8BACjLNk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.62], [7.0, 7.65], [8.0, 9.02], [10.0, 12.82], [14.0, 14.94], [18.0, 19.16], [20.0, 21.34], [23.0, 23.31], [24.0, 24.11], [26.0, 26.13], [35.0, 35.56], [38.0, 39.72], [42.0, 43.19], [45.0, 44.9], [49.0, 49.59], [54.0, 55.07], [56.0, 56.12], [57.0, 59.7], [60.0, 60.49], [61.0, 62.36], [63.0, 64.4], [69.0, 69.55], [72.0, 72.1], [74.0, 74.36], [80.0, 79.64], [84.0, 84.21], [92.0, 92.26], [107.0, 107.08], [110.0, 109.58], [111.0, 111.15], [112.0, 111.91], [113.0, 114.98], [116.0, 117.0], [121.0, 121.73], [122.0, 123.63], [128.0, 129.09], [131.0, 131.82], [134.0, 134.57], [136.0, 139.97], [140.0, 140.75], [144.0, 144.12], [145.0, 146.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 76.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.85, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.16], ["music", 24.99], ["burst, pop", 5.97]], null, null, null], "duration": [-0.38, 0.65, 1.02, 2.82, 0.94, 1.16, 1.34, 0.31, 0.11, 0.13, 0.56, 1.72, 1.19, -0.1, 0.59, 1.07, 0.12, 2.7, 0.49, 1.36, 1.4, 0.55, 0.1, 0.36, -0.36, 0.21, 0.26, 0.08, -0.42, 0.15, -0.09, 1.98, 1.0, 0.73, 1.63, 1.09, 0.82, 0.57, 3.97, 0.75, 0.12, 1.43]} \ No newline at end of file diff --git a/annotations_filtered/uu-RxCqop98_filtered.json b/annotations_filtered/uu-RxCqop98_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..081073e244ede6b0fa6a03294ae5481969cacd56 --- /dev/null +++ b/annotations_filtered/uu-RxCqop98_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.83], [8.0, 38.16], [40.0, 42.45], [46.0, 46.8], [49.0, 73.01], [74.0, 80.87], [83.0, 91.77], [94.0, 104.25], [107.0, 108.33]], "keep_status": [false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 34.97, 0.0, 35.01, 65.67, 63.42, 48.95, 0.0], "audiomae_on_audioset": [null, null, [["music", 44.2], ["mains hum", 20.77], ["hum", 18.01]], null, [["music", 62.08], ["animal", 8.9], ["foghorn", 3.86]], null, null, [["music", 48.51], ["speech", 5.09], ["musical instrument", 4.46]], null], "duration": [1.83, 30.16, 2.45, 0.8, 24.01, 6.87, 8.77, 10.25, 1.33]} \ No newline at end of file diff --git a/annotations_filtered/uu4tB54Uw5I_filtered.json b/annotations_filtered/uu4tB54Uw5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b144bc98b1e2195bb4fe64186abadb8c3e2d1769 --- /dev/null +++ b/annotations_filtered/uu4tB54Uw5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.32], [8.0, 10.74], [11.0, 30.75], [38.0, 38.21], [40.0, 40.14], [42.0, 43.24], [47.0, 49.15], [50.0, 54.95], [56.0, 56.62], [59.0, 61.6], [63.0, 63.71], [65.0, 100.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [55.46, 50.16, 39.3, 0.0, 0.0, 0.0, 74.29, 63.31, 0.0, 58.22, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 69.92], ["ambient music", 4.99], ["electronic music", 3.87]], null, null, null, null, null, null, null, null, null], "duration": [2.32, 2.74, 19.75, 0.21, 0.14, 1.24, 2.15, 4.95, 0.62, 2.6, 0.71, 35.95]} \ No newline at end of file diff --git a/annotations_filtered/uuNy1Ibdk_Y_filtered.json b/annotations_filtered/uuNy1Ibdk_Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6254876eac6c39709a4fcf476d6366c9798823fe --- /dev/null +++ b/annotations_filtered/uuNy1Ibdk_Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [11.0, 10.94], [13.0, 21.93], [25.0, 28.58], [36.0, 36.41], [37.0, 55.29], [58.0, 60.03], [62.0, 63.29], [64.0, 65.04], [68.0, 76.28], [76.0, 76.54], [79.0, 81.73], [83.0, 84.2], [97.0, 97.71], [111.0, 112.82], [125.0, 126.62], [132.0, 133.42], [142.0, 146.75], [155.0, 156.78], [160.0, 159.76]], "keep_status": [false, false, true, true, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 47.01, 33.65, 0.0, 30.91, 99.85, 0.0, 0.0, 34.29, 0.0, 38.26, 0.0, 0.0, 0.0, 0.0, 0.0, 39.01, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 57.35], ["synthesizer", 6.97], ["singing bowl", 5.17]], [["speech", 49.89], ["music", 12.2], ["zipper (clothing)", 6.23]], null, [["music", 48.66], ["electric shaver, electric razor", 11.91], ["speech", 7.92]], null, null, null, [["cattle, bovinae", 15.23], ["livestock, farm animals, working animals", 13.53], ["music", 13.3]], null, [["music", 57.89], ["synthesizer", 6.74], ["drum machine", 6.2]], null, null, null, null, null, [["music", 43.42], ["throbbing", 21.44], ["hum", 18.3]], null, null], "duration": [0.5, -0.06, 8.93, 3.58, 0.41, 18.29, 2.03, 1.29, 1.04, 8.28, 0.54, 2.73, 1.2, 0.71, 1.82, 1.62, 1.42, 4.75, 1.78, -0.24]} \ No newline at end of file diff --git a/annotations_filtered/uuTeJ6tbyB4_filtered.json b/annotations_filtered/uuTeJ6tbyB4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7cdc8a2c685ce73df6f2de28bf817e592acfd65 --- /dev/null +++ b/annotations_filtered/uuTeJ6tbyB4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 65.94], [67.0, 69.13], [70.0, 72.03], [74.0, 75.78], [105.0, 105.33], [108.0, 109.56], [111.0, 111.37], [113.0, 113.07], [114.0, 120.02], [122.0, 126.59], [127.0, 129.59], [131.0, 131.46], [135.0, 135.57], [137.0, 137.71], [141.0, 141.96], [143.0, 144.02], [146.0, 146.94], [151.0, 152.91], [155.0, 155.9], [157.0, 157.25], [158.0, 158.92], [160.0, 161.22], [167.0, 167.31], [168.0, 168.44]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.94, 40.29, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 100.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["echo", 20.81], ["music", 12.6], ["synthesizer", 7.62]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [32.94, 2.13, 2.03, 1.78, 0.33, 1.56, 0.37, 0.07, 6.02, 4.59, 2.59, 0.46, 0.57, 0.71, 0.96, 1.02, 0.94, 1.91, 0.9, 0.25, 0.92, 1.22, 0.31, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/uuWIaDATbnE_filtered.json b/annotations_filtered/uuWIaDATbnE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46ce7ce40a9bd8ec714fc6d5ec6b63b4717269ee --- /dev/null +++ b/annotations_filtered/uuWIaDATbnE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.69], [10.0, 12.24], [30.0, 30.84], [35.0, 35.04], [54.0, 54.51], [55.0, 56.22], [57.0, 57.33], [59.0, 59.39], [66.0, 67.59], [83.0, 83.29], [89.0, 89.87], [105.0, 106.14], [107.0, 113.64], [114.0, 116.75], [124.0, 124.48], [129.0, 130.08]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.4, 31.09, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 39.58], ["throbbing", 23.81], ["hum", 5.82]], null, null, null, null, null, null, null, null, null, null, [["music", 46.56], ["speech", 25.24], ["frog", 2.86]], [["moo", 41.93], ["cattle, bovinae", 38.16], ["livestock, farm animals, working animals", 13.49]], null, null], "duration": [-0.31, 2.24, 0.84, 0.04, 0.51, 1.22, 0.33, 0.39, 1.59, 0.29, 0.87, 1.14, 6.64, 2.75, 0.48, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/uuYTVl0iOkk_filtered.json b/annotations_filtered/uuYTVl0iOkk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58835fc386483298a15f2186827ccf0352a85d4a --- /dev/null +++ b/annotations_filtered/uuYTVl0iOkk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.82], [21.0, 21.44], [23.0, 22.94], [25.0, 25.93], [30.0, 32.59], [35.0, 38.96], [39.0, 39.61], [41.0, 41.89], [42.0, 44.51], [47.0, 47.38], [48.0, 49.32], [51.0, 56.4], [59.0, 59.78], [61.0, 61.42], [62.0, 62.4], [63.0, 66.24], [69.0, 71.83], [82.0, 82.48]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 82.97, 55.18, 0.0, 0.0, 38.58, 0.0, 0.0, 35.37, 0.0, 0.0, 0.0, 37.62, 35.54, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["fly, housefly", 22.44], ["mosquito", 22.08], ["insect", 9.35]], null, null, [["hum", 24.68], ["sidetone", 18.39], ["noise", 12.33]], null, null, null, [["electric shaver, electric razor", 19.42], ["mains hum", 17.63], ["hum", 8.43]], [["frog", 26.5], ["animal", 20.87], ["roar", 9.09]], null], "duration": [1.82, 0.44, -0.06, 0.93, 2.59, 3.96, 0.61, 0.89, 2.51, 0.38, 1.32, 5.4, 0.78, 0.42, 0.4, 3.24, 2.83, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/uvAd-GbYBVw_filtered.json b/annotations_filtered/uvAd-GbYBVw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbcd746f16e09599be9e8c6cfb14bb124a0c8b2c --- /dev/null +++ b/annotations_filtered/uvAd-GbYBVw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 12.92], [16.0, 36.86], [38.0, 38.92], [40.0, 40.69], [42.0, 59.81], [63.0, 64.62], [72.0, 76.72], [79.0, 80.7], [93.0, 93.16], [96.0, 95.89], [107.0, 119.37], [123.0, 130.06], [131.0, 133.29], [139.0, 143.63], [145.0, 147.34], [148.0, 151.36], [154.0, 169.96], [171.0, 173.79]], "keep_status": [true, false, false, false, true, false, false, false, false, false, true, false, true, false, false, true, false, true], "silence_prob": [38.1, 36.89, 0.0, 0.0, 42.22, 0.0, 36.94, 0.0, 0.0, 0.0, 29.45, 29.88, 43.45, 59.77, 72.9, 29.57, 55.46, 47.78], "audiomae_on_audioset": [[["music", 24.79], ["hum", 22.52], ["speech", 11.02]], [["hum", 28.94], ["mains hum", 28.55], ["speech", 16.26]], null, null, [["speech", 38.83], ["music", 12.35], ["hum", 10.5]], null, [["speech", 47.32], ["music", 21.89], ["hum", 6.09]], null, null, null, [["music", 33.21], ["speech", 30.75], ["boing", 5.37]], [["music", 52.48], ["speech", 20.01], ["throbbing", 9.15]], [["music", 13.75], ["moo", 12.42], ["hum", 11.59]], null, null, [["groan", 12.36], ["whack, thwack", 11.26], ["cattle, bovinae", 7.83]], null, [["speech", 14.61], ["music", 9.68], ["sine wave", 5.75]]], "duration": [6.92, 20.86, 0.92, 0.69, 17.81, 1.62, 4.72, 1.7, 0.16, -0.11, 12.37, 7.06, 2.29, 4.63, 2.34, 3.36, 15.96, 2.79]} \ No newline at end of file diff --git a/annotations_filtered/uvFc0EPRSI4_filtered.json b/annotations_filtered/uvFc0EPRSI4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ad77d44036fd378f2489518844a9a7284ebbf0a --- /dev/null +++ b/annotations_filtered/uvFc0EPRSI4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.39], [16.0, 21.51], [22.0, 21.9], [27.0, 27.45], [28.0, 28.68], [29.0, 29.88], [31.0, 39.6], [45.0, 46.87], [48.0, 57.52], [65.0, 65.5], [66.0, 65.7], [67.0, 80.99], [86.0, 91.47], [96.0, 106.2], [108.0, 119.23], [121.0, 123.33]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 31.77, 0.0, 0.0, 0.0, 0.0, 32.58, 0.0, 32.02, 0.0, 0.0, 32.87, 34.71, 32.34, 33.53, 37.91], "audiomae_on_audioset": [null, [["music", 34.16], ["cacophony", 19.12], ["speech", 6.48]], null, null, null, null, [["speech", 35.11], ["music", 34.47], ["musical instrument", 4.63]], null, [["speech", 31.29], ["sidetone", 27.17], ["music", 19.7]], null, null, [["music", 48.3], ["speech", 26.44], ["cacophony", 5.51]], [["music", 64.68], ["throbbing", 7.54], ["hum", 6.36]], [["music", 79.89], ["speech", 7.41], ["hum", 1.61]], [["speech", 55.63], ["music", 30.76], ["explosion", 2.65]], [["speech", 46.02], ["music", 11.74], ["crowd", 5.86]]], "duration": [0.39, 5.51, -0.1, 0.45, 0.68, 0.88, 8.6, 1.87, 9.52, 0.5, -0.3, 13.99, 5.47, 10.2, 11.23, 2.33]} \ No newline at end of file diff --git a/annotations_filtered/uvIZ4ST6HqE_filtered.json b/annotations_filtered/uvIZ4ST6HqE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..68685eb0d878d481e37cf1b40682ec81669092b5 --- /dev/null +++ b/annotations_filtered/uvIZ4ST6HqE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.85], [17.0, 19.28], [21.0, 21.47], [22.0, 22.22], [28.0, 30.37], [37.0, 38.7], [40.0, 40.98], [41.0, 41.59], [56.0, 56.84], [60.0, 62.61], [65.0, 66.01], [78.0, 78.16], [90.0, 91.34], [92.0, 93.23], [94.0, 93.97], [98.0, 99.13], [102.0, 103.27], [110.0, 109.93], [116.0, 117.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [67.13, 99.76, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 71.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.85, 2.28, 0.47, 0.22, 2.37, 1.7, 0.98, 0.59, 0.84, 2.61, 1.01, 0.16, 1.34, 1.23, -0.03, 1.13, 1.27, -0.07, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/uvPjPzmUC7w_filtered.json b/annotations_filtered/uvPjPzmUC7w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c04a29713f230bbfa2b0098b24dcd8cee988d693 --- /dev/null +++ b/annotations_filtered/uvPjPzmUC7w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 19.68], [21.0, 23.14], [25.0, 25.3], [34.0, 34.42], [41.0, 42.6], [43.0, 44.1], [49.0, 53.49]], "keep_status": [false, true, false, false, false, false, true], "silence_prob": [29.38, 32.1, 0.0, 0.0, 0.0, 0.0, 31.78], "audiomae_on_audioset": [[["music", 58.44], ["theremin", 8.02], ["buzz", 5.97]], [["music", 31.46], ["throbbing", 15.79], ["hum", 8.72]], null, null, null, null, [["music", 38.44], ["musical instrument", 10.43], ["guitar", 8.74]]], "duration": [12.68, 2.14, 0.3, 0.42, 1.6, 1.1, 4.49]} \ No newline at end of file diff --git a/annotations_filtered/uvQFoM1fj0E_filtered.json b/annotations_filtered/uvQFoM1fj0E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f49060a26506f08a338271901f2eb096b1641592 --- /dev/null +++ b/annotations_filtered/uvQFoM1fj0E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.03], [14.0, 16.97], [25.0, 26.22], [28.0, 30.62], [34.0, 35.7], [39.0, 41.03], [48.0, 49.08], [52.0, 53.5], [61.0, 62.36], [68.0, 69.67], [71.0, 70.82], [73.0, 74.38], [75.0, 82.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 96.29, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.03, 2.97, 1.22, 2.62, 1.7, 2.03, 1.08, 1.5, 1.36, 1.67, -0.18, 1.38, 7.98]} \ No newline at end of file diff --git a/annotations_filtered/uvUH_niF-Zo_filtered.json b/annotations_filtered/uvUH_niF-Zo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4f64a8b6255e80f892db56933bc959cfafbf845 --- /dev/null +++ b/annotations_filtered/uvUH_niF-Zo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.86], [17.0, 19.2], [22.0, 32.91], [33.0, 41.77], [43.0, 43.44], [44.0, 44.63], [49.0, 50.03], [51.0, 51.9], [52.0, 52.89], [57.0, 57.92], [61.0, 63.04], [63.0, 66.28], [71.0, 71.37], [74.0, 82.21], [84.0, 85.94], [90.0, 93.02], [95.0, 100.3], [102.0, 106.64], [109.0, 109.61], [110.0, 113.59], [115.0, 118.71]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.0, 53.91, 39.21, 61.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.53, 43.64, 0.0, 53.47, 0.0, 95.37, 98.1, 97.0, 0.0, 66.63, 84.43], "audiomae_on_audioset": [null, null, [["thunk", 33.11], ["fly, housefly", 14.45], ["insect", 7.87]], null, null, null, null, null, null, null, null, [["speech", 39.12], ["sidetone", 34.23], ["chirp tone", 2.79]], null, null, null, null, null, null, null, null, null], "duration": [2.86, 2.2, 10.91, 8.77, 0.44, 0.63, 1.03, 0.9, 0.89, 0.92, 2.04, 3.28, 0.37, 8.21, 1.94, 3.02, 5.3, 4.64, 0.61, 3.59, 3.71]} \ No newline at end of file diff --git a/annotations_filtered/uvXwt5HNFLU_filtered.json b/annotations_filtered/uvXwt5HNFLU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7aeda9470ca4910317c952b09b4db89d96e67afa --- /dev/null +++ b/annotations_filtered/uvXwt5HNFLU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.12], [3.0, 3.16], [4.0, 4.36], [9.0, 9.68], [11.0, 13.56], [19.0, 19.99], [24.0, 25.37], [26.0, 26.59], [27.0, 28.43], [31.0, 31.11], [32.0, 34.42], [35.0, 36.71], [37.0, 38.91], [40.0, 41.84], [43.0, 43.78], [44.0, 44.59], [47.0, 48.78], [51.0, 52.03], [53.0, 57.3], [58.0, 60.54], [62.0, 64.0], [70.0, 70.17], [72.0, 72.57], [74.0, 74.44], [75.0, 75.96], [80.0, 81.6], [84.0, 85.14], [90.0, 90.66], [94.0, 100.55], [105.0, 108.72], [114.0, 114.05], [115.0, 115.96], [118.0, 118.44], [119.0, 120.16], [121.0, 121.32], [122.0, 123.97], [134.0, 135.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 45.36, 99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.62, 33.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 49.94], ["telephone", 24.96], ["sidetone", 13.91]], null, null, null, null, null, null, null, null, [["music", 45.88], ["noise", 6.74], ["synthesizer", 4.54]], [["tuning fork", 17.86], ["speech", 11.97], ["boing", 11.08]], null, null, null, null, null, null, null], "duration": [0.12, 0.16, 0.36, 0.68, 2.56, 0.99, 1.37, 0.59, 1.43, 0.11, 2.42, 1.71, 1.91, 1.84, 0.78, 0.59, 1.78, 1.03, 4.3, 2.54, 2.0, 0.17, 0.57, 0.44, 0.96, 1.6, 1.14, 0.66, 6.55, 3.72, 0.05, 0.96, 0.44, 1.16, 0.32, 1.97, 1.62]} \ No newline at end of file diff --git a/annotations_filtered/uvZImlL51Io_filtered.json b/annotations_filtered/uvZImlL51Io_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b1ebbdcc1de9abd3519ebf2d56af2941da073c3 --- /dev/null +++ b/annotations_filtered/uvZImlL51Io_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.41], [23.0, 23.45], [23.0, 23.52], [24.0, 87.12], [92.0, 104.33], [105.0, 108.26], [109.0, 109.85], [111.0, 111.89]], "keep_status": [false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.51, 32.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["mains hum", 29.87], ["hum", 29.43], ["music", 19.51]], [["speech", 53.04], ["cacophony", 7.31], ["vehicle", 6.84]], null, null], "duration": [0.41, 0.45, 0.52, 63.12, 12.33, 3.26, 0.85, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/uw63_YyNsF4_filtered.json b/annotations_filtered/uw63_YyNsF4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..962afa414d6caeda945ab02d1d194197c6e1598e --- /dev/null +++ b/annotations_filtered/uw63_YyNsF4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.76], [4.0, 3.86], [5.0, 5.66], [8.0, 8.29], [9.0, 9.51], [11.0, 11.77], [13.0, 13.32], [24.0, 24.9], [28.0, 29.81], [31.0, 31.41], [36.0, 36.02], [38.0, 38.69], [43.0, 43.83], [46.0, 46.04], [48.0, 48.2], [53.0, 54.46], [55.0, 59.04], [60.0, 60.1], [68.0, 68.32], [71.0, 71.73], [72.0, 72.71], [76.0, 77.23], [78.0, 78.63], [79.0, 79.73], [83.0, 83.69], [86.0, 87.05], [88.0, 88.65], [91.0, 91.66], [94.0, 94.47], [96.0, 96.53], [102.0, 101.82], [104.0, 103.77], [106.0, 106.59], [111.0, 110.76], [111.0, 111.75], [113.0, 113.53], [117.0, 117.05], [118.0, 117.96], [118.0, 118.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.76, -0.14, 0.66, 0.29, 0.51, 0.77, 0.32, 0.9, 1.81, 0.41, 0.02, 0.69, 0.83, 0.04, 0.2, 1.46, 4.04, 0.1, 0.32, 0.73, 0.71, 1.23, 0.63, 0.73, 0.69, 1.05, 0.65, 0.66, 0.47, 0.53, -0.18, -0.23, 0.59, -0.24, 0.75, 0.53, 0.05, -0.04, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/uw7rRlJvEl4_filtered.json b/annotations_filtered/uw7rRlJvEl4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..019e84a80931fbf5fe992dd0e5be4f0d4d3ad498 --- /dev/null +++ b/annotations_filtered/uw7rRlJvEl4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 91.39]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [62.39]} \ No newline at end of file diff --git a/annotations_filtered/uwV4iMoc7xg_filtered.json b/annotations_filtered/uwV4iMoc7xg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..458cb1e961dd054f786b47c5dce8f61bd5b8049d --- /dev/null +++ b/annotations_filtered/uwV4iMoc7xg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.99], [10.0, 15.75], [17.0, 21.27], [23.0, 26.1], [27.0, 27.62], [29.0, 29.84], [31.0, 33.2], [37.0, 38.3], [39.0, 42.23], [43.0, 44.1], [45.0, 46.16], [48.0, 48.84], [50.0, 52.03]], "keep_status": [true, true, true, true, false, false, false, false, true, false, false, false, true], "silence_prob": [43.38, 44.15, 45.18, 45.72, 0.0, 0.0, 52.05, 0.0, 43.03, 0.0, 0.0, 0.0, 41.1], "audiomae_on_audioset": [[["hum", 24.21], ["throbbing", 20.33], ["music", 11.66]], [["hum", 16.61], ["music", 15.34], ["throbbing", 11.33]], [["wind chime", 17.45], ["speech", 12.47], ["chime", 8.17]], [["wind chime", 23.91], ["chime", 9.65], ["vehicle", 7.96]], null, null, null, null, [["wind chime", 30.83], ["chime", 20.08], ["noise", 5.44]], null, null, null, [["whale vocalization", 31.07], ["hum", 13.23], ["mains hum", 5.11]]], "duration": [5.99, 5.75, 4.27, 3.1, 0.62, 0.84, 2.2, 1.3, 3.23, 1.1, 1.16, 0.84, 2.03]} \ No newline at end of file diff --git a/annotations_filtered/uwcJaUaVfR0_filtered.json b/annotations_filtered/uwcJaUaVfR0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83036fbe415ed66287218f97c12b9db2987b2a02 --- /dev/null +++ b/annotations_filtered/uwcJaUaVfR0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.49], [8.0, 9.15], [12.0, 12.8], [14.0, 15.13], [17.0, 16.71], [20.0, 20.39], [21.0, 22.35], [31.0, 31.65], [36.0, 37.52], [42.0, 42.42], [44.0, 45.25], [51.0, 53.25], [58.0, 61.16], [62.0, 62.5], [63.0, 74.38], [77.0, 77.72], [81.0, 82.53], [84.0, 84.45], [87.0, 88.5], [95.0, 95.77], [101.0, 104.21], [106.0, 107.49], [110.0, 110.4], [111.0, 111.62], [116.0, 116.46], [119.0, 119.55], [121.0, 121.46], [124.0, 125.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [43.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.78, 36.9, 0.0, 41.01, 0.0, 0.0, 0.0, 0.0, 0.0, 37.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 53.38], ["electronic music", 9.24], ["throbbing", 8.13]], null, null, null, null, null, null, null, null, null, null, [["music", 12.19], ["gong", 8.81], ["didgeridoo", 7.55]], [["speech", 46.24], ["rumble", 10.06], ["whale vocalization", 6.32]], null, [["rumble", 40.24], ["hum", 10.7], ["buzz", 9.81]], null, null, null, null, null, [["music", 22.23], ["ambient music", 13.49], ["hum", 13.04]], null, null, null, null, null, null, null], "duration": [2.49, 1.15, 0.8, 1.13, -0.29, 0.39, 1.35, 0.65, 1.52, 0.42, 1.25, 2.25, 3.16, 0.5, 11.38, 0.72, 1.53, 0.45, 1.5, 0.77, 3.21, 1.49, 0.4, 0.62, 0.46, 0.55, 0.46, 1.51]} \ No newline at end of file diff --git a/annotations_filtered/ux9JHznPT8E_filtered.json b/annotations_filtered/ux9JHznPT8E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..03cd94e2f5e6d5fd728216229580a0e8c849ea57 --- /dev/null +++ b/annotations_filtered/ux9JHznPT8E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.64], [6.0, 6.89], [8.0, 8.13], [10.0, 11.1], [13.0, 13.63], [15.0, 27.97], [29.0, 29.19], [31.0, 32.58], [35.0, 35.92], [38.0, 38.58], [42.0, 43.07], [45.0, 45.18], [46.0, 47.06], [48.0, 49.52], [56.0, 73.92], [78.0, 88.32], [91.0, 118.79], [121.0, 121.46], [124.0, 124.66], [128.0, 128.82], [135.0, 135.89], [137.0, 138.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.34, 56.86, 50.76, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.64, 0.89, 0.13, 1.1, 0.63, 12.97, 0.19, 1.58, 0.92, 0.58, 1.07, 0.18, 1.06, 1.52, 17.92, 10.32, 27.79, 0.46, 0.66, 0.82, 0.89, 1.77]} \ No newline at end of file diff --git a/annotations_filtered/uxXMshs5exs_filtered.json b/annotations_filtered/uxXMshs5exs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09bf460fcf086d3df8f52a0b58cd5136bdd033e4 --- /dev/null +++ b/annotations_filtered/uxXMshs5exs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.9], [9.0, 9.56], [19.0, 19.72], [41.0, 40.91], [48.0, 48.37], [52.0, 52.79], [54.0, 55.38], [56.0, 57.7], [63.0, 62.82], [67.0, 67.39], [85.0, 85.85], [107.0, 107.5], [118.0, 117.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.9, 0.56, 0.72, -0.09, 0.37, 0.79, 1.38, 1.7, -0.18, 0.39, 0.85, 0.5, -0.12]} \ No newline at end of file diff --git a/annotations_filtered/uxhJ_E3LuNA_filtered.json b/annotations_filtered/uxhJ_E3LuNA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef16c502e85dfcff4262213118bcba47eecdddc0 --- /dev/null +++ b/annotations_filtered/uxhJ_E3LuNA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.52], [4.0, 5.56], [9.0, 11.15], [11.0, 16.29], [19.0, 20.44], [21.0, 22.0], [23.0, 23.63], [27.0, 29.24], [30.0, 31.38], [32.0, 32.9], [34.0, 34.06], [34.0, 35.99], [37.0, 37.89], [42.0, 43.21], [45.0, 45.99], [46.0, 46.87], [48.0, 51.49], [54.0, 58.21], [59.0, 59.53], [62.0, 64.61], [65.0, 70.23], [77.0, 77.67], [78.0, 80.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.78, 91.98, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 92.15, 0.0, 100.0, 57.09, 0.0, 99.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.52, 1.56, 2.15, 5.29, 1.44, 1.0, 0.63, 2.24, 1.38, 0.9, 0.06, 1.99, 0.89, 1.21, 0.99, 0.87, 3.49, 4.21, 0.53, 2.61, 5.23, 0.67, 2.99]} \ No newline at end of file diff --git a/annotations_filtered/uxj3cKArYDI_filtered.json b/annotations_filtered/uxj3cKArYDI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..173feb9020126aa72fc2378333d78d411e9eea40 --- /dev/null +++ b/annotations_filtered/uxj3cKArYDI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.25], [6.0, 6.25], [17.0, 17.91], [36.0, 36.49], [39.0, 40.07], [41.0, 41.79], [43.0, 43.48], [48.0, 50.18], [54.0, 54.23], [58.0, 58.63], [90.0, 90.76], [109.0, 109.97], [115.0, 116.6], [120.0, 120.23], [127.0, 127.28], [131.0, 131.28], [137.0, 137.0], [194.0, 194.22], [204.0, 204.75], [225.0, 226.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["mains hum", 29.22], ["speech", 25.06], ["hum", 22.04]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.25, 0.25, 0.91, 0.49, 1.07, 0.79, 0.48, 2.18, 0.23, 0.63, 0.76, 0.97, 1.6, 0.23, 0.28, 0.28, 0.0, 0.22, 0.75, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/uxvN1tNASYo_filtered.json b/annotations_filtered/uxvN1tNASYo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f97b3b242aeee1dbf553be2ffa3b938875b4b94 --- /dev/null +++ b/annotations_filtered/uxvN1tNASYo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.14], [8.0, 8.18], [8.0, 12.8], [15.0, 23.36], [66.0, 73.94], [75.0, 74.95], [75.0, 77.99], [80.0, 91.13], [101.0, 102.29], [104.0, 116.6], [118.0, 119.06], [120.0, 124.53]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 30.09, 28.87, 29.93, 0.0, 29.78, 30.39, 0.0, 30.16, 0.0, 98.8], "audiomae_on_audioset": [null, null, [["music", 73.64], ["speech", 4.69], ["drum machine", 1.93]], [["music", 62.87], ["speech", 15.04], ["musical instrument", 4.43]], [["music", 82.96], ["speech", 3.9], ["throbbing", 1.61]], null, [["music", 83.79], ["speech", 2.15], ["crowd", 0.78]], [["music", 64.7], ["speech", 4.61], ["synthesizer", 3.15]], null, [["music", 57.73], ["theremin", 8.41], ["musical instrument", 2.68]], null, null], "duration": [0.14, 0.18, 4.8, 8.36, 7.94, -0.05, 2.99, 11.13, 1.29, 12.6, 1.06, 4.53]} \ No newline at end of file diff --git a/annotations_filtered/uy4F1IeShVA_filtered.json b/annotations_filtered/uy4F1IeShVA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43ef0a7152129523def8affaf7a7101240636b66 --- /dev/null +++ b/annotations_filtered/uy4F1IeShVA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 18.49], [20.0, 24.83], [25.0, 41.79], [42.0, 83.17], [83.0, 83.49], [85.0, 86.21], [87.0, 116.18], [116.0, 118.64], [122.0, 122.99], [124.0, 124.26], [127.0, 127.14]], "keep_status": [true, true, true, false, false, false, true, false, false, false, false], "silence_prob": [40.88, 39.35, 39.49, 0.0, 0.0, 0.0, 37.84, 59.68, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 41.54], ["theremin", 13.44], ["hum", 5.34]], [["music", 60.81], ["throbbing", 4.57], ["didgeridoo", 3.91]], [["music", 27.87], ["speech", 20.15], ["sidetone", 7.27]], null, null, null, [["music", 34.37], ["speech", 27.32], ["sidetone", 8.26]], null, null, null, null], "duration": [4.49, 4.83, 16.79, 41.17, 0.49, 1.21, 29.18, 2.64, 0.99, 0.26, 0.14]} \ No newline at end of file diff --git a/annotations_filtered/uy8_ARH8yyM_filtered.json b/annotations_filtered/uy8_ARH8yyM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26e20f196e6738ec97047de67ae1fe31fb991ac4 --- /dev/null +++ b/annotations_filtered/uy8_ARH8yyM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.28], [7.0, 7.55], [27.0, 26.72], [29.0, 29.62], [37.0, 37.56], [49.0, 49.86], [56.0, 55.7], [58.0, 58.6], [63.0, 63.37], [63.0, 63.49], [70.0, 70.92], [76.0, 75.81], [79.0, 79.51], [81.0, 82.65], [83.0, 89.24], [96.0, 96.25], [101.0, 101.41], [103.0, 103.42], [105.0, 105.34], [110.0, 110.42], [115.0, 114.89], [116.0, 116.77], [117.0, 117.59], [120.0, 122.34], [125.0, 125.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.34, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.28, 0.55, -0.28, 0.62, 0.56, 0.86, -0.3, 0.6, 0.37, 0.49, 0.92, -0.19, 0.51, 1.65, 6.24, 0.25, 0.41, 0.42, 0.34, 0.42, -0.11, 0.77, 0.59, 2.34, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/uySQvxQHbdI_filtered.json b/annotations_filtered/uySQvxQHbdI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4af08e8be0b4c3e0afdc4338e991e1e8d7970f9b --- /dev/null +++ b/annotations_filtered/uySQvxQHbdI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 25.19], [27.0, 61.21]], "keep_status": [true, false], "silence_prob": [32.08, 0.0], "audiomae_on_audioset": [[["speech", 52.83], ["music", 12.96], ["hum", 4.16]], null], "duration": [19.19, 34.21]} \ No newline at end of file diff --git a/annotations_filtered/uy_2GCNyzgk_filtered.json b/annotations_filtered/uy_2GCNyzgk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e67ee8570a166f603b518ac3e8e6659983545acc --- /dev/null +++ b/annotations_filtered/uy_2GCNyzgk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.37], [8.0, 9.49], [12.0, 12.58], [17.0, 18.66], [28.0, 28.92], [42.0, 43.75], [102.0, 108.58], [110.0, 111.01]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.13, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [1.37, 1.49, 0.58, 1.66, 0.92, 1.75, 6.58, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/uydWF18xoCQ_filtered.json b/annotations_filtered/uydWF18xoCQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..028e4e57668a5c3b73ad3518d285e964d3fec46d --- /dev/null +++ b/annotations_filtered/uydWF18xoCQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.64], [9.0, 57.62], [60.0, 59.59], [62.0, 64.5], [70.0, 71.93], [73.0, 74.63], [76.0, 78.93], [80.0, 84.6], [86.0, 97.7], [99.0, 114.78]], "keep_status": [false, false, false, true, false, false, false, false, false, true], "silence_prob": [32.98, 0.0, 0.0, 32.64, 0.0, 0.0, 52.74, 45.33, 30.59, 29.43], "audiomae_on_audioset": [[["music", 64.28], ["theremin", 9.83], ["musical instrument", 3.54]], null, null, [["music", 50.95], ["gong", 13.83], ["synthesizer", 4.87]], null, null, null, [["music", 67.56], ["percussion", 4.47], ["drum", 4.05]], [["music", 57.92], ["hum", 16.25], ["throbbing", 8.2]], [["hum", 25.7], ["throbbing", 21.52], ["music", 21.23]]], "duration": [4.64, 48.62, -0.41, 2.5, 1.93, 1.63, 2.93, 4.6, 11.7, 15.78]} \ No newline at end of file diff --git a/annotations_filtered/uyfrK4LrXaQ_filtered.json b/annotations_filtered/uyfrK4LrXaQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..951c75f5f44a622cb85e01c18b893ac1e91149c6 --- /dev/null +++ b/annotations_filtered/uyfrK4LrXaQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.69], [5.0, 11.03], [13.0, 15.53], [16.0, 15.62], [17.0, 17.31], [20.0, 29.93], [30.0, 30.03], [30.0, 30.28], [30.0, 44.63], [45.0, 46.63], [48.0, 53.7], [55.0, 56.05], [56.0, 120.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.99, 99.82, 0.0, 0.0, 99.65, 0.0, 0.0, 96.54, 0.0, 93.13, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.69, 6.03, 2.53, -0.38, 0.31, 9.93, 0.03, 0.28, 14.63, 1.63, 5.7, 1.05, 64.39]} \ No newline at end of file diff --git a/annotations_filtered/uyj1CeZt23A_filtered.json b/annotations_filtered/uyj1CeZt23A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f593f181246537e51f782a1c34fd113374c38301 --- /dev/null +++ b/annotations_filtered/uyj1CeZt23A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.43], [8.0, 10.35], [14.0, 14.47], [15.0, 15.8], [17.0, 21.44], [24.0, 24.11], [25.0, 26.1], [28.0, 29.1], [30.0, 30.13], [31.0, 31.24], [32.0, 35.68], [37.0, 37.54], [41.0, 40.76], [43.0, 43.23], [48.0, 48.27], [49.0, 49.92], [51.0, 53.69], [54.0, 55.21], [60.0, 60.88], [69.0, 69.96], [71.0, 72.55], [74.0, 75.22], [80.0, 84.13]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [48.52, 61.57, 0.0, 0.0, 89.36, 0.0, 0.0, 0.0, 0.0, 0.0, 60.05, 0.0, 0.0, 0.0, 0.0, 0.0, 85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 99.16], "audiomae_on_audioset": [[["speech", 61.07], ["music", 5.42], ["animal", 2.16]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.43, 2.35, 0.47, 0.8, 4.44, 0.11, 1.1, 1.1, 0.13, 0.24, 3.68, 0.54, -0.24, 0.23, 0.27, 0.92, 2.69, 1.21, 0.88, 0.96, 1.55, 1.22, 4.13]} \ No newline at end of file diff --git a/annotations_filtered/uykR8csyO-w_filtered.json b/annotations_filtered/uykR8csyO-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77b98b8fd1b105e76109792c789b6d40da5923dc --- /dev/null +++ b/annotations_filtered/uykR8csyO-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.8], [15.0, 37.69], [40.0, 43.88]], "keep_status": [false, false, false], "silence_prob": [35.33, 34.45, 34.54], "audiomae_on_audioset": [[["music", 54.09], ["theremin", 23.19], ["trombone", 4.21]], [["theremin", 43.15], ["music", 29.1], ["musical instrument", 6.01]], [["moo", 39.78], ["cattle, bovinae", 27.47], ["livestock, farm animals, working animals", 7.9]]], "duration": [5.8, 22.69, 3.88]} \ No newline at end of file diff --git a/annotations_filtered/uzHwlt3dmmo_filtered.json b/annotations_filtered/uzHwlt3dmmo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..681a2f8c3c2f33f2eb1af556d688835dea8b1d4e --- /dev/null +++ b/annotations_filtered/uzHwlt3dmmo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.73], [1.0, 19.94], [21.0, 22.2], [24.0, 49.86], [53.0, 69.62], [72.0, 75.63], [76.0, 77.31], [78.0, 79.44], [81.0, 88.59], [92.0, 120.28], [124.0, 130.3], [133.0, 133.89]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.6, 0.0, 31.92, 32.8, 31.52, 0.0, 0.0, 31.55, 30.85, 33.38, 0.0], "audiomae_on_audioset": [null, [["music", 42.95], ["throbbing", 39.58], ["hum", 10.28]], null, [["music", 35.59], ["hum", 19.49], ["throbbing", 14.92]], [["music", 70.32], ["hum", 7.65], ["throbbing", 7.13]], [["music", 61.6], ["throbbing", 11.41], ["hum", 3.86]], null, null, [["music", 51.11], ["throbbing", 17.32], ["hum", 11.53]], [["music", 56.7], ["hum", 18.64], ["throbbing", 8.41]], [["music", 72.63], ["hum", 6.22], ["synthesizer", 4.49]], null], "duration": [-0.27, 18.94, 1.2, 25.86, 16.62, 3.63, 1.31, 1.44, 7.59, 28.28, 6.3, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/uzIEsj6Me9g_filtered.json b/annotations_filtered/uzIEsj6Me9g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/uzIEsj6Me9g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/uzMEc37DGZA_filtered.json b/annotations_filtered/uzMEc37DGZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e78a72f69abb97bfd4074b0935770354c9ae1a5 --- /dev/null +++ b/annotations_filtered/uzMEc37DGZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.2], [7.0, 7.21], [11.0, 11.35], [14.0, 14.03], [17.0, 16.68], [21.0, 20.95], [25.0, 25.41], [30.0, 30.23], [31.0, 31.65], [40.0, 40.59], [43.0, 43.46], [44.0, 44.79], [47.0, 48.52], [54.0, 56.71], [57.0, 60.44], [65.0, 65.74], [67.0, 66.7], [68.0, 68.39], [69.0, 70.29], [72.0, 72.98], [76.0, 76.47], [78.0, 78.71], [81.0, 80.89], [83.0, 83.64], [89.0, 89.48], [90.0, 90.61], [100.0, 100.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.21, 51.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.2, 0.21, 0.35, 0.03, -0.32, -0.05, 0.41, 0.23, 0.65, 0.59, 0.46, 0.79, 1.52, 2.71, 3.44, 0.74, -0.3, 0.39, 1.29, 0.98, 0.47, 0.71, -0.11, 0.64, 0.48, 0.61, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/uzTuGHYRJ9w_filtered.json b/annotations_filtered/uzTuGHYRJ9w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..818399577e7ac8fca2823bf145f1304cd6924291 --- /dev/null +++ b/annotations_filtered/uzTuGHYRJ9w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.82], [10.0, 10.25], [11.0, 12.38], [21.0, 21.69], [25.0, 25.81], [29.0, 48.14], [50.0, 59.05], [60.0, 60.66], [63.0, 62.94], [68.0, 68.03], [71.0, 72.18], [74.0, 74.88], [84.0, 84.89], [87.0, 89.34], [107.0, 133.22], [142.0, 143.5], [152.0, 152.9], [154.0, 157.99], [160.0, 161.69], [163.0, 163.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [38.93, 0.0, 0.0, 0.0, 0.0, 38.54, 28.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.11, 30.1, 0.0, 0.0, 38.75, 0.0, 0.0], "audiomae_on_audioset": [[["music", 50.6], ["theremin", 10.63], ["synthesizer", 9.49]], null, null, null, null, [["music", 52.08], ["synthesizer", 17.36], ["electronic music", 4.89]], [["music", 42.68], ["speech", 28.43], ["musical instrument", 4.83]], null, null, null, null, null, null, [["speech", 23.83], ["fart", 23.15], ["laughter", 12.63]], [["music", 18.68], ["fly, housefly", 18.56], ["fart", 13.06]], null, null, [["speech", 56.13], ["whack, thwack", 9.67], ["thunk", 5.66]], null, null], "duration": [2.82, 0.25, 1.38, 0.69, 0.81, 19.14, 9.05, 0.66, -0.06, 0.03, 1.18, 0.88, 0.89, 2.34, 26.22, 1.5, 0.9, 3.99, 1.69, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/uzeSNmjxyNg_filtered.json b/annotations_filtered/uzeSNmjxyNg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0a8e2ec7f54cdc72e35da84069020fb15b5898b --- /dev/null +++ b/annotations_filtered/uzeSNmjxyNg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.63], [7.0, 7.43], [9.0, 12.97], [14.0, 14.84], [16.0, 16.06], [23.0, 23.03], [24.0, 23.84], [26.0, 29.22], [30.0, 30.86], [31.0, 59.44], [61.0, 83.86]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [40.84, 0.0, 60.89, 0.0, 0.0, 0.0, 0.0, 46.94, 0.0, 29.69, 29.72], "audiomae_on_audioset": [[["cattle, bovinae", 32.09], ["moo", 25.71], ["livestock, farm animals, working animals", 16.02]], null, null, null, null, null, null, [["moo", 16.3], ["cattle, bovinae", 9.69], ["livestock, farm animals, working animals", 9.48]], null, [["hum", 17.5], ["music", 15.65], ["whack, thwack", 13.06]], [["hum", 44.79], ["gong", 23.52], ["throbbing", 8.69]]], "duration": [4.63, 0.43, 3.97, 0.84, 0.06, 0.03, -0.16, 3.22, 0.86, 28.44, 22.86]} \ No newline at end of file diff --git a/annotations_filtered/uzgQ_xwWlkQ_filtered.json b/annotations_filtered/uzgQ_xwWlkQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1022607678fbee06a32aad9e9a6f5e9b2ea4dd9 --- /dev/null +++ b/annotations_filtered/uzgQ_xwWlkQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 18.93], [20.0, 20.55], [22.0, 36.64], [40.0, 78.75], [80.0, 93.33], [96.0, 118.0], [122.0, 126.54], [134.0, 134.65], [137.0, 137.27], [141.0, 143.99], [152.0, 152.27], [153.0, 156.32], [161.0, 162.04], [163.0, 168.4], [173.0, 174.07]], "keep_status": [true, false, true, false, false, true, true, false, false, false, false, true, false, false, false], "silence_prob": [36.22, 0.0, 32.06, 0.0, 29.97, 30.62, 31.25, 0.0, 0.0, 42.76, 0.0, 45.69, 0.0, 52.92, 0.0], "audiomae_on_audioset": [[["speech", 20.06], ["fart", 9.13], ["fireworks", 7.07]], null, [["music", 28.33], ["livestock, farm animals, working animals", 20.59], ["cattle, bovinae", 18.15]], null, [["speech", 48.52], ["music", 27.11], ["didgeridoo", 3.37]], [["music", 26.0], ["speech", 10.51], ["buzz", 9.73]], [["speech", 31.16], ["music", 25.38], ["vehicle", 3.76]], null, null, [["livestock, farm animals, working animals", 30.94], ["cattle, bovinae", 24.41], ["moo", 18.35]], null, [["music", 28.65], ["speech", 15.33], ["theremin", 12.95]], null, null, null], "duration": [5.93, 0.55, 14.64, 38.75, 13.33, 22.0, 4.54, 0.65, 0.27, 2.99, 0.27, 3.32, 1.04, 5.4, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/uzhsjyHUBt8_filtered.json b/annotations_filtered/uzhsjyHUBt8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56feded97cf54ebe456321fb935d25181bf1c4e8 --- /dev/null +++ b/annotations_filtered/uzhsjyHUBt8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.76], [7.0, 9.07], [23.0, 22.94], [41.0, 41.54], [57.0, 57.32], [64.0, 65.91], [68.0, 68.4], [69.0, 74.76], [77.0, 77.25], [78.0, 79.81], [81.0, 81.28], [88.0, 88.84], [108.0, 108.58], [109.0, 111.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 57.97, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0, 91.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.76, 2.07, -0.06, 0.54, 0.32, 1.91, 0.4, 5.76, 0.25, 1.81, 0.28, 0.84, 0.58, 2.13]} \ No newline at end of file diff --git a/annotations_filtered/uztZUqKrHVo_filtered.json b/annotations_filtered/uztZUqKrHVo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3a811db6d546138a283e8e3b02c945ac579d71c --- /dev/null +++ b/annotations_filtered/uztZUqKrHVo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 16.17], [24.0, 24.61], [27.0, 27.14], [28.0, 35.92], [36.0, 37.32], [47.0, 46.58], [47.0, 49.59], [60.0, 61.8], [64.0, 70.83], [73.0, 74.55], [87.0, 88.92], [89.0, 88.96], [89.0, 88.99], [96.0, 96.48], [98.0, 130.99]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [60.89, 0.0, 0.0, 64.29, 0.0, 0.0, 53.1, 0.0, 34.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 33.49], ["livestock, farm animals, working animals", 13.19], ["groan", 8.73]], null, null, null, null, null, null], "duration": [9.17, 0.61, 0.14, 7.92, 1.32, -0.42, 2.59, 1.8, 6.83, 1.55, 1.92, -0.04, -0.01, 0.48, 32.99]} \ No newline at end of file diff --git a/annotations_filtered/v-0Z_0SUtJw_filtered.json b/annotations_filtered/v-0Z_0SUtJw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1243bcbd394c98c5edfce018471f706a5d56c91e --- /dev/null +++ b/annotations_filtered/v-0Z_0SUtJw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.41], [7.0, 39.92], [41.0, 42.26], [43.0, 58.62], [60.0, 60.34], [62.0, 66.24], [70.0, 85.14], [87.0, 103.74]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 50.71, 0.0, 80.29, 87.92, 87.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [1.41, 32.92, 1.26, 15.62, 0.34, 4.24, 15.14, 16.74]} \ No newline at end of file diff --git a/annotations_filtered/v-OKZSh7tQ4_filtered.json b/annotations_filtered/v-OKZSh7tQ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1bee1238f56cc25f01b2f69daf6827b628ff3af5 --- /dev/null +++ b/annotations_filtered/v-OKZSh7tQ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 16.33], [40.0, 42.5], [60.0, 61.15], [71.0, 72.08], [80.0, 86.0], [95.0, 96.13], [101.0, 114.02], [116.0, 116.67]], "keep_status": [false, true, false, false, true, false, true, false], "silence_prob": [31.16, 29.72, 0.0, 0.0, 31.54, 0.0, 37.03, 0.0], "audiomae_on_audioset": [[["music", 60.51], ["speech", 9.92], ["hum", 6.27]], [["sheep", 27.77], ["bleat", 17.43], ["speech", 12.33]], null, null, [["music", 41.25], ["whack, thwack", 9.0], ["cattle, bovinae", 4.01]], null, [["music", 55.97], ["fly, housefly", 6.77], ["buzz", 4.4]], null], "duration": [5.33, 2.5, 1.15, 1.08, 6.0, 1.13, 13.02, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/v-OP9DnMN-w_filtered.json b/annotations_filtered/v-OP9DnMN-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd30e91639087858bcd4d8f59238b8be216ab967 --- /dev/null +++ b/annotations_filtered/v-OP9DnMN-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [6.0, 7.3], [15.0, 15.45], [20.0, 26.05], [27.0, 76.64], [77.0, 78.14], [80.0, 128.41]], "keep_status": [false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 42.98, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 34.43], ["mains hum", 17.03], ["music", 15.89]], null, null, null], "duration": [0.5, 1.3, 0.45, 6.05, 49.64, 1.14, 48.41]} \ No newline at end of file diff --git a/annotations_filtered/v-WZINgHnFQ_filtered.json b/annotations_filtered/v-WZINgHnFQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..514230234c6e51fe4ab30504ea8ce47a555549fb --- /dev/null +++ b/annotations_filtered/v-WZINgHnFQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.79], [5.0, 5.8], [13.0, 12.92], [15.0, 15.5], [20.0, 20.76], [22.0, 22.81], [24.0, 24.83], [27.0, 27.08], [51.0, 51.46], [61.0, 60.76], [64.0, 65.28], [69.0, 69.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.79, 0.8, -0.08, 0.5, 0.76, 0.81, 0.83, 0.08, 0.46, -0.24, 1.28, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/v-fwHV86PgY_filtered.json b/annotations_filtered/v-fwHV86PgY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b89034e3ca27f593804627c7885025712b3682cd --- /dev/null +++ b/annotations_filtered/v-fwHV86PgY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.56], [19.0, 19.31], [20.0, 23.26], [29.0, 29.73], [32.0, 31.94]], "keep_status": [false, false, true, false, false], "silence_prob": [30.32, 0.0, 35.59, 0.0, 0.0], "audiomae_on_audioset": [[["whack, thwack", 43.02], ["speech", 24.96], ["chop", 3.54]], null, [["speech", 35.0], ["music", 9.42], ["beatboxing", 5.25]], null, null], "duration": [6.56, 0.31, 3.26, 0.73, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/v-tma5YRyGg_filtered.json b/annotations_filtered/v-tma5YRyGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aadfb1ee09d9feb96f5d7eeb35b14df379b75dc5 --- /dev/null +++ b/annotations_filtered/v-tma5YRyGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.65], [16.0, 22.55], [23.0, 25.49]], "keep_status": [false, true, true], "silence_prob": [0.0, 42.84, 35.9], "audiomae_on_audioset": [null, [["music", 36.15], ["ice cream truck, ice cream van", 27.69], ["patter", 3.14]], [["music", 35.87], ["speech", 23.89], ["marimba, xylophone", 8.4]]], "duration": [0.65, 6.55, 2.49]} \ No newline at end of file diff --git a/annotations_filtered/v00zKyXbfD4_filtered.json b/annotations_filtered/v00zKyXbfD4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19322d6cdd7d900fa5d9aa6ed7f87095f3590a38 --- /dev/null +++ b/annotations_filtered/v00zKyXbfD4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 150.45], [150.0, 150.85]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [140.45, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/v04j4-SBv9M_filtered.json b/annotations_filtered/v04j4-SBv9M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..903b06f6059c4a9c733c002e34ef588bc4f23710 --- /dev/null +++ b/annotations_filtered/v04j4-SBv9M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.46], [2.0, 20.28], [20.0, 21.05], [21.0, 37.44], [39.0, 51.63], [61.0, 61.43], [85.0, 85.53], [86.0, 86.19], [87.0, 87.29], [90.0, 91.77]], "keep_status": [false, true, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 29.89, 0.0, 28.85, 30.46, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 32.69], ["didgeridoo", 12.57], ["gong", 5.22]], null, [["speech", 28.0], ["buzz", 18.83], ["vehicle", 14.03]], [["music", 68.5], ["synthesizer", 4.98], ["hum", 4.91]], null, null, null, null, null], "duration": [0.46, 18.28, 1.05, 16.44, 12.63, 0.43, 0.53, 0.19, 0.29, 1.77]} \ No newline at end of file diff --git a/annotations_filtered/v0AyEpFDi48_filtered.json b/annotations_filtered/v0AyEpFDi48_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02513b53273861476ea2e2b0a17ed5749ca14c85 --- /dev/null +++ b/annotations_filtered/v0AyEpFDi48_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 27.75], [28.0, 44.95], [48.0, 51.0], [52.0, 116.46], [122.0, 148.51], [153.0, 153.57], [154.0, 154.9], [159.0, 159.6], [161.0, 181.04], [183.0, 242.1]], "keep_status": [true, true, true, false, true, false, false, false, true, false], "silence_prob": [28.74, 29.06, 31.48, 0.0, 28.87, 0.0, 0.0, 0.0, 28.87, 0.0], "audiomae_on_audioset": [[["car", 15.52], ["vehicle", 15.48], ["music", 8.33]], [["speech", 22.11], ["hum", 18.88], ["mains hum", 14.79]], [["music", 18.29], ["speech", 15.86], ["whale vocalization", 10.14]], null, [["music", 41.28], ["speech", 12.94], ["mains hum", 6.46]], null, null, null, [["music", 50.0], ["throbbing", 9.85], ["hum", 8.65]], null], "duration": [14.75, 16.95, 3.0, 64.46, 26.51, 0.57, 0.9, 0.6, 20.04, 59.1]} \ No newline at end of file diff --git a/annotations_filtered/v0gGWiRkjYM_filtered.json b/annotations_filtered/v0gGWiRkjYM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcf11e09ed433c5b832e0911a9f56c822ae2656f --- /dev/null +++ b/annotations_filtered/v0gGWiRkjYM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.13], [3.0, 8.73], [11.0, 19.47], [35.0, 39.63], [50.0, 58.06], [66.0, 79.59], [83.0, 93.34], [96.0, 109.49], [116.0, 130.82]], "keep_status": [false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 62.17, 41.1, 31.34, 31.23, 31.35, 31.26, 31.69, 30.66], "audiomae_on_audioset": [null, null, [["music", 37.7], ["keyboard (musical)", 18.53], ["piano", 15.71]], [["music", 56.25], ["speech", 8.94], ["synthesizer", 4.35]], [["music", 84.52], ["swing music", 1.95], ["musical instrument", 0.85]], [["music", 83.31], ["funk", 1.44], ["singing", 0.79]], [["music", 79.37], ["musical instrument", 3.29], ["didgeridoo", 1.61]], [["music", 38.47], ["didgeridoo", 14.93], ["cattle, bovinae", 14.0]], [["music", 81.32], ["didgeridoo", 4.57], ["speech", 2.72]]], "duration": [1.13, 5.73, 8.47, 4.63, 8.06, 13.59, 10.34, 13.49, 14.82]} \ No newline at end of file diff --git a/annotations_filtered/v1Qu3dZlRGE_filtered.json b/annotations_filtered/v1Qu3dZlRGE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25565d2b99f9a6413497ea7ec4b79809d0d61ca5 --- /dev/null +++ b/annotations_filtered/v1Qu3dZlRGE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.17], [2.0, 3.21], [5.0, 5.27], [7.0, 12.9], [13.0, 17.39], [19.0, 19.18], [22.0, 30.55], [43.0, 43.12], [44.0, 61.3], [63.0, 64.4], [66.0, 66.8], [69.0, 68.93], [69.0, 69.84], [71.0, 74.01], [74.0, 74.44], [75.0, 74.66], [76.0, 89.77], [91.0, 96.3], [98.0, 98.47], [103.0, 120.8], [123.0, 124.9], [126.0, 127.2], [129.0, 129.9], [133.0, 137.27], [139.0, 147.24], [147.0, 147.34], [147.0, 175.49], [176.0, 177.43]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 82.61, 44.81, 0.0, 80.29, 0.0, 36.84, 0.0, 0.0, 0.0, 0.0, 57.01, 0.0, 0.0, 52.22, 78.55, 0.0, 50.36, 0.0, 0.0, 0.0, 39.94, 31.86, 0.0, 39.99, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 38.83], ["mains hum", 9.62], ["radio", 8.55]], null, null, null, [["electric shaver, electric razor", 36.25], ["sidetone", 18.53], ["fly, housefly", 7.78]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 29.71], ["hum", 14.62], ["electric shaver, electric razor", 11.52]], [["speech", 29.39], ["noise", 8.83], ["cattle, bovinae", 7.06]], null, [["insect", 34.99], ["speech", 25.08], ["fly, housefly", 16.44]], null], "duration": [0.17, 1.21, 0.27, 5.9, 4.39, 0.18, 8.55, 0.12, 17.3, 1.4, 0.8, -0.07, 0.84, 3.01, 0.44, -0.34, 13.77, 5.3, 0.47, 17.8, 1.9, 1.2, 0.9, 4.27, 8.24, 0.34, 28.49, 1.43]} \ No newline at end of file diff --git a/annotations_filtered/v1dTnLPL9gU_filtered.json b/annotations_filtered/v1dTnLPL9gU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6314a1fb3cedd73dc066fc5e5072388fcf86aa7b --- /dev/null +++ b/annotations_filtered/v1dTnLPL9gU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.17], [23.0, 25.41], [27.0, 28.41], [31.0, 44.0], [63.0, 63.9], [67.0, 68.2], [72.0, 72.27], [79.0, 79.39], [83.0, 83.29], [90.0, 96.23], [118.0, 119.47], [123.0, 123.08], [129.0, 129.25], [132.0, 133.32], [139.0, 143.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.95, 0.0, 45.05, 0.0, 0.0, 0.0, 0.0, 0.0, 46.36, 0.0, 0.0, 0.0, 0.0, 46.19], "audiomae_on_audioset": [null, [["music", 75.1], ["video game music", 3.05], ["musical instrument", 2.23]], null, [["music", 69.79], ["livestock, farm animals, working animals", 3.52], ["keyboard (musical)", 2.92]], null, null, null, null, null, [["music", 40.98], ["boing", 38.51], ["music for children", 3.27]], null, null, null, null, [["music", 54.33], ["chorus effect", 13.37], ["synthesizer", 5.57]]], "duration": [1.17, 2.41, 1.41, 13.0, 0.9, 1.2, 0.27, 0.39, 0.29, 6.23, 1.47, 0.08, 0.25, 1.32, 4.46]} \ No newline at end of file diff --git a/annotations_filtered/v1ordVEmJQQ_filtered.json b/annotations_filtered/v1ordVEmJQQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e92cb8dedeaff911c52868bdb27df6ae0fc965d --- /dev/null +++ b/annotations_filtered/v1ordVEmJQQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.34], [7.0, 19.77], [21.0, 100.43], [104.0, 134.94], [136.0, 141.52], [146.0, 151.29], [154.0, 160.54], [161.0, 162.82], [163.0, 163.73], [164.0, 165.0], [166.0, 166.97], [167.0, 168.64], [170.0, 170.26], [172.0, 172.72], [173.0, 173.99], [176.0, 177.03], [178.0, 181.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.8, 85.54, 0.0, 0.0, 38.22, 55.39, 42.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, null, [["music", 74.67], ["musical instrument", 2.24], ["brass instrument", 1.62]], null, [["music", 62.15], ["mosquito", 8.34], ["fly, housefly", 4.59]], null, null, null, null, null, null, null, null, null, null], "duration": [2.34, 12.77, 79.43, 30.94, 5.52, 5.29, 6.54, 1.82, 0.73, 1.0, 0.97, 1.64, 0.26, 0.72, 0.99, 1.03, 3.25]} \ No newline at end of file diff --git a/annotations_filtered/v2KtG9kFZOI_filtered.json b/annotations_filtered/v2KtG9kFZOI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ed5bfb27da4697ed027b500af0f1d3c46872ef3 --- /dev/null +++ b/annotations_filtered/v2KtG9kFZOI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 37.88], [43.0, 57.59], [60.0, 75.37], [87.0, 99.87], [101.0, 113.88]], "keep_status": [false, true, true, true, false], "silence_prob": [31.09, 30.48, 30.78, 31.47, 31.94], "audiomae_on_audioset": [[["music", 63.35], ["throbbing", 12.83], ["didgeridoo", 5.39]], [["speech", 36.44], ["music", 18.16], ["hum", 14.83]], [["speech", 29.21], ["buzz", 28.37], ["music", 12.14]], [["speech", 41.34], ["buzz", 17.61], ["vehicle", 4.87]], [["throbbing", 39.32], ["hum", 27.31], ["music", 17.51]]], "duration": [14.88, 14.59, 15.37, 12.87, 12.88]} \ No newline at end of file diff --git a/annotations_filtered/v2pWzqZqTyk_filtered.json b/annotations_filtered/v2pWzqZqTyk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb674313770578b5fb46f825f020b4321676cff2 --- /dev/null +++ b/annotations_filtered/v2pWzqZqTyk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.45], [15.0, 17.88], [26.0, 28.78], [37.0, 37.15], [38.0, 38.28], [39.0, 41.07], [41.0, 42.96], [43.0, 45.35], [46.0, 46.23], [47.0, 47.44], [49.0, 49.45], [50.0, 51.7], [59.0, 59.32], [61.0, 61.7], [65.0, 66.39], [67.0, 67.93], [69.0, 69.57], [71.0, 74.83], [76.0, 76.57], [77.0, 78.66], [80.0, 79.98], [80.0, 80.64], [81.0, 82.09], [85.0, 85.63], [90.0, 90.24], [92.0, 93.19], [96.0, 95.88], [100.0, 100.31]], "keep_status": [false, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.32, 29.02, 0.0, 0.0, 33.53, 0.0, 45.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 24.81], ["hum", 14.71], ["mains hum", 7.56]], [["speech", 82.73], ["music", 2.94], ["hubbub, speech noise, speech babble", 1.09]], null, null, [["vehicle", 16.94], ["motorcycle", 11.53], ["car", 7.77]], null, [["cattle, bovinae", 23.8], ["horse", 15.64], ["clip-clop", 15.25]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.45, 2.88, 2.78, 0.15, 0.28, 2.07, 1.96, 2.35, 0.23, 0.44, 0.45, 1.7, 0.32, 0.7, 1.39, 0.93, 0.57, 3.83, 0.57, 1.66, -0.02, 0.64, 1.09, 0.63, 0.24, 1.19, -0.12, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/v2qDlGbaqSQ_filtered.json b/annotations_filtered/v2qDlGbaqSQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d1010b1f622f91ada30107f928cb210c9ff2dc7 --- /dev/null +++ b/annotations_filtered/v2qDlGbaqSQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.09], [5.0, 13.19], [18.0, 19.2], [24.0, 26.2], [28.0, 29.13], [31.0, 32.54], [35.0, 35.77], [38.0, 38.92], [42.0, 45.05], [47.0, 47.82], [50.0, 51.7], [55.0, 55.12], [56.0, 58.5], [63.0, 64.77], [75.0, 81.38], [83.0, 84.4], [86.0, 87.45], [90.0, 94.14], [97.0, 96.89], [97.0, 100.11], [105.0, 119.94], [126.0, 126.3], [129.0, 130.79], [135.0, 138.25], [142.0, 147.24], [149.0, 149.28], [154.0, 155.34], [156.0, 158.7], [161.0, 161.76], [163.0, 165.01], [167.0, 166.85], [168.0, 171.75], [174.0, 175.09], [180.0, 183.25], [185.0, 189.33], [199.0, 199.77], [200.0, 200.82], [203.0, 204.01], [210.0, 214.83], [216.0, 221.83], [224.0, 230.32], [233.0, 233.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [88.46, 70.86, 0.0, 97.64, 0.0, 0.0, 0.0, 0.0, 63.1, 0.0, 0.0, 0.0, 75.88, 0.0, 74.44, 0.0, 0.0, 50.56, 0.0, 60.98, 47.43, 0.0, 0.0, 47.39, 53.78, 0.0, 0.0, 60.32, 0.0, 58.13, 0.0, 59.42, 0.0, 56.63, 53.72, 0.0, 0.0, 0.0, 46.26, 60.51, 63.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.09], ["cello", 6.63], ["double bass", 5.88]], null, null, [["music", 55.6], ["theremin", 24.22], ["cello", 2.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 70.17], ["guitar", 4.09], ["musical instrument", 3.63]], null, null, null], "duration": [2.09, 8.19, 1.2, 2.2, 1.13, 1.54, 0.77, 0.92, 3.05, 0.82, 1.7, 0.12, 2.5, 1.77, 6.38, 1.4, 1.45, 4.14, -0.11, 3.11, 14.94, 0.3, 1.79, 3.25, 5.24, 0.28, 1.34, 2.7, 0.76, 2.01, -0.15, 3.75, 1.09, 3.25, 4.33, 0.77, 0.82, 1.01, 4.83, 5.83, 6.32, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/v3E4s7VN4xE_filtered.json b/annotations_filtered/v3E4s7VN4xE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53528e3fd1d76000b76d18bd413b610671ceacf2 --- /dev/null +++ b/annotations_filtered/v3E4s7VN4xE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.75], [4.0, 6.51], [9.0, 12.38], [20.0, 21.56], [25.0, 26.22], [27.0, 29.32], [32.0, 34.7], [47.0, 48.57], [50.0, 56.78], [60.0, 60.44], [62.0, 64.62], [67.0, 70.17], [73.0, 73.2], [74.0, 75.63], [89.0, 92.18], [93.0, 96.03], [106.0, 108.4], [110.0, 110.46], [111.0, 111.57], [115.0, 117.34]], "keep_status": [false, false, false, false, false, true, true, false, true, false, true, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 100.0, 79.24, 0.0, 0.0, 42.13, 33.6, 0.0, 42.53, 0.0, 33.65, 34.41, 0.0, 0.0, 36.61, 39.67, 42.04, 0.0, 0.0, 99.71], "audiomae_on_audioset": [null, null, null, null, null, [["music", 26.4], ["crow", 6.86], ["speech", 4.33]], [["speech", 38.27], ["music", 25.62], ["hum", 3.96]], null, [["speech", 59.36], ["music", 7.29], ["ding", 3.2]], null, [["music", 39.91], ["synthesizer", 5.61], ["musical instrument", 3.21]], [["music", 46.17], ["speech", 22.06], ["hum", 4.88]], null, null, [["music", 30.36], ["fly, housefly", 15.99], ["insect", 5.12]], [["music", 31.81], ["speech", 27.88], ["musical instrument", 2.78]], [["quack", 43.43], ["music", 32.0], ["duck", 10.71]], null, null, null], "duration": [0.75, 2.51, 3.38, 1.56, 1.22, 2.32, 2.7, 1.57, 6.78, 0.44, 2.62, 3.17, 0.2, 1.63, 3.18, 3.03, 2.4, 0.46, 0.57, 2.34]} \ No newline at end of file diff --git a/annotations_filtered/v3H9-sHDZSA_filtered.json b/annotations_filtered/v3H9-sHDZSA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41576f129761479496630f60d2fb24995041e35a --- /dev/null +++ b/annotations_filtered/v3H9-sHDZSA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.83], [4.0, 5.14], [7.0, 7.57], [13.0, 14.76], [28.0, 29.4], [32.0, 33.94], [37.0, 37.54], [41.0, 95.28], [96.0, 104.7], [105.0, 131.3], [132.0, 137.32], [139.0, 139.73], [140.0, 140.36]], "keep_status": [false, false, false, false, false, false, false, false, true, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.37, 29.05, 34.61, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["throbbing", 9.56], ["hum", 8.81], ["sonar", 7.19]], [["speech", 36.82], ["breaking", 17.95], ["noise", 14.02]], [["music", 48.02], ["speech", 9.45], ["synthesizer", 4.25]], null, null], "duration": [0.83, 1.14, 0.57, 1.76, 1.4, 1.94, 0.54, 54.28, 8.7, 26.3, 5.32, 0.73, 0.36]} \ No newline at end of file diff --git a/annotations_filtered/v3IyV96FX74_filtered.json b/annotations_filtered/v3IyV96FX74_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35c563e794b284d6fc9d60965c388b8ebf2291e1 --- /dev/null +++ b/annotations_filtered/v3IyV96FX74_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.56], [5.0, 7.32], [9.0, 14.99], [18.0, 18.35], [18.0, 18.45], [19.0, 25.66], [47.0, 47.92], [49.0, 49.82], [52.0, 52.76], [53.0, 66.12], [67.0, 68.81], [71.0, 84.13], [85.0, 91.27], [92.0, 93.77], [95.0, 97.39], [99.0, 101.49], [103.0, 103.54], [106.0, 108.01], [110.0, 112.77], [113.0, 115.75]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.22, 39.57, 0.0, 0.0, 39.02, 0.0, 0.0, 0.0, 55.53, 0.0, 33.45, 33.14, 0.0, 89.72, 81.71, 0.0, 93.45, 57.72, 65.2], "audiomae_on_audioset": [null, [["music", 40.35], ["french horn", 7.43], ["musical instrument", 6.41]], [["music", 43.97], ["speech", 10.61], ["synthesizer", 4.53]], null, null, [["theremin", 34.1], ["music", 30.8], ["speech", 11.82]], null, null, null, null, null, [["music", 49.41], ["theremin", 25.08], ["synthesizer", 7.38]], [["music", 71.2], ["theremin", 7.47], ["synthesizer", 4.51]], null, null, null, null, null, null, null], "duration": [-0.44, 2.32, 5.99, 0.35, 0.45, 6.66, 0.92, 0.82, 0.76, 13.12, 1.81, 13.13, 6.27, 1.77, 2.39, 2.49, 0.54, 2.01, 2.77, 2.75]} \ No newline at end of file diff --git a/annotations_filtered/v3JlEi3CbGI_filtered.json b/annotations_filtered/v3JlEi3CbGI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c297b76edbe290021c052cd33a1afde3189a3fb9 --- /dev/null +++ b/annotations_filtered/v3JlEi3CbGI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.07], [8.0, 9.46], [11.0, 12.78], [30.0, 30.62], [33.0, 36.21], [40.0, 40.76], [45.0, 45.39], [50.0, 50.57], [56.0, 65.01], [66.0, 73.85], [74.0, 76.2], [78.0, 81.94], [82.0, 83.27], [85.0, 88.77], [92.0, 92.18], [95.0, 95.89], [97.0, 97.65], [100.0, 99.74], [102.0, 103.89], [105.0, 105.61], [107.0, 107.74], [109.0, 110.27], [116.0, 117.05], [119.0, 119.87], [120.0, 121.17], [125.0, 125.93], [129.0, 130.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 99.84, 99.91, 63.42, 99.9, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.07, 1.46, 1.78, 0.62, 3.21, 0.76, 0.39, 0.57, 9.01, 7.85, 2.2, 3.94, 1.27, 3.77, 0.18, 0.89, 0.65, -0.26, 1.89, 0.61, 0.74, 1.27, 1.05, 0.87, 1.17, 0.93, 1.59]} \ No newline at end of file diff --git a/annotations_filtered/v3aqGRzL0BY_filtered.json b/annotations_filtered/v3aqGRzL0BY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7bc0f567778587256ca4131d51d36bd92f7975e1 --- /dev/null +++ b/annotations_filtered/v3aqGRzL0BY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[105.0, 105.65]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.65]} \ No newline at end of file diff --git a/annotations_filtered/v3bQ1GiWhJk_filtered.json b/annotations_filtered/v3bQ1GiWhJk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/v3bQ1GiWhJk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/v3bWb5qZMu8_filtered.json b/annotations_filtered/v3bWb5qZMu8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..154d1eeff08f5aa797f6f67fbcf38dec53bd8974 --- /dev/null +++ b/annotations_filtered/v3bWb5qZMu8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.44], [4.0, 80.72], [81.0, 131.82], [132.0, 138.89], [139.0, 139.55], [140.0, 141.03], [142.0, 142.28], [143.0, 146.96], [147.0, 150.35], [158.0, 170.68], [176.0, 176.49]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.87, 0.0, 0.0, 0.0, 45.92, 37.35, 32.81, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 55.2], ["animal", 4.15], ["fowl", 3.69]], null, null, null, [["music", 24.23], ["speech", 23.55], ["electric shaver, electric razor", 6.94]], [["cowbell", 31.44], ["moo", 20.69], ["cattle, bovinae", 19.86]], [["speech", 59.06], ["electric shaver, electric razor", 8.85], ["hum", 4.35]], null], "duration": [0.44, 76.72, 50.82, 6.89, 0.55, 1.03, 0.28, 3.96, 3.35, 12.68, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/v3dCP69-IFU_filtered.json b/annotations_filtered/v3dCP69-IFU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59fa9ab08a94ca92edc7bb0aa14f002fd5b76fd2 --- /dev/null +++ b/annotations_filtered/v3dCP69-IFU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.85], [23.0, 27.45], [45.0, 47.76], [54.0, 74.21], [78.0, 79.54], [81.0, 81.6], [82.0, 82.63], [84.0, 85.18], [87.0, 87.34], [89.0, 89.14], [91.0, 112.48], [115.0, 121.41], [123.0, 126.2]], "keep_status": [false, true, true, true, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 48.06, 41.93, 39.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.01, 46.09, 67.13], "audiomae_on_audioset": [null, [["crushing", 41.3], ["door", 11.43], ["squish", 6.86]], [["speech", 26.43], ["crack", 6.48], ["skateboard", 6.22]], [["music", 50.43], ["noise", 10.43], ["hum", 5.55]], null, null, null, null, null, null, [["music", 24.6], ["buzz", 14.8], ["insect", 12.15]], [["sidetone", 30.19], ["speech", 24.79], ["hum", 9.2]], null], "duration": [1.85, 4.45, 2.76, 20.21, 1.54, 0.6, 0.63, 1.18, 0.34, 0.14, 21.48, 6.41, 3.2]} \ No newline at end of file diff --git a/annotations_filtered/v3e2maV8MlQ_filtered.json b/annotations_filtered/v3e2maV8MlQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9aefa3ba4dae325fecf79c574602b6e150367f1e --- /dev/null +++ b/annotations_filtered/v3e2maV8MlQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 39.39], [41.0, 41.86], [43.0, 45.4], [46.0, 47.98], [51.0, 54.26], [55.0, 66.58], [70.0, 95.77], [97.0, 97.09], [98.0, 129.2]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [72.01, 0.0, 84.25, 0.0, 53.53, 49.27, 32.4, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 54.91], ["scary music", 7.4], ["theremin", 6.54]], [["music", 73.93], ["hum", 9.39], ["electronic music", 2.71]], null, null], "duration": [13.39, 0.86, 2.4, 1.98, 3.26, 11.58, 25.77, 0.09, 31.2]} \ No newline at end of file diff --git a/annotations_filtered/v4P4cS5jKmQ_filtered.json b/annotations_filtered/v4P4cS5jKmQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..345628db3a3f34e67e613fb580d30d65a6d9e1fb --- /dev/null +++ b/annotations_filtered/v4P4cS5jKmQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.5], [7.0, 8.02], [9.0, 9.63], [12.0, 12.58], [13.0, 14.98], [16.0, 16.78], [19.0, 19.4], [24.0, 23.77], [24.0, 25.79], [30.0, 32.19], [34.0, 36.07], [38.0, 38.7], [41.0, 44.04], [45.0, 45.57], [47.0, 47.48], [48.0, 48.74], [51.0, 51.73], [53.0, 53.2], [62.0, 62.24], [72.0, 73.5], [76.0, 76.6], [80.0, 79.56], [91.0, 91.49], [92.0, 93.06], [95.0, 98.59], [102.0, 103.81], [109.0, 128.38], [129.0, 132.21], [138.0, 138.96], [142.0, 144.05], [146.0, 147.97], [150.0, 152.52], [156.0, 159.71], [161.0, 162.38], [170.0, 170.09], [173.0, 174.95], [175.0, 177.21], [180.0, 180.44], [182.0, 182.78], [184.0, 184.84], [186.0, 186.78], [188.0, 189.95], [191.0, 192.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 99.85, 0.0, 97.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 100.0, 0.0, 100.0, 0.0, 99.44, 100.0, 0.0, 0.0, 0.0, 97.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.5, 1.02, 0.63, 0.58, 1.98, 0.78, 0.4, -0.23, 1.79, 2.19, 2.07, 0.7, 3.04, 0.57, 0.48, 0.74, 0.73, 0.2, 0.24, 1.5, 0.6, -0.44, 0.49, 1.06, 3.59, 1.81, 19.38, 3.21, 0.96, 2.05, 1.97, 2.52, 3.71, 1.38, 0.09, 1.95, 2.21, 0.44, 0.78, 0.84, 0.78, 1.95, 1.96]} \ No newline at end of file diff --git a/annotations_filtered/v4U2mAwO6-4_filtered.json b/annotations_filtered/v4U2mAwO6-4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d04efef44f92c3fb2a9a042917b85bec799bc967 --- /dev/null +++ b/annotations_filtered/v4U2mAwO6-4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.56], [4.0, 5.46], [6.0, 7.97], [9.0, 9.76], [11.0, 11.15], [11.0, 12.31], [13.0, 15.55], [17.0, 19.18], [20.0, 23.33], [25.0, 28.07], [35.0, 37.12], [45.0, 47.14], [49.0, 53.45], [55.0, 68.64], [70.0, 70.63], [72.0, 73.43], [74.0, 75.39], [76.0, 77.45], [79.0, 79.08], [82.0, 82.63], [84.0, 84.55], [86.0, 87.15], [88.0, 90.07], [91.0, 93.02], [94.0, 95.52], [98.0, 97.73], [98.0, 101.38], [103.0, 106.02], [107.0, 109.54], [110.0, 111.7], [113.0, 113.97], [116.0, 117.8], [119.0, 124.01], [125.0, 126.69], [128.0, 135.23], [138.0, 143.01], [144.0, 145.0], [148.0, 150.72], [152.0, 152.2], [155.0, 157.13], [158.0, 158.6], [161.0, 163.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 94.37, 99.92, 99.48, 93.13, 96.89, 97.73, 93.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.43, 99.68, 0.0, 0.0, 95.51, 84.07, 82.43, 0.0, 0.0, 0.0, 88.46, 0.0, 77.36, 89.01, 0.0, 71.0, 0.0, 75.23, 0.0, 37.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 35.29], ["insect", 9.09], ["fly, housefly", 6.72]]], "duration": [1.56, 1.46, 1.97, 0.76, 0.15, 1.31, 2.55, 2.18, 3.33, 3.07, 2.12, 2.14, 4.45, 13.64, 0.63, 1.43, 1.39, 1.45, 0.08, 0.63, 0.55, 1.15, 2.07, 2.02, 1.52, -0.27, 3.38, 3.02, 2.54, 1.7, 0.97, 1.8, 5.01, 1.69, 7.23, 5.01, 1.0, 2.72, 0.2, 2.13, 0.6, 2.16]} \ No newline at end of file diff --git a/annotations_filtered/v4Zjie4qH04_filtered.json b/annotations_filtered/v4Zjie4qH04_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80f1949a1b108e209a09701ab21c4af409493aeb --- /dev/null +++ b/annotations_filtered/v4Zjie4qH04_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.31], [6.0, 18.39], [22.0, 23.48], [25.0, 27.99], [31.0, 36.07], [37.0, 37.5], [42.0, 43.36], [44.0, 45.74], [47.0, 48.29], [49.0, 49.13], [51.0, 64.45], [74.0, 74.88], [76.0, 76.59], [82.0, 81.78], [85.0, 87.71], [88.0, 90.58], [91.0, 96.43], [97.0, 105.12], [105.0, 106.73], [108.0, 110.27], [111.0, 110.71], [112.0, 114.88], [121.0, 122.42], [127.0, 129.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.64, 93.76, 0.0, 100.0, 64.63, 0.0, 0.0, 0.0, 0.0, 0.0, 87.74, 0.0, 0.0, 0.0, 94.37, 85.9, 94.22, 82.07, 0.0, 99.99, 0.0, 90.95, 0.0, 62.17], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.31, 12.39, 1.48, 2.99, 5.07, 0.5, 1.36, 1.74, 1.29, 0.13, 13.45, 0.88, 0.59, -0.22, 2.71, 2.58, 5.43, 8.12, 1.73, 2.27, -0.29, 2.88, 1.42, 2.12]} \ No newline at end of file diff --git a/annotations_filtered/v4kXrblmBE8_filtered.json b/annotations_filtered/v4kXrblmBE8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..14383ba0b0497718b39a34595e8b4e0e63021e8d --- /dev/null +++ b/annotations_filtered/v4kXrblmBE8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.87], [5.0, 5.98], [8.0, 8.51], [9.0, 15.63], [17.0, 18.08], [21.0, 23.03], [28.0, 29.94], [42.0, 52.22], [55.0, 55.56], [56.0, 57.87], [59.0, 61.1], [61.0, 65.67], [66.0, 74.33], [87.0, 89.7], [91.0, 92.11], [97.0, 100.48], [105.0, 110.27], [113.0, 121.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 58.55, 0.0, 94.66, 0.0, 68.93, 0.0, 0.0, 97.0, 97.54, 94.95, 93.6, 0.0, 89.01, 65.55, 61.67], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.87, 0.98, 0.51, 6.63, 1.08, 2.03, 1.94, 10.22, 0.56, 1.87, 2.1, 4.67, 8.33, 2.7, 1.11, 3.48, 5.27, 8.14]} \ No newline at end of file diff --git a/annotations_filtered/v4np7L0aJd0_filtered.json b/annotations_filtered/v4np7L0aJd0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c3cde24bb45eaf4105cb294bb4639da42815fe0 --- /dev/null +++ b/annotations_filtered/v4np7L0aJd0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.75], [6.0, 7.75], [8.0, 8.67], [13.0, 13.85], [18.0, 17.96], [18.0, 19.26], [22.0, 23.63], [28.0, 29.42], [30.0, 37.05], [39.0, 39.72], [43.0, 43.07], [51.0, 52.52], [54.0, 54.82], [56.0, 55.97], [57.0, 57.91], [58.0, 60.29], [61.0, 63.93], [64.0, 65.97], [68.0, 69.69], [72.0, 73.01], [81.0, 81.75], [90.0, 90.17], [92.0, 91.98], [93.0, 94.63], [96.0, 96.03], [99.0, 100.11], [111.0, 112.46], [119.0, 123.28], [124.0, 127.72], [129.0, 149.28]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [37.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.27, 66.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 99.56, 32.08], "audiomae_on_audioset": [[["slam", 18.82], ["thunk", 12.29], ["door", 9.69]], null, null, null, null, null, null, null, [["speech", 39.2], ["moo", 16.35], ["cattle, bovinae", 15.45]], null, null, null, null, null, null, [["speech", 46.95], ["sidetone", 38.49], ["sine wave", 3.32]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.46], ["cattle, bovinae", 12.48], ["livestock, farm animals, working animals", 11.69]]], "duration": [3.75, 1.75, 0.67, 0.85, -0.04, 1.26, 1.63, 1.42, 7.05, 0.72, 0.07, 1.52, 0.82, -0.03, 0.91, 2.29, 2.93, 1.97, 1.69, 1.01, 0.75, 0.17, -0.02, 1.63, 0.03, 1.11, 1.46, 4.28, 3.72, 20.28]} \ No newline at end of file diff --git a/annotations_filtered/v5-gQQunvJw_filtered.json b/annotations_filtered/v5-gQQunvJw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4e31e45c1324b1170cb9f5c75baab773952fd40 --- /dev/null +++ b/annotations_filtered/v5-gQQunvJw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.43], [5.0, 5.44], [6.0, 21.64], [23.0, 23.84], [26.0, 26.37], [28.0, 29.13], [36.0, 36.31], [38.0, 40.07], [42.0, 42.89], [47.0, 48.59], [52.0, 52.27], [57.0, 57.94], [59.0, 58.9], [59.0, 60.54], [64.0, 64.64], [65.0, 68.54], [70.0, 69.65], [71.0, 73.87], [80.0, 80.97], [86.0, 87.79], [93.0, 94.04], [97.0, 98.44], [101.0, 102.76], [104.0, 105.39], [110.0, 111.87], [114.0, 114.39], [116.0, 119.37], [120.0, 120.87], [122.0, 122.69], [123.0, 124.02], [127.0, 129.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 54.7, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.16, 0.0, 98.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 0.0, 0.0, 98.01], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.43, 0.44, 15.64, 0.84, 0.37, 1.13, 0.31, 2.07, 0.89, 1.59, 0.27, 0.94, -0.1, 1.54, 0.64, 3.54, -0.35, 2.87, 0.97, 1.79, 1.04, 1.44, 1.76, 1.39, 1.87, 0.39, 3.37, 0.87, 0.69, 1.02, 2.02]} \ No newline at end of file diff --git a/annotations_filtered/v53yiG9-_xs_filtered.json b/annotations_filtered/v53yiG9-_xs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74c8fdfa0777ab410ecf634d6d4d19f25f042026 --- /dev/null +++ b/annotations_filtered/v53yiG9-_xs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.17], [8.0, 8.29], [9.0, 10.0], [11.0, 12.68], [14.0, 15.08], [17.0, 18.23], [21.0, 22.37], [24.0, 24.81], [32.0, 35.33], [38.0, 38.37], [40.0, 40.22], [41.0, 46.41], [47.0, 48.15], [49.0, 49.74], [51.0, 51.76], [54.0, 55.04], [57.0, 69.18], [81.0, 81.72], [88.0, 88.43], [90.0, 90.15], [91.0, 91.3], [92.0, 92.45], [93.0, 93.46], [96.0, 95.81], [98.0, 103.74], [106.0, 109.27], [110.0, 109.95], [110.0, 111.2], [113.0, 113.81], [114.0, 115.3], [117.0, 117.31], [119.0, 118.96], [123.0, 123.57], [125.0, 125.05], [126.0, 127.04], [130.0, 130.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.09, 0.0, 0.0, 41.95, 0.0, 0.0, 0.0, 0.0, 34.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.2, 39.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 44.68], ["hum", 14.49], ["throbbing", 6.55]], null, null, null, null, [["music", 69.28], ["synthesizer", 3.93], ["electronic music", 3.21]], null, null, null, null, null, null, null, [["whistling", 75.54], ["theremin", 10.39], ["music", 6.34]], [["whistling", 65.67], ["music", 19.69], ["speech", 3.16]], null, null, null, null, null, null, null, null, null, null], "duration": [1.17, 0.29, 1.0, 1.68, 1.08, 1.23, 1.37, 0.81, 3.33, 0.37, 0.22, 5.41, 1.15, 0.74, 0.76, 1.04, 12.18, 0.72, 0.43, 0.15, 0.3, 0.45, 0.46, -0.19, 5.74, 3.27, -0.05, 1.2, 0.81, 1.3, 0.31, -0.04, 0.57, 0.05, 1.04, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/v5Co3A3fLBo_filtered.json b/annotations_filtered/v5Co3A3fLBo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf799622553e0ccf80cbdc9737e2236c7dfb79ca --- /dev/null +++ b/annotations_filtered/v5Co3A3fLBo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[98.0, 142.48], [147.0, 146.89], [147.0, 148.02], [149.0, 149.32], [150.0, 150.42], [151.0, 154.63]], "keep_status": [false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.82], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 14.46], ["whale vocalization", 14.32], ["noise", 11.16]]], "duration": [44.48, -0.11, 1.02, 0.32, 0.42, 3.63]} \ No newline at end of file diff --git a/annotations_filtered/v5FtI472Q6I_filtered.json b/annotations_filtered/v5FtI472Q6I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f21edf80fa4ee9147d67a83eab0c609a5426c44e --- /dev/null +++ b/annotations_filtered/v5FtI472Q6I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.2], [7.0, 7.89], [12.0, 13.68], [15.0, 15.58], [18.0, 18.93], [21.0, 21.66], [23.0, 23.97], [26.0, 27.09], [28.0, 28.21], [31.0, 32.21], [33.0, 63.81], [64.0, 65.31], [66.0, 68.57], [70.0, 85.21], [87.0, 100.67], [101.0, 110.76], [112.0, 112.35], [113.0, 120.31], [121.0, 126.23], [127.0, 137.81], [139.0, 139.9], [140.0, 148.68], [151.0, 156.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.9, 58.3, 65.09, 50.61, 0.0, 51.23, 43.48, 52.68, 0.0, 37.35, 34.38], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 29.8], ["sidetone", 17.3], ["speech", 16.16]], null, null, null, null, null, [["speech", 39.45], ["hum", 13.75], ["rumble", 8.57]], null, null, [["sidetone", 14.77], ["hum", 13.18], ["rumble", 10.85]], [["hum", 14.48], ["speech", 7.21], ["slosh", 6.72]]], "duration": [0.2, 0.89, 1.68, 0.58, 0.93, 0.66, 0.97, 1.09, 0.21, 1.21, 30.81, 1.31, 2.57, 15.21, 13.67, 9.76, 0.35, 7.31, 5.23, 10.81, 0.9, 8.68, 5.68]} \ No newline at end of file diff --git a/annotations_filtered/v5N1Aukm4Bo_filtered.json b/annotations_filtered/v5N1Aukm4Bo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d827984fbb350983447959ca2ba782bcefaa34a --- /dev/null +++ b/annotations_filtered/v5N1Aukm4Bo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.44], [8.0, 10.03], [12.0, 12.85], [14.0, 22.81], [23.0, 24.07], [25.0, 51.21], [52.0, 116.19], [117.0, 154.16], [156.0, 175.39]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 57.72, 0.0, 67.76, 0.0, 46.15, 0.0, 0.0, 37.28], "audiomae_on_audioset": [null, null, null, null, null, [["music", 39.17], ["mains hum", 21.72], ["hum", 14.95]], null, null, [["music", 62.62], ["scary music", 19.96], ["foghorn", 7.11]]], "duration": [0.44, 2.03, 0.85, 8.81, 1.07, 26.21, 64.19, 37.16, 19.39]} \ No newline at end of file diff --git a/annotations_filtered/v5llnbqhLZM_filtered.json b/annotations_filtered/v5llnbqhLZM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..070dd9682ebe22f488f952a37134530aa7fb9c6c --- /dev/null +++ b/annotations_filtered/v5llnbqhLZM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.34], [5.0, 9.76], [12.0, 13.78], [16.0, 28.86], [32.0, 35.68], [37.0, 66.61], [69.0, 70.75], [73.0, 72.76], [73.0, 77.8], [78.0, 83.03], [87.0, 87.54], [88.0, 88.59], [91.0, 91.35], [97.0, 96.99], [97.0, 102.59], [103.0, 131.58], [134.0, 144.02], [146.0, 166.67], [167.0, 168.94], [171.0, 174.19], [176.0, 178.21]], "keep_status": [false, false, false, true, true, true, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false], "silence_prob": [0.0, 32.33, 0.0, 30.03, 29.36, 30.98, 0.0, 0.0, 29.79, 31.29, 0.0, 0.0, 0.0, 0.0, 33.14, 29.84, 29.62, 31.15, 0.0, 92.48, 92.64], "audiomae_on_audioset": [null, [["music", 40.32], ["hum", 24.93], ["throbbing", 16.6]], null, [["hum", 31.06], ["music", 29.19], ["speech", 6.47]], [["music", 17.15], ["buzz", 16.02], ["rumble", 9.96]], [["hum", 22.62], ["grunt", 16.27], ["noise", 12.69]], null, null, [["music", 68.07], ["grunt", 11.07], ["didgeridoo", 3.11]], [["music", 53.86], ["scary music", 11.83], ["foghorn", 9.43]], null, null, null, null, [["didgeridoo", 17.03], ["fart", 14.02], ["music", 12.05]], [["music", 38.37], ["hum", 22.16], ["mains hum", 15.79]], [["music", 42.17], ["whale vocalization", 12.24], ["groan", 7.16]], [["hum", 23.23], ["music", 22.15], ["sonar", 16.7]], null, null, null], "duration": [1.34, 4.76, 1.78, 12.86, 3.68, 29.61, 1.75, -0.24, 4.8, 5.03, 0.54, 0.59, 0.35, -0.01, 5.59, 28.58, 10.02, 20.67, 1.94, 3.19, 2.21]} \ No newline at end of file diff --git a/annotations_filtered/v5nIRiA5W-E_filtered.json b/annotations_filtered/v5nIRiA5W-E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3be9b3b82f678222ab0c531b35e839f83f0e537 --- /dev/null +++ b/annotations_filtered/v5nIRiA5W-E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.4], [9.0, 9.53], [16.0, 28.19], [33.0, 34.69], [41.0, 41.35], [45.0, 52.44], [53.0, 52.96], [54.0, 54.67], [55.0, 64.1], [65.0, 100.18]], "keep_status": [false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.87, 0.0, 0.0, 31.03, 0.0, 0.0, 29.42, 0.0], "audiomae_on_audioset": [null, null, [["music", 23.92], ["livestock, farm animals, working animals", 13.93], ["mosquito", 13.1]], null, null, [["speech", 47.2], ["music", 18.88], ["grunt", 8.26]], null, null, [["cattle, bovinae", 38.03], ["livestock, farm animals, working animals", 19.59], ["moo", 19.59]], null], "duration": [1.4, 0.53, 12.19, 1.69, 0.35, 7.44, -0.04, 0.67, 9.1, 35.18]} \ No newline at end of file diff --git a/annotations_filtered/v5qwMeiEF0M_filtered.json b/annotations_filtered/v5qwMeiEF0M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e34abc8c67b29e7a52420d49674025151510983 --- /dev/null +++ b/annotations_filtered/v5qwMeiEF0M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.24], [7.0, 7.86], [9.0, 11.15], [13.0, 13.96], [15.0, 16.77], [22.0, 27.65], [29.0, 30.54], [34.0, 43.55], [45.0, 46.53], [47.0, 48.56], [49.0, 56.64], [60.0, 61.65], [63.0, 64.61], [76.0, 77.92], [79.0, 78.95], [81.0, 82.51], [85.0, 85.55], [114.0, 131.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.97, 0.0, 71.72, 0.0, 0.0, 60.32, 0.0, 78.55, 0.0, 0.0, 60.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 46.05], ["mains hum", 39.32], ["music", 4.14]]], "duration": [2.24, 0.86, 2.15, 0.96, 1.77, 5.65, 1.54, 9.55, 1.53, 1.56, 7.64, 1.65, 1.61, 1.92, -0.05, 1.51, 0.55, 17.65]} \ No newline at end of file diff --git a/annotations_filtered/v5ueLuyLWn4_filtered.json b/annotations_filtered/v5ueLuyLWn4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..200049129c3747587838d75ab4a47d30118604dc --- /dev/null +++ b/annotations_filtered/v5ueLuyLWn4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.84], [6.0, 21.29], [22.0, 22.92], [24.0, 25.41], [27.0, 31.38], [33.0, 35.5], [39.0, 41.15]], "keep_status": [false, true, false, false, false, true, true], "silence_prob": [0.0, 46.9, 0.0, 0.0, 31.49, 41.52, 33.4], "audiomae_on_audioset": [null, [["frog", 48.08], ["quack", 10.81], ["croak", 6.95]], null, null, [["speech", 46.04], ["music", 31.12], ["hum", 6.86]], [["hum", 24.8], ["mains hum", 24.08], ["sidetone", 15.38]], [["music", 40.7], ["buzz", 9.83], ["bee, wasp, etc.", 7.57]]], "duration": [0.84, 15.29, 0.92, 1.41, 4.38, 2.5, 2.15]} \ No newline at end of file diff --git a/annotations_filtered/v5wBisDJJ5A_filtered.json b/annotations_filtered/v5wBisDJJ5A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d21d48f1674b34ba0fcdf08bb3e13b1d86d8fb0b --- /dev/null +++ b/annotations_filtered/v5wBisDJJ5A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[51.0, 111.13], [114.0, 115.43]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [60.13, 1.43]} \ No newline at end of file diff --git a/annotations_filtered/v6bD23vEigE_filtered.json b/annotations_filtered/v6bD23vEigE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4c7621901d72cbf1e848a5813b25cb48fc67973 --- /dev/null +++ b/annotations_filtered/v6bD23vEigE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.62], [9.0, 17.49], [21.0, 26.97], [28.0, 30.42], [31.0, 32.71], [33.0, 34.99], [38.0, 50.92], [52.0, 70.83], [72.0, 72.47], [73.0, 81.35], [83.0, 84.84], [85.0, 89.61], [90.0, 92.55], [94.0, 95.91], [97.0, 97.53], [99.0, 104.77], [106.0, 107.7], [108.0, 109.61], [110.0, 113.73], [115.0, 116.31], [119.0, 124.98], [126.0, 127.36], [129.0, 132.44], [133.0, 133.73], [135.0, 135.89], [137.0, 137.84], [139.0, 141.17], [142.0, 146.15], [147.0, 150.01], [152.0, 152.68], [154.0, 157.33], [159.0, 162.36], [164.0, 166.45], [168.0, 170.5], [172.0, 183.71]], "keep_status": [false, true, false, true, false, false, true, true, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 32.96, 49.36, 48.02, 0.0, 0.0, 36.31, 45.92, 0.0, 55.31, 0.0, 44.29, 48.91, 0.0, 0.0, 57.64, 0.0, 0.0, 50.26, 0.0, 50.81, 0.0, 52.39, 0.0, 0.0, 0.0, 55.74, 47.12, 51.12, 0.0, 51.34, 50.56, 36.33, 53.28, 54.1], "audiomae_on_audioset": [null, [["speech", 28.02], ["hum", 17.05], ["music", 12.28]], [["theremin", 55.23], ["music", 23.87], ["whale vocalization", 2.36]], [["music", 42.48], ["hum", 5.52], ["throbbing", 4.68]], null, null, [["music", 54.84], ["theremin", 9.92], ["ambient music", 5.13]], [["music", 57.47], ["bee, wasp, etc.", 4.37], ["ambient music", 4.03]], null, null, null, [["speech", 33.46], ["music", 18.81], ["didgeridoo", 5.57]], [["music", 29.53], ["speech", 17.61], ["pulse", 7.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 29.25], ["theremin", 25.72], ["hum", 7.05]], null, null, null, null, [["music", 20.86], ["speech", 6.4], ["mains hum", 6.18]], null, null], "duration": [0.62, 8.49, 5.97, 2.42, 1.71, 1.99, 12.92, 18.83, 0.47, 8.35, 1.84, 4.61, 2.55, 1.91, 0.53, 5.77, 1.7, 1.61, 3.73, 1.31, 5.98, 1.36, 3.44, 0.73, 0.89, 0.84, 2.17, 4.15, 3.01, 0.68, 3.33, 3.36, 2.45, 2.5, 11.71]} \ No newline at end of file diff --git a/annotations_filtered/v71Epv4g6jY_filtered.json b/annotations_filtered/v71Epv4g6jY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a11fae64956c3cdb854bb485585e91c7fde62a3 --- /dev/null +++ b/annotations_filtered/v71Epv4g6jY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.02], [7.0, 10.72], [13.0, 13.68], [18.0, 20.44], [23.0, 25.56], [27.0, 31.89], [36.0, 38.25], [41.0, 41.5], [42.0, 41.57], [42.0, 41.64], [42.0, 42.8], [43.0, 44.24], [46.0, 46.01], [46.0, 47.28], [48.0, 49.08], [50.0, 51.33], [56.0, 56.73], [59.0, 65.57], [69.0, 71.41], [73.0, 76.67], [79.0, 82.71], [85.0, 86.24], [87.0, 87.37], [91.0, 95.05], [97.0, 97.71], [100.0, 100.25], [100.0, 100.79], [102.0, 102.15], [103.0, 103.2], [105.0, 107.81], [110.0, 114.52], [116.0, 118.03], [120.0, 125.79]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, true, true], "silence_prob": [44.04, 39.22, 0.0, 44.87, 41.81, 37.51, 37.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.75, 37.39, 79.24, 55.18, 0.0, 0.0, 33.34, 0.0, 0.0, 0.0, 0.0, 0.0, 36.98, 34.44, 41.76, 33.54], "audiomae_on_audioset": [[["telephone", 28.12], ["telephone bell ringing", 13.2], ["creak", 8.38]], [["speech", 49.33], ["music", 19.94], ["wind instrument, woodwind instrument", 2.99]], null, [["music", 18.85], ["musical instrument", 3.22], ["speech", 2.63]], [["sine wave", 55.61], ["chirp tone", 10.36], ["sidetone", 5.29]], [["music", 36.51], ["theremin", 35.33], ["speech", 5.56]], [["theremin", 53.29], ["music", 32.04], ["musical instrument", 2.71]], null, null, null, null, null, null, null, null, null, null, [["radio", 44.1], ["speech", 17.52], ["noise", 8.53]], [["whale vocalization", 16.36], ["music", 13.91], ["speech", 6.08]], null, null, null, null, [["music", 37.96], ["theremin", 23.03], ["whale vocalization", 4.35]], null, null, null, null, null, [["speech", 38.68], ["music", 24.39], ["gong", 10.82]], [["burping, eructation", 52.09], ["grunt", 24.7], ["speech", 9.05]], [["music", 21.59], ["synthesizer", 21.01], ["chirp tone", 11.34]], [["noise", 26.51], ["whale vocalization", 19.04], ["hum", 11.58]]], "duration": [2.02, 3.72, 0.68, 2.44, 2.56, 4.89, 2.25, 0.5, -0.43, -0.36, 0.8, 1.24, 0.01, 1.28, 1.08, 1.33, 0.73, 6.57, 2.41, 3.67, 3.71, 1.24, 0.37, 4.05, 0.71, 0.25, 0.79, 0.15, 0.2, 2.81, 4.52, 2.03, 5.79]} \ No newline at end of file diff --git a/annotations_filtered/v757jrOBkng_filtered.json b/annotations_filtered/v757jrOBkng_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b59056a3b740953d0e9fe037b67fa925dd76dff --- /dev/null +++ b/annotations_filtered/v757jrOBkng_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.54], [5.0, 5.21], [7.0, 8.34], [11.0, 11.64], [14.0, 14.91], [18.0, 17.91], [22.0, 22.67], [24.0, 24.73], [28.0, 28.93], [31.0, 30.91], [41.0, 42.6], [44.0, 44.51], [45.0, 45.81], [51.0, 51.41], [56.0, 58.23], [60.0, 60.52], [61.0, 61.64], [65.0, 67.07], [68.0, 70.16], [71.0, 73.67], [78.0, 78.54], [82.0, 84.0], [85.0, 96.85], [98.0, 99.59], [100.0, 102.25], [103.0, 105.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 99.78, 99.56, 0.0, 100.0, 97.54, 0.0, 97.54, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.54, 0.21, 1.34, 0.64, 0.91, -0.09, 0.67, 0.73, 0.93, -0.09, 1.6, 0.51, 0.81, 0.41, 2.23, 0.52, 0.64, 2.07, 2.16, 2.67, 0.54, 2.0, 11.85, 1.59, 2.25, 2.24]} \ No newline at end of file diff --git a/annotations_filtered/v79foBIrar4_filtered.json b/annotations_filtered/v79foBIrar4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73d3d119dc4fc6ea49c5d91b729300fb184fb9f5 --- /dev/null +++ b/annotations_filtered/v79foBIrar4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.59], [15.0, 17.15], [18.0, 65.06], [66.0, 67.81], [69.0, 82.32], [83.0, 85.53], [86.0, 86.86], [88.0, 90.46], [91.0, 93.77], [94.0, 94.26], [94.0, 102.27], [104.0, 104.92], [106.0, 108.21], [109.0, 110.96], [112.0, 115.43], [117.0, 119.01], [120.0, 121.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 79.76, 100.0, 0.0, 100.0, 100.0, 0.0, 68.28, 0.0, 94.95, 0.0, 87.37, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.59, 2.15, 47.06, 1.81, 13.32, 2.53, 0.86, 2.46, 2.77, 0.26, 8.27, 0.92, 2.21, 1.96, 3.43, 2.01, 1.46]} \ No newline at end of file diff --git a/annotations_filtered/v7FL42Fon3g_filtered.json b/annotations_filtered/v7FL42Fon3g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6980b3056ea9766895309deeef5c7077a1ffac33 --- /dev/null +++ b/annotations_filtered/v7FL42Fon3g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.81], [7.0, 7.62], [12.0, 45.86], [47.0, 47.46], [50.0, 50.23], [51.0, 51.49], [53.0, 75.3], [80.0, 89.58], [91.0, 91.45], [93.0, 93.33], [94.0, 95.69], [97.0, 97.55], [100.0, 101.29], [107.0, 108.9], [111.0, 116.65], [117.0, 116.73], [117.0, 118.54], [120.0, 120.34], [123.0, 124.28], [125.0, 126.2], [128.0, 130.0], [131.0, 131.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.65, 34.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.34, 0.0, 0.0, 0.0, 0.0, 0.0, 37.04, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 66.7], ["musical instrument", 3.49], ["hum", 2.58]], [["music", 67.64], ["musical instrument", 9.75], ["didgeridoo", 2.93]], null, null, null, null, null, null, [["music", 30.43], ["musical instrument", 13.88], ["brass instrument", 11.07]], null, null, null, null, null, [["music", 27.5], ["didgeridoo", 12.5], ["fart", 8.96]], null], "duration": [0.81, 0.62, 33.86, 0.46, 0.23, 0.49, 22.3, 9.58, 0.45, 0.33, 1.69, 0.55, 1.29, 1.9, 5.65, -0.27, 1.54, 0.34, 1.28, 1.2, 2.0, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/v7QfNBfZT3w_filtered.json b/annotations_filtered/v7QfNBfZT3w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08c9965c77f0ccb45512bbf5131f9a7b4cc85d1c --- /dev/null +++ b/annotations_filtered/v7QfNBfZT3w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.79], [8.0, 9.63], [12.0, 14.23], [16.0, 22.25], [23.0, 24.68], [32.0, 33.12], [33.0, 36.98], [43.0, 44.93], [51.0, 55.75], [57.0, 56.61], [58.0, 59.66], [63.0, 63.34], [65.0, 66.7], [67.0, 68.59], [70.0, 71.66], [73.0, 73.63], [76.0, 76.71], [82.0, 83.0], [83.0, 84.01], [85.0, 93.46], [95.0, 96.53], [98.0, 99.91], [106.0, 108.23], [114.0, 115.6], [117.0, 117.14], [119.0, 119.4], [121.0, 122.12], [122.0, 122.79], [124.0, 125.31], [129.0, 129.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 71.0, 45.33, 0.0, 0.0, 45.95, 0.0, 96.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.11, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 44.94], ["sidetone", 34.97], ["music", 4.37]], null, null, [["speech", 87.04], ["sidetone", 4.5], ["inside, small room", 0.88]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.79, 1.63, 2.23, 6.25, 1.68, 1.12, 3.98, 1.93, 4.75, -0.39, 1.66, 0.34, 1.7, 1.59, 1.66, 0.63, 0.71, 1.0, 1.01, 8.46, 1.53, 1.91, 2.23, 1.6, 0.14, 0.4, 1.12, 0.79, 1.31, 0.41]} \ No newline at end of file diff --git a/annotations_filtered/v7kRQXWpSdE_filtered.json b/annotations_filtered/v7kRQXWpSdE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..623d7a4819e3a1fb0e19c532c774d12532684824 --- /dev/null +++ b/annotations_filtered/v7kRQXWpSdE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.21], [10.0, 20.06], [20.0, 52.0]], "keep_status": [false, false, false], "silence_prob": [99.99, 86.64, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [2.21, 10.06, 32.0]} \ No newline at end of file diff --git a/annotations_filtered/v8CflcvxDJo_filtered.json b/annotations_filtered/v8CflcvxDJo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d14d110542819689e04bea035e8de354cb45e1d --- /dev/null +++ b/annotations_filtered/v8CflcvxDJo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 59.98], [61.0, 69.15], [70.0, 73.33], [78.0, 77.85], [80.0, 80.13], [84.0, 83.69], [85.0, 89.61], [94.0, 105.24], [106.0, 107.28], [109.0, 151.95]], "keep_status": [false, true, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 30.54, 30.03, 0.0, 0.0, 0.0, 30.58, 31.69, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 28.4], ["animal", 9.4], ["hum", 3.95]], [["livestock, farm animals, working animals", 20.57], ["moo", 19.82], ["cattle, bovinae", 15.91]], null, null, null, [["music", 61.08], ["throbbing", 9.42], ["electronic music", 4.53]], [["music", 49.63], ["hum", 10.14], ["throbbing", 10.03]], null, null], "duration": [46.98, 8.15, 3.33, -0.15, 0.13, -0.31, 4.61, 11.24, 1.28, 42.95]} \ No newline at end of file diff --git a/annotations_filtered/v8KA0GieSoE_filtered.json b/annotations_filtered/v8KA0GieSoE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f55d3f5821309d62e94358c9fcf33ca51ea61940 --- /dev/null +++ b/annotations_filtered/v8KA0GieSoE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[85.0, 89.04]], "keep_status": [false], "silence_prob": [30.93], "audiomae_on_audioset": [[["speech", 57.23], ["music", 25.87], ["musical instrument", 1.8]]], "duration": [4.04]} \ No newline at end of file diff --git a/annotations_filtered/v8OMHtUg9sU_filtered.json b/annotations_filtered/v8OMHtUg9sU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20dc1edf3604762bac8ec402cef3e6153378ea7a --- /dev/null +++ b/annotations_filtered/v8OMHtUg9sU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[57.0, 74.06], [75.0, 75.54], [76.0, 77.87], [85.0, 84.72], [86.0, 87.03], [120.0, 120.23]], "keep_status": [false, false, false, false, false, false], "silence_prob": [33.52, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 48.81], ["boing", 30.93], ["music", 4.48]], null, null, null, null, null], "duration": [17.06, 0.54, 1.87, -0.28, 1.03, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/v8UDjwdqzKY_filtered.json b/annotations_filtered/v8UDjwdqzKY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33f7d3fcdc51ddc3a1b99112aef728c10b590bba --- /dev/null +++ b/annotations_filtered/v8UDjwdqzKY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.87], [7.0, 6.64], [7.0, 7.87], [9.0, 9.48], [13.0, 13.1], [22.0, 21.74], [29.0, 29.0], [30.0, 30.5], [32.0, 31.73], [33.0, 33.49], [38.0, 38.1], [46.0, 47.51], [49.0, 49.67], [51.0, 52.24], [54.0, 53.82], [55.0, 57.06], [59.0, 61.65], [63.0, 63.71], [64.0, 64.89], [65.0, 65.85], [67.0, 68.22], [69.0, 69.77], [71.0, 70.85], [72.0, 72.74], [74.0, 74.56], [86.0, 85.97], [88.0, 88.62], [91.0, 90.91], [92.0, 92.15], [98.0, 98.22], [101.0, 100.79], [102.0, 102.98], [105.0, 105.66], [115.0, 117.04], [118.0, 117.98], [119.0, 119.74], [120.0, 124.21], [127.0, 129.2], [131.0, 132.65], [134.0, 134.2], [135.0, 136.09], [137.0, 137.44], [138.0, 139.19], [140.0, 140.39], [141.0, 141.45], [142.0, 143.72], [144.0, 144.83], [146.0, 147.26], [148.0, 148.63], [150.0, 151.36], [152.0, 153.45], [154.0, 155.34], [157.0, 157.84], [160.0, 161.23], [162.0, 162.23], [165.0, 165.37], [166.0, 166.08], [167.0, 167.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.04, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.87, -0.36, 0.87, 0.48, 0.1, -0.26, 0.0, 0.5, -0.27, 0.49, 0.1, 1.51, 0.67, 1.24, -0.18, 2.06, 2.65, 0.71, 0.89, 0.85, 1.22, 0.77, -0.15, 0.74, 0.56, -0.03, 0.62, -0.09, 0.15, 0.22, -0.21, 0.98, 0.66, 2.04, -0.02, 0.74, 4.21, 2.2, 1.65, 0.2, 1.09, 0.44, 1.19, 0.39, 0.45, 1.72, 0.83, 1.26, 0.63, 1.36, 1.45, 1.34, 0.84, 1.23, 0.23, 0.37, 0.08, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/v8c2XZdCS_A_filtered.json b/annotations_filtered/v8c2XZdCS_A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd9f62af1455bae9eded58a137b79b0b63b5eafa --- /dev/null +++ b/annotations_filtered/v8c2XZdCS_A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.62], [16.0, 16.8], [20.0, 21.0], [25.0, 25.59], [30.0, 30.74], [41.0, 41.5], [43.0, 43.58], [46.0, 46.21], [67.0, 67.31], [69.0, 68.74], [69.0, 72.59], [78.0, 78.63], [82.0, 83.93], [86.0, 86.32], [88.0, 88.65], [92.0, 92.74], [96.0, 96.97], [99.0, 99.01], [104.0, 104.5], [108.0, 109.46], [113.0, 119.16]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.11], "audiomae_on_audioset": [[["music", 47.53], ["speech", 14.6], ["boing", 6.64]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.62, 0.8, 1.0, 0.59, 0.74, 0.5, 0.58, 0.21, 0.31, -0.26, 3.59, 0.63, 1.93, 0.32, 0.65, 0.74, 0.97, 0.01, 0.5, 1.46, 6.16]} \ No newline at end of file diff --git a/annotations_filtered/v8kB6cqv8qM_filtered.json b/annotations_filtered/v8kB6cqv8qM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3cfb11381f3badc50490197d381fde2ee0cf681d --- /dev/null +++ b/annotations_filtered/v8kB6cqv8qM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.96], [15.0, 15.16], [22.0, 24.29], [27.0, 29.46], [32.0, 32.43], [37.0, 36.98], [42.0, 51.6], [53.0, 73.82], [82.0, 83.1], [84.0, 89.33], [97.0, 97.36], [104.0, 118.69], [121.0, 121.44]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 82.79, 31.82, 0.0, 0.0, 29.89, 29.8, 0.0, 29.97, 0.0, 29.17, 0.0], "audiomae_on_audioset": [null, null, null, [["fly, housefly", 16.07], ["music", 12.84], ["insect", 7.78]], null, null, [["speech", 61.56], ["electric shaver, electric razor", 15.77], ["music", 5.77]], [["music", 25.11], ["mains hum", 16.52], ["hum", 16.09]], null, [["throbbing", 28.66], ["music", 26.08], ["hum", 23.75]], null, [["hum", 23.21], ["speech", 22.39], ["music", 15.66]], null], "duration": [0.96, 0.16, 2.29, 2.46, 0.43, -0.02, 9.6, 20.82, 1.1, 5.33, 0.36, 14.69, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/v96ND45Aqmo_filtered.json b/annotations_filtered/v96ND45Aqmo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9a8285a1496bd4ca9fbb2aab09f8a53030b1fdc --- /dev/null +++ b/annotations_filtered/v96ND45Aqmo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.21], [16.0, 16.95], [19.0, 19.74], [21.0, 22.3], [24.0, 25.35], [26.0, 26.64], [31.0, 31.53], [32.0, 33.49], [35.0, 34.75], [39.0, 40.15], [41.0, 42.11], [44.0, 44.27], [51.0, 60.72], [66.0, 66.7], [67.0, 68.08], [79.0, 80.81], [81.0, 82.54], [85.0, 87.81], [88.0, 93.16], [95.0, 98.37], [103.0, 102.98], [104.0, 108.01], [110.0, 110.12], [112.0, 112.01], [114.0, 114.47], [117.0, 121.37], [123.0, 125.91], [126.0, 128.61], [136.0, 147.88], [150.0, 152.85], [153.0, 164.69], [167.0, 169.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 0.0, 0.0, 0.0, 0.0, 94.22, 62.68, 96.66, 0.0, 95.37, 0.0, 0.0, 0.0, 92.15, 83.52, 85.17, 34.33, 58.13, 46.57, 58.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.94], ["throbbing", 25.43], ["hum", 15.23]], null, [["music", 46.51], ["hum", 11.21], ["throbbing", 9.94]], null], "duration": [0.21, 0.95, 0.74, 1.3, 1.35, 0.64, 0.53, 1.49, -0.25, 1.15, 1.11, 0.27, 9.72, 0.7, 1.08, 1.81, 1.54, 2.81, 5.16, 3.37, -0.02, 4.01, 0.12, 0.01, 0.47, 4.37, 2.91, 2.61, 11.88, 2.85, 11.69, 2.01]} \ No newline at end of file diff --git a/annotations_filtered/v98Rh9qzmPs_filtered.json b/annotations_filtered/v98Rh9qzmPs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1239f38416c4e1193320260536041767dec8338 --- /dev/null +++ b/annotations_filtered/v98Rh9qzmPs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 9.53], [10.0, 11.79], [13.0, 14.32], [15.0, 38.23], [39.0, 39.61], [40.0, 41.18], [44.0, 46.04], [47.0, 49.44], [64.0, 65.57], [69.0, 72.08], [76.0, 80.25], [81.0, 91.44], [99.0, 99.82], [100.0, 101.98], [107.0, 120.63], [123.0, 133.74], [135.0, 159.21], [160.0, 160.83], [164.0, 165.3], [167.0, 180.1]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [35.87, 0.0, 0.0, 29.47, 0.0, 0.0, 28.58, 29.61, 0.0, 35.91, 32.88, 31.92, 0.0, 0.0, 31.57, 37.55, 39.04, 0.0, 0.0, 61.57], "audiomae_on_audioset": [[["rumble", 32.66], ["hum", 17.93], ["throbbing", 11.46]], null, null, [["hum", 69.95], ["mains hum", 13.1], ["throbbing", 11.39]], null, null, [["bow-wow", 44.89], ["dog", 19.01], ["bark", 10.62]], [["whale vocalization", 57.75], ["speech", 17.92], ["hum", 10.21]], null, [["speech", 65.3], ["eruption", 4.22], ["clip-clop", 3.72]], [["hum", 58.28], ["throbbing", 19.15], ["mains hum", 5.31]], [["hum", 43.85], ["throbbing", 14.36], ["noise", 7.84]], null, null, [["hum", 36.14], ["mains hum", 15.58], ["music", 7.19]], [["hum", 45.26], ["mains hum", 31.36], ["throbbing", 6.13]], [["music", 54.8], ["hum", 8.86], ["ambient music", 6.78]], null, null, null], "duration": [7.53, 1.79, 1.32, 23.23, 0.61, 1.18, 2.04, 2.44, 1.57, 3.08, 4.25, 10.44, 0.82, 1.98, 13.63, 10.74, 24.21, 0.83, 1.3, 13.1]} \ No newline at end of file diff --git a/annotations_filtered/v9Cq9nThaNs_filtered.json b/annotations_filtered/v9Cq9nThaNs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb489d1a7cf1e6be6c3466eb90cb221a727845d1 --- /dev/null +++ b/annotations_filtered/v9Cq9nThaNs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.72], [1.0, 12.21], [12.0, 12.28], [17.0, 24.88], [30.0, 29.81], [31.0, 40.74], [43.0, 43.87], [55.0, 63.54], [66.0, 66.82], [70.0, 71.88], [74.0, 75.09], [76.0, 76.45], [79.0, 83.39], [85.0, 100.45], [112.0, 131.36], [136.0, 148.69], [153.0, 178.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 28.89, 0.0, 28.29, 0.0, 28.95, 0.0, 28.96, 0.0, 0.0, 0.0, 0.0, 29.44, 29.4, 29.07, 29.01, 28.85], "audiomae_on_audioset": [null, [["speech", 51.24], ["music", 21.72], ["vehicle", 5.8]], null, [["vehicle", 34.74], ["music", 18.36], ["car", 18.32]], null, [["music", 47.78], ["speech", 14.1], ["hum", 12.5]], null, [["music", 65.09], ["throbbing", 17.14], ["hum", 7.18]], null, null, null, null, [["music", 81.71], ["throbbing", 4.16], ["electronic music", 3.46]], [["music", 27.94], ["vehicle", 26.41], ["car", 12.19]], [["music", 65.13], ["throbbing", 11.17], ["hum", 7.84]], [["music", 62.36], ["throbbing", 13.21], ["hum", 8.34]], [["music", 48.27], ["throbbing", 21.01], ["hum", 16.25]]], "duration": [-0.28, 11.21, 0.28, 7.88, -0.19, 9.74, 0.87, 8.54, 0.82, 1.88, 1.09, 0.45, 4.39, 15.45, 19.36, 12.69, 25.12]} \ No newline at end of file diff --git a/annotations_filtered/v9UIDDlnSgA_filtered.json b/annotations_filtered/v9UIDDlnSgA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d0fb84bbddab782eb9cf62b70978bb700dd1432 --- /dev/null +++ b/annotations_filtered/v9UIDDlnSgA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.01], [18.0, 18.39], [18.0, 29.25], [30.0, 40.29], [45.0, 73.36], [74.0, 107.38]], "keep_status": [false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 29.35, 28.86, 29.12, 0.0], "audiomae_on_audioset": [null, null, [["music", 55.36], ["theremin", 10.22], ["whale vocalization", 5.14]], [["speech", 59.31], ["explosion", 5.54], ["hubbub, speech noise, speech babble", 3.71]], [["music", 47.24], ["speech", 15.06], ["vehicle", 5.97]], null], "duration": [1.01, 0.39, 11.25, 10.29, 28.36, 33.38]} \ No newline at end of file diff --git a/annotations_filtered/v9pZdy4lZ7U_filtered.json b/annotations_filtered/v9pZdy4lZ7U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb01741eabfbcfbd8536cf51a4d060c607c9b0ab --- /dev/null +++ b/annotations_filtered/v9pZdy4lZ7U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.41], [8.0, 10.94], [12.0, 13.9], [16.0, 20.75], [23.0, 24.53], [26.0, 27.65], [32.0, 44.31], [45.0, 45.74], [46.0, 45.81], [46.0, 46.94], [47.0, 46.99], [47.0, 54.43], [58.0, 78.21], [81.0, 84.97], [85.0, 91.64], [97.0, 132.17], [132.0, 132.68], [133.0, 149.98], [150.0, 150.01]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.84, 0.0, 31.67, 0.0, 0.0, 29.46, 0.0, 0.0, 0.0, 0.0, 29.86, 29.72, 29.42, 29.28, 0.0, 0.0, 30.7, 0.0], "audiomae_on_audioset": [null, [["music", 34.91], ["throbbing", 7.14], ["speech", 5.11]], null, [["fly, housefly", 46.28], ["mosquito", 25.69], ["insect", 6.8]], null, null, [["music", 22.32], ["buzz", 6.24], ["rumble", 5.89]], null, null, null, null, [["sound effect", 34.22], ["grunt", 17.69], ["speech", 16.26]], [["hum", 29.74], ["speech", 25.19], ["throbbing", 16.38]], [["hum", 37.56], ["mains hum", 30.12], ["rumble", 6.93]], [["whale vocalization", 48.34], ["hum", 13.01], ["music", 8.66]], null, null, [["music", 34.04], ["hum", 19.38], ["theremin", 19.05]], null], "duration": [0.41, 2.94, 1.9, 4.75, 1.53, 1.65, 12.31, 0.74, -0.19, 0.94, -0.01, 7.43, 20.21, 3.97, 6.64, 35.17, 0.68, 16.98, 0.01]} \ No newline at end of file diff --git a/annotations_filtered/v9qbXZZD-b0_filtered.json b/annotations_filtered/v9qbXZZD-b0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c4354d2d385ebef7787d87c45eae40e441a80a6 --- /dev/null +++ b/annotations_filtered/v9qbXZZD-b0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 37.45], [39.0, 57.42], [59.0, 67.88], [70.0, 70.44], [72.0, 72.23], [74.0, 79.08], [80.0, 87.96], [89.0, 92.65], [94.0, 95.66], [97.0, 97.73], [99.0, 100.47], [102.0, 107.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [33.96, 33.24, 63.96, 0.0, 0.0, 98.19, 89.72, 96.66, 0.0, 0.0, 0.0, 39.67], "audiomae_on_audioset": [[["music", 54.0], ["speech", 40.23], ["outside, rural or natural", 0.61]], [["cattle, bovinae", 51.75], ["livestock, farm animals, working animals", 30.58], ["moo", 13.83]], null, null, null, null, null, null, null, null, null, [["speech", 32.49], ["explosion", 13.41], ["sidetone", 6.26]]], "duration": [18.45, 18.42, 8.88, 0.44, 0.23, 5.08, 7.96, 3.65, 1.66, 0.73, 1.47, 5.86]} \ No newline at end of file diff --git a/annotations_filtered/vA1fVHBWuBU_filtered.json b/annotations_filtered/vA1fVHBWuBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..594e6bf3278ae44df451298d83adcc84a1d7f7f4 --- /dev/null +++ b/annotations_filtered/vA1fVHBWuBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.72], [14.0, 14.57], [19.0, 18.76], [45.0, 45.2], [58.0, 58.21], [66.0, 67.0], [69.0, 69.8], [72.0, 75.91], [78.0, 78.09], [80.0, 80.49], [84.0, 84.3], [86.0, 86.7], [88.0, 89.9], [92.0, 96.15], [99.0, 100.58], [105.0, 106.89], [111.0, 111.96], [113.0, 114.52], [116.0, 117.75], [121.0, 123.45], [126.0, 128.24], [132.0, 134.76], [136.0, 138.52], [139.0, 140.16], [145.0, 146.06], [150.0, 151.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 92.15, 0.0, 0.0, 0.0, 0.0, 0.0, 68.8, 99.98, 99.4, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, 0.57, -0.24, 0.2, 0.21, 1.0, 0.8, 3.91, 0.09, 0.49, 0.3, 0.7, 1.9, 4.15, 1.58, 1.89, 0.96, 1.52, 1.75, 2.45, 2.24, 2.76, 2.52, 1.16, 1.06, 1.24]} \ No newline at end of file diff --git a/annotations_filtered/vAYzTJIog1U_filtered.json b/annotations_filtered/vAYzTJIog1U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fd914d012df6c0f456e500ed83013240b9a811f --- /dev/null +++ b/annotations_filtered/vAYzTJIog1U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 25.37], [27.0, 27.9], [31.0, 33.64], [41.0, 41.82], [44.0, 44.49]], "keep_status": [true, false, true, false, false], "silence_prob": [40.84, 0.0, 30.29, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 27.3], ["speech", 14.48], ["music", 14.25]], null, [["sheep", 27.29], ["livestock, farm animals, working animals", 21.1], ["bleat", 13.89]], null, null], "duration": [15.37, 0.9, 2.64, 0.82, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/vAd0QlUaIBY_filtered.json b/annotations_filtered/vAd0QlUaIBY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38cffbb9deb0efba49017553f9870f5e3f433441 --- /dev/null +++ b/annotations_filtered/vAd0QlUaIBY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.11], [8.0, 9.59], [11.0, 13.9], [17.0, 16.8], [17.0, 18.64], [21.0, 21.03], [21.0, 21.74], [22.0, 22.42], [25.0, 27.23], [30.0, 31.06], [36.0, 36.22], [47.0, 47.7], [49.0, 49.91], [55.0, 55.22], [64.0, 64.1], [66.0, 65.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [71.43, 0.0, 97.64, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.11, 1.59, 2.9, -0.2, 1.64, 0.03, 0.74, 0.42, 2.23, 1.06, 0.22, 0.7, 0.91, 0.22, 0.1, -0.13]} \ No newline at end of file diff --git a/annotations_filtered/vAyq-3z1SYo_filtered.json b/annotations_filtered/vAyq-3z1SYo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8843165a70ecec0801f53cc50c9c5d7f2c43d27 --- /dev/null +++ b/annotations_filtered/vAyq-3z1SYo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.62], [16.0, 19.18], [20.0, 21.59], [23.0, 26.16], [29.0, 32.37], [34.0, 35.95], [37.0, 39.53], [40.0, 44.22], [45.0, 93.82]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [98.73, 99.31, 0.0, 97.22, 99.48, 0.0, 99.16, 99.4, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [2.62, 3.18, 1.59, 3.16, 3.37, 1.95, 2.53, 4.22, 48.82]} \ No newline at end of file diff --git a/annotations_filtered/vBAK4o8zHF4_filtered.json b/annotations_filtered/vBAK4o8zHF4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c7d42d98ac3eea5580835776d9c5ee64719e1d5 --- /dev/null +++ b/annotations_filtered/vBAK4o8zHF4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.15], [17.0, 17.49], [32.0, 33.2], [35.0, 36.71], [48.0, 48.59], [51.0, 52.42], [53.0, 53.65], [58.0, 64.56], [67.0, 72.13], [73.0, 74.28], [97.0, 103.69], [107.0, 108.78], [111.0, 119.45], [120.0, 125.46], [127.0, 127.7], [128.0, 132.43], [134.0, 136.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.51, 50.97, 0.0, 39.66, 0.0, 39.82, 35.59, 0.0, 35.09, 37.83], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 46.58], ["boing", 41.49], ["speech", 9.08]], null, [["music", 55.21], ["speech", 18.86], ["boing", 4.82]], [["music", 63.53], ["fly, housefly", 6.23], ["mosquito", 4.29]], null, [["speech", 40.18], ["music", 18.91], ["synthesizer", 2.85]], [["music", 23.06], ["throbbing", 14.66], ["hum", 8.53]]], "duration": [0.15, 0.49, 1.2, 1.71, 0.59, 1.42, 0.65, 6.56, 5.13, 1.28, 6.69, 1.78, 8.45, 5.46, 0.7, 4.43, 2.41]} \ No newline at end of file diff --git a/annotations_filtered/vBLcmGPbryg_filtered.json b/annotations_filtered/vBLcmGPbryg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c7c583551412519d6c0a02e4f65f65478e0f2d7 --- /dev/null +++ b/annotations_filtered/vBLcmGPbryg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.2], [7.0, 7.37], [19.0, 20.98], [38.0, 40.85], [42.0, 43.82], [66.0, 66.53], [77.0, 84.5], [88.0, 88.72], [92.0, 91.79], [94.0, 94.56], [97.0, 100.67], [104.0, 107.1], [110.0, 117.42], [127.0, 132.38], [134.0, 167.97], [168.0, 168.64], [172.0, 172.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 52.22, 0.0, 0.0, 41.54, 0.0, 0.0, 0.0, 35.89, 29.42, 30.44, 29.53, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 63.69], ["electronic music", 5.48], ["trance music", 5.03]], null, null, null, [["music", 57.14], ["hum", 5.43], ["throbbing", 4.71]], [["music", 25.43], ["crowd", 20.67], ["cheering", 6.77]], [["music", 63.15], ["didgeridoo", 8.18], ["groan", 2.27]], [["music", 18.38], ["crowd", 9.88], ["groan", 7.2]], null, null, null], "duration": [0.2, 0.37, 1.98, 2.85, 1.82, 0.53, 7.5, 0.72, -0.21, 0.56, 3.67, 3.1, 7.42, 5.38, 33.97, 0.64, 0.2]} \ No newline at end of file diff --git a/annotations_filtered/vBhBkvkofjk_filtered.json b/annotations_filtered/vBhBkvkofjk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df0c05f78ef8ca67613929c0781c9b35a290a060 --- /dev/null +++ b/annotations_filtered/vBhBkvkofjk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.84], [4.0, 5.22], [6.0, 28.27], [32.0, 32.9], [36.0, 35.68], [37.0, 41.34], [42.0, 43.8], [45.0, 46.5], [48.0, 48.09], [48.0, 48.76], [49.0, 49.2], [51.0, 52.47], [54.0, 54.23], [55.0, 55.34], [56.0, 56.47], [60.0, 60.56], [62.0, 64.91], [66.0, 66.8], [67.0, 67.61], [68.0, 68.25], [69.0, 69.33], [73.0, 94.29], [98.0, 97.97], [102.0, 102.51], [103.0, 103.32], [106.0, 105.81], [107.0, 109.78], [111.0, 112.08], [112.0, 112.41], [114.0, 113.78]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.94, 0.0, 0.0, 79.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.72, 0.0, 0.0, 0.0, 0.0, 66.27, 0.0, 0.0, 0.0, 0.0, 76.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 13.78], ["explosion", 9.38], ["eruption", 7.05]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 32.2], ["moo", 22.69], ["livestock, farm animals, working animals", 15.64]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.84, 1.22, 22.27, 0.9, -0.32, 4.34, 1.8, 1.5, 0.09, 0.76, 0.2, 1.47, 0.23, 0.34, 0.47, 0.56, 2.91, 0.8, 0.61, 0.25, 0.33, 21.29, -0.03, 0.51, 0.32, -0.19, 2.78, 1.08, 0.41, -0.22]} \ No newline at end of file diff --git a/annotations_filtered/vBtG9eqgf2Q_filtered.json b/annotations_filtered/vBtG9eqgf2Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6e360268b0a6a5b36bf41a243ab7eea2fc70615 --- /dev/null +++ b/annotations_filtered/vBtG9eqgf2Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 43.63], [47.0, 56.88], [59.0, 61.21], [62.0, 63.04], [65.0, 70.24], [72.0, 74.97], [77.0, 79.54], [90.0, 91.08], [96.0, 97.43], [103.0, 103.74], [104.0, 107.65], [108.0, 111.37], [112.0, 112.6], [113.0, 114.17], [115.0, 138.18], [144.0, 158.25], [161.0, 161.6], [163.0, 163.34], [164.0, 165.52], [167.0, 167.24], [168.0, 169.37], [170.0, 204.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [40.12, 57.32, 95.64, 0.0, 99.21, 99.98, 99.88, 0.0, 0.0, 0.0, 53.91, 45.65, 0.0, 0.0, 32.75, 31.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 91.19], ["throbbing", 1.75], ["electronic music", 0.54]], null, null, null, null, null, null, null, null, null, null, [["music", 68.54], ["synthesizer", 6.11], ["throbbing", 2.7]], null, null, [["music", 84.06], ["didgeridoo", 3.52], ["electronic music", 1.22]], [["music", 72.59], ["synthesizer", 5.75], ["speech", 4.84]], null, null, null, null, null, null], "duration": [29.63, 9.88, 2.21, 1.04, 5.24, 2.97, 2.54, 1.08, 1.43, 0.74, 3.65, 3.37, 0.6, 1.17, 23.18, 14.25, 0.6, 0.34, 1.52, 0.24, 1.37, 34.75]} \ No newline at end of file diff --git a/annotations_filtered/vCuU2y6qR2s_filtered.json b/annotations_filtered/vCuU2y6qR2s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ba9bff96b08507136ee0bf8734943d4acd89d8b --- /dev/null +++ b/annotations_filtered/vCuU2y6qR2s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.45], [5.0, 7.79], [9.0, 8.87], [9.0, 10.23], [14.0, 15.43], [18.0, 19.41], [20.0, 20.41], [21.0, 21.71], [24.0, 25.32], [27.0, 27.11], [31.0, 31.19], [34.0, 35.18], [37.0, 37.72], [40.0, 41.96], [44.0, 45.71], [57.0, 58.45], [78.0, 78.85], [82.0, 85.68], [88.0, 89.63], [112.0, 117.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 52.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.13, 0.0, 34.11], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 36.8], ["cattle, bovinae", 31.81], ["moo", 30.47]], null, [["livestock, farm animals, working animals", 19.06], ["fart", 9.35], ["crying, sobbing", 7.19]]], "duration": [1.45, 2.79, -0.13, 1.23, 1.43, 1.41, 0.41, 0.71, 1.32, 0.11, 0.19, 1.18, 0.72, 1.96, 1.71, 1.45, 0.85, 3.68, 1.63, 5.83]} \ No newline at end of file diff --git a/annotations_filtered/vD6FkjOtIIs_filtered.json b/annotations_filtered/vD6FkjOtIIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2ad4ab3b7e4b3b46190283420de0f131769e68e --- /dev/null +++ b/annotations_filtered/vD6FkjOtIIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.34], [5.0, 5.46], [6.0, 9.9], [11.0, 11.8], [13.0, 14.55], [16.0, 16.28], [17.0, 17.46], [21.0, 21.41], [29.0, 29.98], [34.0, 34.37], [38.0, 39.36], [41.0, 41.67], [43.0, 49.11], [52.0, 61.26], [62.0, 62.83], [65.0, 67.47], [69.0, 69.25], [71.0, 71.61], [72.0, 77.19], [79.0, 80.79], [83.0, 104.3], [106.0, 106.78], [108.0, 108.7], [111.0, 115.1], [116.0, 116.6], [119.0, 120.09], [121.0, 121.37], [122.0, 128.65], [131.0, 131.28], [134.0, 135.11], [136.0, 138.77], [139.0, 140.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 34.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.5, 32.94, 0.0, 34.96, 0.0, 0.0, 31.92, 0.0, 31.84, 0.0, 0.0, 93.91, 0.0, 0.0, 0.0, 31.01, 0.0, 0.0, 31.45, 0.0], "audiomae_on_audioset": [null, null, [["civil defense siren", 62.92], ["siren", 20.1], ["whale vocalization", 10.17]], null, null, null, null, null, null, null, null, null, [["music", 48.93], ["speech", 18.21], ["breaking", 13.29]], [["music", 34.53], ["speech", 19.09], ["fly, housefly", 11.99]], null, [["music", 27.92], ["speech", 18.23], ["didgeridoo", 15.6]], null, null, [["fly, housefly", 66.8], ["mosquito", 13.1], ["insect", 6.5]], null, [["music", 46.03], ["speech", 32.28], ["didgeridoo", 2.52]], null, null, null, null, null, null, [["music", 68.77], ["hum", 3.56], ["christmas music", 2.78]], null, null, [["music", 40.77], ["fly, housefly", 5.95], ["mosquito", 5.59]], null], "duration": [0.34, 0.46, 3.9, 0.8, 1.55, 0.28, 0.46, 0.41, 0.98, 0.37, 1.36, 0.67, 6.11, 9.26, 0.83, 2.47, 0.25, 0.61, 5.19, 1.79, 21.3, 0.78, 0.7, 4.1, 0.6, 1.09, 0.37, 6.65, 0.28, 1.11, 2.77, 1.8]} \ No newline at end of file diff --git a/annotations_filtered/vDzbcWty6m0_filtered.json b/annotations_filtered/vDzbcWty6m0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..93097e411e5b7fac331ed1905e1efde5aed92e46 --- /dev/null +++ b/annotations_filtered/vDzbcWty6m0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 21.34], [24.0, 24.51], [34.0, 34.69], [36.0, 38.97], [42.0, 44.81], [46.0, 47.55], [50.0, 50.95], [60.0, 61.42], [67.0, 74.04], [81.0, 81.21], [85.0, 86.39], [87.0, 89.16], [94.0, 94.66], [98.0, 98.74], [100.0, 104.45], [105.0, 105.43], [106.0, 106.35], [107.0, 108.26], [109.0, 109.63], [112.0, 111.97], [113.0, 116.36], [119.0, 120.99], [122.0, 125.56]], "keep_status": [true, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.61, 0.0, 0.0, 29.53, 66.63, 0.0, 0.0, 0.0, 30.61, 0.0, 0.0, 50.16, 0.0, 0.0, 86.09, 0.0, 0.0, 0.0, 0.0, 0.0, 32.13, 0.0, 86.82], "audiomae_on_audioset": [[["music", 50.7], ["thunk", 11.2], ["effects unit", 4.77]], null, null, [["whack, thwack", 31.23], ["thump, thud", 19.15], ["speech", 5.09]], null, null, null, null, [["speech", 61.68], ["animal", 2.89], ["fart", 2.76]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.48], ["music", 23.02], ["beatboxing", 13.79]], null, null], "duration": [5.34, 0.51, 0.69, 2.97, 2.81, 1.55, 0.95, 1.42, 7.04, 0.21, 1.39, 2.16, 0.66, 0.74, 4.45, 0.43, 0.35, 1.26, 0.63, -0.03, 3.36, 1.99, 3.56]} \ No newline at end of file diff --git a/annotations_filtered/vE0nmQGO4Hk_filtered.json b/annotations_filtered/vE0nmQGO4Hk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0fe8ed7621d62f4fc3baf43dd18b4dc17dad3c3 --- /dev/null +++ b/annotations_filtered/vE0nmQGO4Hk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.11], [12.0, 20.63], [23.0, 23.48], [24.0, 29.07], [31.0, 31.72], [40.0, 64.44], [64.0, 68.4], [70.0, 76.55], [80.0, 86.1], [87.0, 92.11], [92.0, 99.49], [100.0, 100.97], [103.0, 103.2]], "keep_status": [false, true, false, true, false, false, true, false, true, true, false, false, false], "silence_prob": [0.0, 31.23, 0.0, 35.94, 0.0, 30.67, 32.66, 30.69, 30.29, 30.14, 38.3, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 35.7], ["music", 14.62], ["sonar", 10.14]], null, [["mains hum", 26.52], ["hum", 22.85], ["speech", 8.62]], null, [["music", 70.46], ["didgeridoo", 7.65], ["hum", 6.91]], [["music", 27.91], ["hum", 18.46], ["throbbing", 11.74]], [["music", 64.92], ["synthesizer", 6.55], ["didgeridoo", 4.22]], [["music", 32.11], ["throbbing", 16.24], ["hum", 14.99]], [["music", 28.72], ["breaking", 18.2], ["explosion", 4.34]], [["hum", 54.81], ["mains hum", 21.58], ["speech", 8.56]], null, null], "duration": [1.11, 8.63, 0.48, 5.07, 0.72, 24.44, 4.4, 6.55, 6.1, 5.11, 7.49, 0.97, 0.2]} \ No newline at end of file diff --git a/annotations_filtered/vE8mFDabqD0_filtered.json b/annotations_filtered/vE8mFDabqD0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4edad07107e6d5efb4a7e8e25e66c88d3235fcd4 --- /dev/null +++ b/annotations_filtered/vE8mFDabqD0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 24.61], [25.0, 31.8], [33.0, 34.57], [35.0, 42.08], [42.0, 46.23], [47.0, 49.5], [50.0, 55.44], [58.0, 61.18], [67.0, 69.58], [76.0, 76.81], [82.0, 82.56], [85.0, 86.85], [87.0, 88.55], [89.0, 90.41], [91.0, 95.34], [107.0, 108.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [75.55, 78.89, 0.0, 75.55, 71.29, 79.07, 78.04, 64.86, 50.41, 0.0, 0.0, 0.0, 0.0, 0.0, 49.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 22.31], ["music", 19.91], ["mains hum", 15.11]], null], "duration": [17.61, 6.8, 1.57, 7.08, 4.23, 2.5, 5.44, 3.18, 2.58, 0.81, 0.56, 1.85, 1.55, 1.41, 4.34, 1.16]} \ No newline at end of file diff --git a/annotations_filtered/vEDyFvKFcoQ_filtered.json b/annotations_filtered/vEDyFvKFcoQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d53af0d4c8adda00f8cc7eb7e93f6fea84f1932 --- /dev/null +++ b/annotations_filtered/vEDyFvKFcoQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.7], [2.0, 2.86], [3.0, 3.84], [4.0, 4.99], [6.0, 6.61], [13.0, 13.95], [15.0, 15.45], [17.0, 17.44], [19.0, 20.71], [22.0, 22.35], [23.0, 23.19], [24.0, 26.77], [28.0, 30.5], [33.0, 33.3], [35.0, 35.24], [41.0, 42.62], [45.0, 46.16], [60.0, 60.02], [61.0, 62.01], [63.0, 67.54], [68.0, 70.65], [81.0, 83.3], [85.0, 86.66], [87.0, 87.02], [96.0, 103.52], [107.0, 108.23], [114.0, 115.89], [119.0, 120.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.05, 97.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 93.6, 47.9, 0.0, 0.0, 75.23, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["boing", 19.05], ["music", 10.32], ["animal", 10.27]], null, null, null, null, null, null], "duration": [0.7, 0.86, 0.84, 0.99, 0.61, 0.95, 0.45, 0.44, 1.71, 0.35, 0.19, 2.77, 2.5, 0.3, 0.24, 1.62, 1.16, 0.02, 1.01, 4.54, 2.65, 2.3, 1.66, 0.02, 7.52, 1.23, 1.89, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/vEFoOcev00s_filtered.json b/annotations_filtered/vEFoOcev00s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa0f9db688e36399f6846e3c7feacb32ae445a28 --- /dev/null +++ b/annotations_filtered/vEFoOcev00s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.01], [15.0, 16.33], [17.0, 19.99], [21.0, 23.58], [32.0, 34.21], [34.0, 35.13], [36.0, 38.37], [42.0, 44.12], [46.0, 50.97], [55.0, 56.42], [64.0, 78.75], [81.0, 82.93], [86.0, 120.56], [121.0, 121.88], [122.0, 129.56], [138.0, 142.11], [145.0, 146.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.01, 0.0, 98.44, 99.98, 96.89, 0.0, 100.0, 98.99, 100.0, 0.0, 99.85, 0.0, 0.0, 0.0, 100.0, 57.17, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.01, 1.33, 2.99, 2.58, 2.21, 1.13, 2.37, 2.12, 4.97, 1.42, 14.75, 1.93, 34.56, 0.88, 7.56, 4.11, 1.64]} \ No newline at end of file diff --git a/annotations_filtered/vETxuL7Ij3Q_filtered.json b/annotations_filtered/vETxuL7Ij3Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3ab55dd08723bd1ba2a740049c825384e2dcf10 --- /dev/null +++ b/annotations_filtered/vETxuL7Ij3Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.88], [8.0, 10.88], [12.0, 15.85], [17.0, 19.62], [24.0, 28.09], [30.0, 37.49], [39.0, 39.06], [40.0, 45.76], [48.0, 49.47], [54.0, 54.8], [56.0, 57.5], [61.0, 76.81], [78.0, 78.9], [82.0, 83.35], [84.0, 91.59], [94.0, 98.34], [102.0, 103.77], [107.0, 112.31], [114.0, 115.69], [122.0, 122.05], [124.0, 124.71], [130.0, 130.35], [132.0, 135.53], [137.0, 137.05], [139.0, 140.44], [144.0, 149.54], [155.0, 161.49], [163.0, 163.66], [165.0, 166.82], [172.0, 172.56], [176.0, 179.95], [181.0, 182.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 100.0, 100.0, 100.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 99.85, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.88, 2.88, 3.85, 2.62, 4.09, 7.49, 0.06, 5.76, 1.47, 0.8, 1.5, 15.81, 0.9, 1.35, 7.59, 4.34, 1.77, 5.31, 1.69, 0.05, 0.71, 0.35, 3.53, 0.05, 1.44, 5.54, 6.49, 0.66, 1.82, 0.56, 3.95, 1.83]} \ No newline at end of file diff --git a/annotations_filtered/vEWPq-4sa3w_filtered.json b/annotations_filtered/vEWPq-4sa3w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52c2607dd87e883b6160836d9e83c6c8d28d8178 --- /dev/null +++ b/annotations_filtered/vEWPq-4sa3w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[70.0, 90.71]], "keep_status": [false], "silence_prob": [28.22], "audiomae_on_audioset": [[["music", 64.65], ["speech", 3.85], ["vehicle", 2.57]]], "duration": [20.71]} \ No newline at end of file diff --git a/annotations_filtered/vE_xjjCJWng_filtered.json b/annotations_filtered/vE_xjjCJWng_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0b19f347ab27b9b56e305e466755cf5ef6b3768 --- /dev/null +++ b/annotations_filtered/vE_xjjCJWng_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.48], [5.0, 6.94], [8.0, 9.09], [11.0, 12.02], [15.0, 14.93], [20.0, 21.29], [23.0, 26.47], [27.0, 29.27], [30.0, 32.19], [33.0, 46.63], [48.0, 50.58], [52.0, 55.71], [57.0, 82.8], [84.0, 128.48]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 98.19, 99.56, 34.34, 30.77, 32.95, 31.96, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 37.76], ["music", 16.32], ["mains hum", 10.35]], [["music", 27.16], ["hum", 18.54], ["mains hum", 16.13]], [["music", 76.56], ["musical instrument", 3.33], ["theremin", 2.62]], [["music", 39.91], ["throbbing", 13.68], ["skidding", 8.53]], null], "duration": [1.48, 1.94, 1.09, 1.02, -0.07, 1.29, 3.47, 2.27, 2.19, 13.63, 2.58, 3.71, 25.8, 44.48]} \ No newline at end of file diff --git a/annotations_filtered/vEd2sU65NQI_filtered.json b/annotations_filtered/vEd2sU65NQI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bbcb6423e5435754088efc5fc79406a930af593b --- /dev/null +++ b/annotations_filtered/vEd2sU65NQI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 29.32], [30.0, 43.73], [52.0, 55.97], [58.0, 58.36], [59.0, 66.36], [68.0, 103.37], [104.0, 138.13]], "keep_status": [true, false, true, false, false, false, false], "silence_prob": [31.69, 33.03, 37.63, 0.0, 32.05, 0.0, 0.0], "audiomae_on_audioset": [[["music", 43.01], ["speech", 17.56], ["didgeridoo", 4.97]], [["music", 61.82], ["speech", 11.04], ["gunshot, gunfire", 5.98]], [["music", 55.05], ["hum", 5.87], ["mains hum", 4.26]], null, [["music", 55.97], ["breaking", 23.99], ["smash, crash", 11.97]], null, null], "duration": [9.32, 13.73, 3.97, 0.36, 7.36, 35.37, 34.13]} \ No newline at end of file diff --git a/annotations_filtered/vEj9ZwIzk44_filtered.json b/annotations_filtered/vEj9ZwIzk44_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60ec9e39c56e00f4f9380afb3fea877c06ce020d --- /dev/null +++ b/annotations_filtered/vEj9ZwIzk44_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.09], [10.0, 11.99], [14.0, 16.5], [17.0, 20.76], [22.0, 34.86], [40.0, 40.24], [40.0, 42.67], [46.0, 46.3], [47.0, 52.62], [55.0, 57.08], [59.0, 62.09], [63.0, 68.03], [69.0, 70.7], [72.0, 73.08], [74.0, 77.45], [78.0, 78.88], [80.0, 88.45], [90.0, 90.61], [93.0, 94.39], [95.0, 97.02], [97.0, 97.06], [97.0, 97.12], [98.0, 98.44], [98.0, 98.58], [99.0, 98.68], [103.0, 115.42], [126.0, 129.41], [131.0, 131.16], [132.0, 134.03], [134.0, 134.82], [137.0, 138.37], [140.0, 140.39], [143.0, 143.36], [144.0, 145.4], [147.0, 153.87], [155.0, 156.09], [158.0, 163.46], [165.0, 166.13], [167.0, 169.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.43, 0.0, 99.96, 99.76, 99.82, 0.0, 99.91, 0.0, 89.72, 99.68, 88.1, 99.76, 0.0, 0.0, 98.01, 0.0, 89.54, 0.0, 0.0, 73.06, 0.0, 0.0, 0.0, 0.0, 0.0, 52.05, 71.57, 0.0, 87.92, 0.0, 0.0, 0.0, 0.0, 0.0, 95.37, 0.0, 87.74, 0.0, 94.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.09, 1.99, 2.5, 3.76, 12.86, 0.24, 2.67, 0.3, 5.62, 2.08, 3.09, 5.03, 1.7, 1.08, 3.45, 0.88, 8.45, 0.61, 1.39, 2.02, 0.06, 0.12, 0.44, 0.58, -0.32, 12.42, 3.41, 0.16, 2.03, 0.82, 1.37, 0.39, 0.36, 1.4, 6.87, 1.09, 5.46, 1.13, 2.72]} \ No newline at end of file diff --git a/annotations_filtered/vEt5MqYD_3s_filtered.json b/annotations_filtered/vEt5MqYD_3s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27f4c98e219354d8941f8dad1101f4af70afe6c1 --- /dev/null +++ b/annotations_filtered/vEt5MqYD_3s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.66], [4.0, 4.09], [5.0, 5.54], [13.0, 14.42], [22.0, 22.52], [25.0, 25.78], [30.0, 33.54], [35.0, 35.55], [40.0, 42.52], [45.0, 45.27], [46.0, 46.33], [47.0, 48.12], [49.0, 49.49], [51.0, 51.19], [52.0, 52.76], [54.0, 54.78], [105.0, 105.8], [118.0, 118.98], [129.0, 130.01]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.15, 0.0, 39.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["fly, housefly", 16.75], ["speech", 13.84], ["hum", 12.79]], null, [["moo", 33.47], ["cattle, bovinae", 21.74], ["speech", 9.52]], null, null, null, null, null, null, null, null, null, null], "duration": [0.66, 0.09, 0.54, 1.42, 0.52, 0.78, 3.54, 0.55, 2.52, 0.27, 0.33, 1.12, 0.49, 0.19, 0.76, 0.78, 0.8, 0.98, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/vEv9tQL3b-A_filtered.json b/annotations_filtered/vEv9tQL3b-A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d7bdbc78fdacaeb3767f9e146e24956a9b51e6e --- /dev/null +++ b/annotations_filtered/vEv9tQL3b-A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.3], [9.0, 9.88], [14.0, 14.18], [16.0, 16.85], [22.0, 22.38], [24.0, 25.07], [27.0, 36.69], [39.0, 49.15], [54.0, 64.13], [64.0, 64.17], [69.0, 70.26], [71.0, 71.78], [72.0, 73.74], [74.0, 73.84], [77.0, 82.9], [83.0, 91.81], [95.0, 96.77], [100.0, 101.06], [101.0, 101.76], [103.0, 104.68], [106.0, 108.06], [114.0, 121.95], [122.0, 122.77], [127.0, 127.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [73.06, 0.0, 0.0, 0.0, 0.0, 0.0, 96.04, 63.42, 53.65, 0.0, 0.0, 0.0, 0.0, 0.0, 68.02, 61.67, 0.0, 0.0, 0.0, 0.0, 70.16, 56.18, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.3, 0.88, 0.18, 0.85, 0.38, 1.07, 9.69, 10.15, 10.13, 0.17, 1.26, 0.78, 1.74, -0.16, 5.9, 8.81, 1.77, 1.06, 0.76, 1.68, 2.06, 7.95, 0.77, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/vF-tPvPAqhQ_filtered.json b/annotations_filtered/vF-tPvPAqhQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f6d32521bfc5ff803b5fedccf9e759fbe5d730d --- /dev/null +++ b/annotations_filtered/vF-tPvPAqhQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.52], [4.0, 5.21], [6.0, 6.54], [8.0, 10.1], [13.0, 31.21], [41.0, 41.23], [44.0, 45.77], [59.0, 62.58], [64.0, 65.67], [67.0, 68.49], [69.0, 69.16], [71.0, 72.55], [74.0, 74.29], [75.0, 79.49], [81.0, 81.3], [84.0, 84.32], [87.0, 88.42], [90.0, 90.88], [93.0, 94.74], [95.0, 94.9], [98.0, 98.47], [104.0, 107.03], [110.0, 111.25], [113.0, 130.82], [133.0, 137.39]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 63.85, 30.73, 0.0, 0.0, 41.58, 0.0, 0.0, 0.0, 0.0, 0.0, 44.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.24, 0.0, 28.82, 36.28], "audiomae_on_audioset": [null, null, null, null, [["speech", 51.87], ["buzz", 13.01], ["music", 10.67]], null, null, [["music", 46.24], ["hands", 10.86], ["synthesizer", 4.4]], null, null, null, null, null, [["mains hum", 28.17], ["hum", 26.97], ["speech", 12.77]], null, null, null, null, null, null, null, [["music", 24.91], ["speech", 24.89], ["hum", 19.9]], null, [["music", 55.9], ["throbbing", 14.95], ["hum", 9.59]], [["music", 62.18], ["synthesizer", 7.8], ["electronic music", 3.53]]], "duration": [1.52, 1.21, 0.54, 2.1, 18.21, 0.23, 1.77, 3.58, 1.67, 1.49, 0.16, 1.55, 0.29, 4.49, 0.3, 0.32, 1.42, 0.88, 1.74, -0.1, 0.47, 3.03, 1.25, 17.82, 4.39]} \ No newline at end of file diff --git a/annotations_filtered/vF3sZj6ge18_filtered.json b/annotations_filtered/vF3sZj6ge18_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35714bf693e9000a4969de25ccb502500e243734 --- /dev/null +++ b/annotations_filtered/vF3sZj6ge18_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.22], [6.0, 10.02], [11.0, 11.7], [12.0, 13.93], [17.0, 17.54], [22.0, 23.65], [30.0, 30.11], [33.0, 35.68], [36.0, 37.15], [39.0, 43.6], [58.0, 58.29], [67.0, 68.17], [80.0, 81.73], [87.0, 92.62], [103.0, 103.94], [130.0, 129.84], [133.0, 132.98], [134.0, 138.45], [147.0, 148.71]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 85.35, 0.0, 0.0, 0.0, 0.0, 0.0, 49.09, 0.0, 32.56, 0.0, 0.0, 0.0, 31.46, 0.0, 0.0, 0.0, 44.9, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 41.31], ["theremin", 7.56], ["synthesizer", 6.25]], null, [["speech", 38.14], ["music", 12.2], ["creak", 4.33]], null, null, null, [["music", 16.45], ["shofar", 9.64], ["mosquito", 8.35]], null, null, null, [["crushing", 34.47], ["noise", 18.26], ["sidetone", 5.35]], null], "duration": [0.22, 4.02, 0.7, 1.93, 0.54, 1.65, 0.11, 2.68, 1.15, 4.6, 0.29, 1.17, 1.73, 5.62, 0.94, -0.16, -0.02, 4.45, 1.71]} \ No newline at end of file diff --git a/annotations_filtered/vFAE-ZIntVI_filtered.json b/annotations_filtered/vFAE-ZIntVI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56438a835d9d8ec3184ac2f04b7da26c9330543b --- /dev/null +++ b/annotations_filtered/vFAE-ZIntVI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 61.48], [65.0, 78.39], [85.0, 103.45], [104.0, 104.53]], "keep_status": [false, true, true, false], "silence_prob": [0.0, 33.09, 45.98, 0.0], "audiomae_on_audioset": [null, [["music", 53.9], ["crack", 7.99], ["thunk", 5.0]], [["speech", 33.7], ["hum", 14.87], ["mains hum", 6.74]], null], "duration": [54.48, 13.39, 18.45, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/vFD6BbYg0-0_filtered.json b/annotations_filtered/vFD6BbYg0-0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbff36cc864af272c8745bf53ad10fa03d0ccf43 --- /dev/null +++ b/annotations_filtered/vFD6BbYg0-0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 13.98], [15.0, 17.24], [19.0, 25.39], [26.0, 32.44], [34.0, 41.15], [43.0, 45.47], [47.0, 90.24], [92.0, 127.38]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [49.04, 64.97, 54.56, 52.86, 64.97, 59.33, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 55.08], ["music", 10.16], ["hum", 5.49]], null, null, null, null, null, null, null], "duration": [8.98, 2.24, 6.39, 6.44, 7.15, 2.47, 43.24, 35.38]} \ No newline at end of file diff --git a/annotations_filtered/vFHYiOfBRng_filtered.json b/annotations_filtered/vFHYiOfBRng_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..994a770880be42d53f61b302d4a71e8f68cdafbd --- /dev/null +++ b/annotations_filtered/vFHYiOfBRng_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[70.0, 70.31], [131.0, 133.54], [136.0, 144.24], [146.0, 146.77], [149.0, 151.16], [154.0, 154.85], [159.0, 159.56], [164.0, 174.6]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 96.66, 0.0, 99.95, 0.0, 0.0, 99.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.31, 2.54, 8.24, 0.77, 2.16, 0.85, 0.56, 10.6]} \ No newline at end of file diff --git a/annotations_filtered/vFPRSImZev4_filtered.json b/annotations_filtered/vFPRSImZev4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..654f6486f0bf61530c7bdcf3d94f5598943b82b6 --- /dev/null +++ b/annotations_filtered/vFPRSImZev4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.62], [7.0, 8.58], [9.0, 22.77], [24.0, 55.02], [56.0, 59.7], [61.0, 63.02], [63.0, 63.76], [64.0, 75.84], [79.0, 110.13], [111.0, 111.18], [113.0, 114.78], [116.0, 119.1], [120.0, 122.37], [125.0, 128.73], [129.0, 132.88], [136.0, 137.61], [140.0, 143.51], [144.0, 149.15], [150.0, 154.31], [156.0, 156.46], [157.0, 157.17], [157.0, 162.7], [164.0, 165.47], [166.0, 169.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [67.38, 0.0, 58.55, 0.0, 99.99, 82.07, 0.0, 99.36, 0.0, 0.0, 0.0, 99.62, 87.37, 99.99, 97.92, 0.0, 99.95, 99.1, 99.84, 0.0, 0.0, 44.09, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 81.34], ["inside, small room", 2.86], ["thunk", 2.34]], null, null], "duration": [2.62, 1.58, 13.77, 31.02, 3.7, 2.02, 0.76, 11.84, 31.13, 0.18, 1.78, 3.1, 2.37, 3.73, 3.88, 1.61, 3.51, 5.15, 4.31, 0.46, 0.17, 5.7, 1.47, 3.67]} \ No newline at end of file diff --git a/annotations_filtered/vFSAQ1Nj7fg_filtered.json b/annotations_filtered/vFSAQ1Nj7fg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fdb70bc0d44050edd5c457197d02e67c01db06d3 --- /dev/null +++ b/annotations_filtered/vFSAQ1Nj7fg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.33], [12.0, 12.26], [18.0, 18.13], [21.0, 21.81], [23.0, 29.34], [36.0, 36.22], [42.0, 42.52], [44.0, 45.76], [52.0, 57.35], [75.0, 78.58], [80.0, 83.83], [85.0, 90.61], [91.0, 91.61], [95.0, 95.2], [100.0, 100.62], [105.0, 119.1], [124.0, 125.07], [127.0, 127.79], [131.0, 131.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.7, 0.0, 0.0, 0.0, 31.63, 52.86, 41.89, 30.12, 0.0, 0.0, 0.0, 31.02, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 45.01], ["fart", 20.7], ["explosion", 5.08]], null, null, null, [["speech", 64.85], ["music", 8.13], ["fireworks", 6.54]], null, [["music", 64.0], ["hum", 11.1], ["throbbing", 6.33]], [["speech", 16.94], ["music", 10.67], ["vehicle", 6.23]], null, null, null, [["speech", 67.19], ["music", 19.32], ["fart", 2.27]], null, null, null], "duration": [0.33, 0.26, 0.13, 0.81, 6.34, 0.22, 0.52, 1.76, 5.35, 3.58, 3.83, 5.61, 0.61, 0.2, 0.62, 14.1, 1.07, 0.79, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/vFqitPr_Gpg_filtered.json b/annotations_filtered/vFqitPr_Gpg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/vFqitPr_Gpg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/vG6bW7_-CRQ_filtered.json b/annotations_filtered/vG6bW7_-CRQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7de5ba89262be64da0b9cd28a8ca2ab34ef86b09 --- /dev/null +++ b/annotations_filtered/vG6bW7_-CRQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.96], [11.0, 11.2], [12.0, 12.5], [14.0, 14.55], [15.0, 16.28], [17.0, 18.94], [20.0, 23.35], [26.0, 27.28], [36.0, 37.05], [38.0, 39.19], [41.0, 41.23], [42.0, 42.21], [44.0, 44.42], [46.0, 46.41], [48.0, 49.92], [55.0, 56.64], [60.0, 60.84], [63.0, 64.27], [71.0, 77.03], [79.0, 80.0], [81.0, 81.82], [83.0, 84.33], [86.0, 93.41], [95.0, 95.27], [96.0, 114.37], [115.0, 133.0], [133.0, 135.21], [135.0, 148.49], [151.0, 176.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, true, true], "silence_prob": [87.37, 0.0, 0.0, 0.0, 0.0, 0.0, 54.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.07, 0.0, 0.0, 0.0, 92.15, 0.0, 79.94, 49.09, 67.38, 43.79, 34.03], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["grunt", 33.45], ["echo", 7.22], ["animal", 7.04]], null, null, null, null, null, null, [["synthesizer", 14.66], ["music", 10.74], ["noise", 10.2]], null, [["throbbing", 32.17], ["hum", 12.69], ["heart sounds, heartbeat", 12.56]], [["gunshot, gunfire", 26.37], ["cap gun", 6.17], ["chirp tone", 5.23]]], "duration": [3.96, 0.2, 0.5, 0.55, 1.28, 1.94, 3.35, 1.28, 1.05, 1.19, 0.23, 0.21, 0.42, 0.41, 1.92, 1.64, 0.84, 1.27, 6.03, 1.0, 0.82, 1.33, 7.41, 0.27, 18.37, 18.0, 2.21, 13.49, 25.35]} \ No newline at end of file diff --git a/annotations_filtered/vG833_jH7eY_filtered.json b/annotations_filtered/vG833_jH7eY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9cad2ed0ad6e49b110da147f7de7f0415708f4f --- /dev/null +++ b/annotations_filtered/vG833_jH7eY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 8.29], [8.0, 10.44], [11.0, 11.94], [12.0, 13.12], [14.0, 14.07], [14.0, 19.85], [20.0, 23.25], [23.0, 29.51], [31.0, 32.66], [34.0, 34.92], [35.0, 40.66], [44.0, 47.36], [48.0, 49.86], [53.0, 54.41], [55.0, 57.54], [62.0, 64.76], [67.0, 68.89], [70.0, 75.12], [78.0, 81.5], [82.0, 81.53], [87.0, 87.96], [94.0, 98.64], [99.0, 98.68], [99.0, 98.71], [100.0, 99.59], [100.0, 99.62], [100.0, 99.72], [100.0, 99.77], [100.0, 99.93], [100.0, 100.06], [101.0, 105.93], [107.0, 108.3], [109.0, 111.16], [113.0, 116.77], [119.0, 120.11], [121.0, 123.42]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.12, 32.3, 0.0, 0.0, 0.0, 82.43, 68.15, 37.14, 0.0, 0.0, 35.79, 36.57, 0.0, 0.0, 54.43, 58.89, 0.0, 37.82, 30.62, 0.0, 0.0, 52.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.21, 0.0, 50.97, 50.56, 0.0, 96.04], "audiomae_on_audioset": [[["speech", 77.84], ["male speech, man speaking", 3.61], ["hum", 2.52]], [["speech", 53.21], ["hum", 9.92], ["cough", 4.73]], null, null, null, null, null, [["speech", 86.46], ["hum", 2.31], ["radio", 1.43]], null, null, [["electric shaver, electric razor", 56.38], ["music", 14.42], ["speech", 9.08]], [["speech", 56.36], ["sidetone", 22.13], ["radio", 3.7]], null, null, null, null, null, [["speech", 46.2], ["music", 12.43], ["mains hum", 9.82]], [["speech", 37.07], ["music", 13.93], ["radio", 4.97]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.29, 2.44, 0.94, 1.12, 0.07, 5.85, 3.25, 6.51, 1.66, 0.92, 5.66, 3.36, 1.86, 1.41, 2.54, 2.76, 1.89, 5.12, 3.5, -0.47, 0.96, 4.64, -0.32, -0.29, -0.41, -0.38, -0.28, -0.23, -0.07, 0.06, 4.93, 1.3, 2.16, 3.77, 1.11, 2.42]} \ No newline at end of file diff --git a/annotations_filtered/vG_FLK4K_T8_filtered.json b/annotations_filtered/vG_FLK4K_T8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56c5850242e829e5c3946ccaa15fb496d0e64260 --- /dev/null +++ b/annotations_filtered/vG_FLK4K_T8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.52], [5.0, 7.74], [8.0, 9.37], [10.0, 10.71], [15.0, 16.53], [25.0, 25.73], [28.0, 28.78], [34.0, 34.89], [41.0, 54.85], [57.0, 59.53], [61.0, 62.14], [63.0, 64.17], [65.0, 67.29], [68.0, 68.5], [69.0, 71.54], [75.0, 75.93], [77.0, 78.75], [88.0, 88.7], [89.0, 93.39], [97.0, 98.0], [98.0, 100.62], [102.0, 103.67], [107.0, 107.64], [109.0, 110.57], [111.0, 113.07], [115.0, 118.69], [119.0, 119.87], [121.0, 120.78], [122.0, 122.94], [124.0, 124.65], [126.0, 128.34], [128.0, 129.51], [133.0, 134.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 78.38, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 98.66, 0.0, 98.86, 0.0, 0.0, 0.0, 100.0, 89.72, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.52, 2.74, 1.37, 0.71, 1.53, 0.73, 0.78, 0.89, 13.85, 2.53, 1.14, 1.17, 2.29, 0.5, 2.54, 0.93, 1.75, 0.7, 4.39, 1.0, 2.62, 1.67, 0.64, 1.57, 2.07, 3.69, 0.87, -0.22, 0.94, 0.65, 2.34, 1.51, 1.25]} \ No newline at end of file diff --git a/annotations_filtered/vGgdg2q1eig_filtered.json b/annotations_filtered/vGgdg2q1eig_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..865d6ce1cc4ed19f19e095a81acb6fe76429ab2c --- /dev/null +++ b/annotations_filtered/vGgdg2q1eig_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.85], [2.0, 4.43], [10.0, 11.84], [19.0, 19.28], [22.0, 24.21], [36.0, 39.19], [42.0, 43.19], [46.0, 48.15], [49.0, 51.39], [53.0, 54.4], [55.0, 56.08], [57.0, 58.19], [60.0, 61.05], [69.0, 69.82], [71.0, 75.64], [76.0, 77.52], [81.0, 81.9], [84.0, 84.25], [91.0, 95.67], [112.0, 112.94], [124.0, 125.15], [128.0, 130.27]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 54.83, 0.0, 0.0, 50.46, 64.52, 0.0, 39.99, 42.53, 0.0, 0.0, 0.0, 0.0, 0.0, 52.86, 0.0, 0.0, 0.0, 38.62, 0.0, 0.0, 87.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 39.59], ["radio", 12.24], ["bird", 9.6]], [["bird", 17.84], ["animal", 10.88], ["fly, housefly", 9.79]], null, null, null, null, null, null, null, null, null, [["insect", 24.94], ["speech", 13.71], ["cricket", 9.12]], null, null, null], "duration": [0.85, 2.43, 1.84, 0.28, 2.21, 3.19, 1.19, 2.15, 2.39, 1.4, 1.08, 1.19, 1.05, 0.82, 4.64, 1.52, 0.9, 0.25, 4.67, 0.94, 1.15, 2.27]} \ No newline at end of file diff --git a/annotations_filtered/vH8nss4M93g_filtered.json b/annotations_filtered/vH8nss4M93g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e773f3c71ba355254b16f1666da9a96ef471489 --- /dev/null +++ b/annotations_filtered/vH8nss4M93g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.25], [4.0, 5.63], [7.0, 7.1], [10.0, 14.45], [17.0, 18.25], [19.0, 19.68], [22.0, 22.67], [25.0, 26.2], [29.0, 31.67], [32.0, 35.56], [37.0, 37.62], [38.0, 46.74], [54.0, 54.73], [58.0, 60.99], [74.0, 74.41], [81.0, 81.94]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [34.15, 0.0, 0.0, 32.96, 0.0, 0.0, 0.0, 0.0, 34.05, 33.74, 0.0, 32.53, 0.0, 31.84, 0.0, 0.0], "audiomae_on_audioset": [[["music", 14.54], ["speech", 13.38], ["mains hum", 13.17]], null, null, [["mains hum", 18.77], ["speech", 11.43], ["vehicle", 11.35]], null, null, null, null, [["hum", 44.92], ["mains hum", 27.16], ["music", 10.96]], [["hum", 36.08], ["mains hum", 33.87], ["speech", 9.39]], null, [["mains hum", 32.14], ["hum", 21.14], ["speech", 10.53]], null, [["music", 29.86], ["hum", 14.88], ["mains hum", 13.59]], null, null], "duration": [2.25, 1.63, 0.1, 4.45, 1.25, 0.68, 0.67, 1.2, 2.67, 3.56, 0.62, 8.74, 0.73, 2.99, 0.41, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/vHBKdIq9RGs_filtered.json b/annotations_filtered/vHBKdIq9RGs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d50915d345d667e74f1fdc45f1653f325fd31c43 --- /dev/null +++ b/annotations_filtered/vHBKdIq9RGs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.63], [22.0, 22.54], [30.0, 30.57], [31.0, 31.56], [44.0, 47.71], [75.0, 76.59], [77.0, 77.33], [91.0, 92.5], [94.0, 95.35], [99.0, 100.75], [118.0, 119.7], [122.0, 122.64], [129.0, 128.83], [132.0, 133.79], [152.0, 156.81], [157.0, 157.55], [172.0, 171.9]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [35.08, 0.0, 0.0, 0.0, 32.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.67, 0.0, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 18.27], ["grunt", 15.96], ["moo", 13.1]], null, null, null, [["speech", 40.79], ["music", 15.59], ["boing", 11.68]], null, null, null, null, null, null, null, null, null, [["music", 33.34], ["throbbing", 13.47], ["hum", 12.25]], null, null], "duration": [3.63, 0.54, 0.57, 0.56, 3.71, 1.59, 0.33, 1.5, 1.35, 1.75, 1.7, 0.64, -0.17, 1.79, 4.81, 0.55, -0.1]} \ No newline at end of file diff --git a/annotations_filtered/vHbBhI0xLjA_filtered.json b/annotations_filtered/vHbBhI0xLjA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26561422816206e3b186429bbdb906fb34b6df80 --- /dev/null +++ b/annotations_filtered/vHbBhI0xLjA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.74], [12.0, 16.16], [17.0, 17.19], [26.0, 28.38]], "keep_status": [false, true, false, true], "silence_prob": [0.0, 32.5, 0.0, 33.78], "audiomae_on_audioset": [null, [["music", 50.09], ["synthesizer", 7.79], ["musical instrument", 6.02]], null, [["music", 55.56], ["synthesizer", 5.7], ["musical instrument", 4.23]]], "duration": [0.74, 4.16, 0.19, 2.38]} \ No newline at end of file diff --git a/annotations_filtered/vHmyJqXxmL8_filtered.json b/annotations_filtered/vHmyJqXxmL8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04f229124ad1344e7aa7e9c67fa5dfa9675278c4 --- /dev/null +++ b/annotations_filtered/vHmyJqXxmL8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.68], [16.0, 18.49], [25.0, 25.76], [29.0, 29.49], [37.0, 45.64], [47.0, 52.79], [53.0, 55.93], [56.0, 56.05], [56.0, 63.44], [66.0, 68.13], [69.0, 69.2], [70.0, 74.78], [75.0, 84.11], [92.0, 99.35], [102.0, 112.45], [115.0, 118.12], [119.0, 119.45], [124.0, 124.73]], "keep_status": [false, true, false, false, false, false, true, false, true, true, false, false, false, true, true, true, false, false], "silence_prob": [0.0, 38.04, 0.0, 0.0, 36.65, 33.93, 36.39, 0.0, 33.41, 40.61, 0.0, 38.14, 33.59, 35.65, 30.82, 32.56, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 43.41], ["synthesizer", 8.81], ["bouncing", 7.97]], null, null, [["music", 50.42], ["speech", 18.12], ["didgeridoo", 8.67]], [["music", 77.95], ["speech", 4.98], ["musical instrument", 2.19]], [["music", 21.54], ["whack, thwack", 14.35], ["thunk", 14.0]], null, [["music", 26.49], ["livestock, farm animals, working animals", 9.65], ["cattle, bovinae", 5.92]], [["music", 36.46], ["mosquito", 4.69], ["roar", 2.85]], null, [["music", 70.77], ["quack", 9.99], ["fart", 6.68]], [["music", 47.16], ["speech", 36.13], ["theremin", 5.92]], [["music", 40.42], ["speech", 11.68], ["hum", 5.49]], [["music", 42.86], ["buzz", 12.56], ["boing", 9.03]], [["music", 37.76], ["speech", 7.47], ["buzz", 3.25]], null, null], "duration": [0.68, 2.49, 0.76, 0.49, 8.64, 5.79, 2.93, 0.05, 7.44, 2.13, 0.2, 4.78, 9.11, 7.35, 10.45, 3.12, 0.45, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/vITX2N0hpYE_filtered.json b/annotations_filtered/vITX2N0hpYE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3cf8da6eaeaf6e7c18556a873778c0f22ce2aac3 --- /dev/null +++ b/annotations_filtered/vITX2N0hpYE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 23.87], [31.0, 32.97], [34.0, 35.45], [42.0, 42.38], [44.0, 44.71], [47.0, 47.98], [49.0, 50.73], [51.0, 51.71], [54.0, 54.73], [55.0, 55.68], [57.0, 73.01], [75.0, 75.78], [77.0, 78.33], [79.0, 80.23], [81.0, 86.61], [89.0, 91.71], [94.0, 143.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [45.49, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.65, 0.0, 0.0, 0.0, 40.95, 61.87, 0.0], "audiomae_on_audioset": [[["sidetone", 80.06], ["radio", 4.66], ["hum", 2.81]], null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 22.39], ["moo", 17.54], ["livestock, farm animals, working animals", 12.72]], null, null, null, [["speech", 56.34], ["sidetone", 22.23], ["busy signal", 7.03]], null, null], "duration": [5.87, 1.97, 1.45, 0.38, 0.71, 0.98, 1.73, 0.71, 0.73, 0.68, 16.01, 0.78, 1.33, 1.23, 5.61, 2.71, 49.97]} \ No newline at end of file diff --git a/annotations_filtered/vI_kMlvUWDw_filtered.json b/annotations_filtered/vI_kMlvUWDw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edcebd127eed3ec4ce1ac3d04a7abab69a61ae59 --- /dev/null +++ b/annotations_filtered/vI_kMlvUWDw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.94], [4.0, 5.29], [11.0, 11.62], [23.0, 23.82], [33.0, 35.28], [39.0, 38.79], [40.0, 40.53], [56.0, 56.42], [60.0, 61.84], [64.0, 67.95], [75.0, 75.03], [77.0, 77.36], [86.0, 86.83], [87.0, 99.06], [99.0, 99.66], [102.0, 102.59], [106.0, 106.57], [108.0, 112.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 49.54, 0.0, 0.0, 0.0, 0.0, 32.43, 0.0, 0.0, 0.0, 33.71, 0.0, 0.0, 0.0, 49.54], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 81.68], ["speech", 8.84], ["hum", 1.74]], null, null, null, null, [["speech", 50.68], ["music", 21.47], ["hum", 4.94]], null, null, null, [["speech", 33.73], ["music", 26.91], ["throbbing", 11.59]], null, null, null, [["music", 42.74], ["hum", 11.37], ["didgeridoo", 11.19]]], "duration": [0.94, 1.29, 0.62, 0.82, 2.28, -0.21, 0.53, 0.42, 1.84, 3.95, 0.03, 0.36, 0.83, 12.06, 0.66, 0.59, 0.57, 4.51]} \ No newline at end of file diff --git a/annotations_filtered/vIaVITC62Cs_filtered.json b/annotations_filtered/vIaVITC62Cs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fae7cd2622aea19cb17cd7fd074f2bd85584ddc6 --- /dev/null +++ b/annotations_filtered/vIaVITC62Cs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 68.82], [73.0, 74.55], [76.0, 77.77], [87.0, 87.86], [89.0, 89.16], [91.0, 95.23]], "keep_status": [false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 40.7], "audiomae_on_audioset": [null, null, null, null, null, [["horse", 23.18], ["livestock, farm animals, working animals", 11.44], ["cattle, bovinae", 10.85]]], "duration": [37.82, 1.55, 1.77, 0.86, 0.16, 4.23]} \ No newline at end of file diff --git a/annotations_filtered/vId4AoKDg2s_filtered.json b/annotations_filtered/vId4AoKDg2s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe0181fde87643958033d73521735cb6058c24e1 --- /dev/null +++ b/annotations_filtered/vId4AoKDg2s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.75], [6.0, 8.16], [10.0, 10.93], [16.0, 36.24], [50.0, 51.38], [60.0, 69.65], [71.0, 72.79], [74.0, 76.52], [78.0, 78.41], [80.0, 81.06], [83.0, 83.61], [87.0, 87.52], [88.0, 88.89], [92.0, 92.99], [95.0, 95.2], [97.0, 96.87], [99.0, 99.27], [101.0, 101.09], [103.0, 103.77], [107.0, 108.31], [111.0, 111.0], [112.0, 112.26], [112.0, 114.4], [117.0, 116.87]], "keep_status": [false, true, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.06, 0.0, 33.48, 0.0, 33.6, 0.0, 42.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.08, 0.0], "audiomae_on_audioset": [null, [["music", 51.87], ["didgeridoo", 9.14], ["musical instrument", 4.94]], null, [["music", 44.57], ["speech", 11.38], ["bleat", 5.29]], null, [["music", 67.98], ["crying, sobbing", 1.96], ["musical instrument", 1.95]], null, [["music", 37.77], ["speech", 7.1], ["electronic music", 5.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.75, 2.16, 0.93, 20.24, 1.38, 9.65, 1.79, 2.52, 0.41, 1.06, 0.61, 0.52, 0.89, 0.99, 0.2, -0.13, 0.27, 0.09, 0.77, 1.31, 0.0, 0.26, 2.4, -0.13]} \ No newline at end of file diff --git a/annotations_filtered/vIrRt0vaySY_filtered.json b/annotations_filtered/vIrRt0vaySY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c60d2262867577c2be76b6fc3c1415d21d5f9853 --- /dev/null +++ b/annotations_filtered/vIrRt0vaySY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 29.24], [31.0, 32.58], [40.0, 43.11], [44.0, 44.61], [46.0, 46.35], [47.0, 50.8], [51.0, 52.0], [56.0, 55.85], [58.0, 74.88], [82.0, 84.72], [112.0, 113.0], [128.0, 129.3], [132.0, 139.6], [140.0, 144.59], [145.0, 148.1], [149.0, 152.41]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [44.29, 0.0, 42.79, 0.0, 0.0, 38.84, 0.0, 0.0, 57.81, 44.32, 0.0, 0.0, 84.43, 98.51, 92.15, 63.85], "audiomae_on_audioset": [[["speech", 20.96], ["wheeze", 13.37], ["animal", 6.81]], null, [["whip", 10.72], ["fart", 7.25], ["clang", 5.33]], null, null, [["speech", 70.1], ["animal", 2.94], ["buzz", 2.13]], null, null, null, [["cattle, bovinae", 52.65], ["moo", 25.57], ["livestock, farm animals, working animals", 15.57]], null, null, null, null, null, null], "duration": [7.24, 1.58, 3.11, 0.61, 0.35, 3.8, 1.0, -0.15, 16.88, 2.72, 1.0, 1.3, 7.6, 4.59, 3.1, 3.41]} \ No newline at end of file diff --git a/annotations_filtered/vJ6XJtlqqZo_filtered.json b/annotations_filtered/vJ6XJtlqqZo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73dcd87ebf3c450139c73f034c4adcf9f4c78676 --- /dev/null +++ b/annotations_filtered/vJ6XJtlqqZo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.76], [7.0, 8.02], [10.0, 11.8], [12.0, 14.07], [14.0, 15.5], [19.0, 19.08], [19.0, 21.61], [22.0, 25.59], [30.0, 29.83], [32.0, 32.02], [33.0, 34.08], [36.0, 36.96], [40.0, 41.99], [43.0, 43.01], [45.0, 47.8], [49.0, 49.62], [50.0, 51.97], [56.0, 57.05], [58.0, 59.98], [61.0, 62.72], [67.0, 68.91], [70.0, 70.46], [73.0, 75.2], [77.0, 81.04], [83.0, 85.41], [86.0, 87.25], [88.0, 89.24], [92.0, 93.46], [96.0, 96.52], [97.0, 97.04], [97.0, 98.37], [105.0, 107.1], [108.0, 110.0], [112.0, 113.53], [115.0, 116.95], [119.0, 125.32], [132.0, 143.19], [145.0, 145.32], [146.0, 147.46], [149.0, 153.39], [154.0, 157.91], [167.0, 167.86], [169.0, 173.91], [174.0, 177.35], [178.0, 178.5], [179.0, 178.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 60.79, 0.0, 0.0, 95.78, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.7, 100.0, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 93.13, 0.0, 0.0, 99.68, 99.88, 0.0, 0.0, 100.0, 99.16, 0.0, 37.74, 40.14, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 45.08], ["speech", 24.21], ["sneeze", 3.47]], [["music", 53.24], ["speech", 25.97], ["musical instrument", 6.39]], null, null], "duration": [0.76, 1.02, 1.8, 2.07, 1.5, 0.08, 2.61, 3.59, -0.17, 0.02, 1.08, 0.96, 1.99, 0.01, 2.8, 0.62, 1.97, 1.05, 1.98, 1.72, 1.91, 0.46, 2.2, 4.04, 2.41, 1.25, 1.24, 1.46, 0.52, 0.04, 1.37, 2.1, 2.0, 1.53, 1.95, 6.32, 11.19, 0.32, 1.46, 4.39, 3.91, 0.86, 4.91, 3.35, 0.5, -0.23]} \ No newline at end of file diff --git a/annotations_filtered/vJCHzRIOOL0_filtered.json b/annotations_filtered/vJCHzRIOOL0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2c3bf684d9da79b9369354e9ae3faaea266199f --- /dev/null +++ b/annotations_filtered/vJCHzRIOOL0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.8], [6.0, 5.97], [11.0, 11.57], [20.0, 20.02], [21.0, 21.05], [25.0, 25.96], [27.0, 28.09], [31.0, 34.45], [35.0, 35.99], [39.0, 39.06], [42.0, 42.89], [52.0, 52.68], [54.0, 54.41], [56.0, 56.2], [58.0, 57.99], [60.0, 59.83], [60.0, 60.79], [63.0, 63.44], [65.0, 67.14], [68.0, 68.76], [70.0, 70.82], [74.0, 75.37], [76.0, 76.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.2, -0.03, 0.57, 0.02, 0.05, 0.96, 1.09, 3.45, 0.99, 0.06, 0.89, 0.68, 0.41, 0.2, -0.01, -0.17, 0.79, 0.44, 2.14, 0.76, 0.82, 1.37, 0.1]} \ No newline at end of file diff --git a/annotations_filtered/vJFN-ZPqCiQ_filtered.json b/annotations_filtered/vJFN-ZPqCiQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1721a7f5c45e37e4585ba3f30a78c9e52226a35 --- /dev/null +++ b/annotations_filtered/vJFN-ZPqCiQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.11], [9.0, 10.2], [11.0, 12.29], [13.0, 13.78], [14.0, 19.57], [21.0, 21.25], [23.0, 23.82], [25.0, 25.24], [34.0, 35.82], [36.0, 36.88], [45.0, 53.4], [54.0, 59.59], [68.0, 69.7], [73.0, 79.69], [80.0, 82.68], [84.0, 84.89], [86.0, 87.22], [94.0, 95.23], [96.0, 97.17], [102.0, 103.69], [106.0, 106.29], [108.0, 110.34], [110.0, 110.94], [121.0, 122.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 97.73, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.16, 0.0, 100.0, 93.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.11, 1.2, 1.29, 0.78, 5.57, 0.25, 0.82, 0.24, 1.82, 0.88, 8.4, 5.59, 1.7, 6.69, 2.68, 0.89, 1.22, 1.23, 1.17, 1.69, 0.29, 2.34, 0.94, 1.22]} \ No newline at end of file diff --git a/annotations_filtered/vJZe9sHz10M_filtered.json b/annotations_filtered/vJZe9sHz10M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c49ff1533fb3f3878874c7964ec84165a06da34e --- /dev/null +++ b/annotations_filtered/vJZe9sHz10M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.61], [23.0, 23.48], [70.0, 70.78], [81.0, 84.38]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.23], "audiomae_on_audioset": [null, null, null, [["speech", 54.73], ["horse", 16.01], ["clip-clop", 11.56]]], "duration": [0.61, 0.48, 0.78, 3.38]} \ No newline at end of file diff --git a/annotations_filtered/vJhO79OGi20_filtered.json b/annotations_filtered/vJhO79OGi20_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65f38b105a0db8cdb540b31a6803028a366c8d11 --- /dev/null +++ b/annotations_filtered/vJhO79OGi20_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.33], [16.0, 18.05], [19.0, 22.99], [27.0, 32.41], [34.0, 33.99], [34.0, 34.8], [37.0, 37.99], [42.0, 42.45], [43.0, 44.69], [45.0, 52.1], [54.0, 54.9], [56.0, 57.97], [59.0, 60.44], [61.0, 67.53], [68.0, 69.21], [76.0, 78.12], [79.0, 83.49], [97.0, 97.39], [105.0, 109.68], [115.0, 116.07], [117.0, 121.22], [128.0, 128.04], [128.0, 128.88], [130.0, 131.57], [132.0, 132.97], [138.0, 140.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, true, false, false, false, false, true], "silence_prob": [82.97, 82.25, 80.11, 66.51, 0.0, 0.0, 0.0, 0.0, 0.0, 52.92, 0.0, 0.0, 0.0, 33.2, 0.0, 35.93, 39.85, 0.0, 29.8, 0.0, 35.25, 0.0, 0.0, 0.0, 0.0, 29.23], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 15.17], ["hum", 12.06], ["music", 9.85]], null, [["speech", 76.24], ["music", 8.01], ["gong", 3.42]], [["speech", 26.15], ["music", 11.49], ["hum", 9.41]], null, [["speech", 46.18], ["breaking", 35.59], ["music", 4.58]], null, [["music", 34.29], ["speech", 14.48], ["theremin", 12.62]], null, null, null, null, [["hum", 28.4], ["music", 17.73], ["mains hum", 16.28]]], "duration": [2.33, 2.05, 3.99, 5.41, -0.01, 0.8, 0.99, 0.45, 1.69, 7.1, 0.9, 1.97, 1.44, 6.53, 1.21, 2.12, 4.49, 0.39, 4.68, 1.07, 4.22, 0.04, 0.88, 1.57, 0.97, 2.39]} \ No newline at end of file diff --git a/annotations_filtered/vJi3kGaAQfo_filtered.json b/annotations_filtered/vJi3kGaAQfo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28ecff894e8a9a7248555cb600aa78126409221a --- /dev/null +++ b/annotations_filtered/vJi3kGaAQfo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.03], [13.0, 14.0], [15.0, 17.04], [18.0, 19.52], [21.0, 22.69], [24.0, 24.93], [26.0, 32.46], [33.0, 34.01], [36.0, 36.34], [38.0, 45.6], [46.0, 46.99], [47.0, 47.02], [47.0, 84.01], [87.0, 88.3], [90.0, 97.61], [99.0, 106.52], [109.0, 120.51], [126.0, 127.77], [132.0, 136.53], [137.0, 153.57], [158.0, 160.03], [161.0, 161.81], [162.0, 169.5], [173.0, 184.08]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false, false, true, true, true, false, true, true, false, false, true, false], "silence_prob": [0.0, 0.0, 51.99, 0.0, 0.0, 0.0, 30.42, 0.0, 0.0, 30.36, 0.0, 0.0, 0.0, 0.0, 36.99, 30.81, 33.61, 0.0, 32.32, 31.96, 34.91, 0.0, 30.6, 48.65], "audiomae_on_audioset": [null, null, null, null, null, null, [["whack, thwack", 15.41], ["speech", 14.68], ["music", 10.43]], null, null, [["throbbing", 30.49], ["speech", 18.47], ["hum", 16.31]], null, null, null, null, [["throbbing", 42.08], ["music", 13.96], ["quack", 8.22]], [["animal", 15.8], ["dog", 14.1], ["music", 13.64]], [["beatboxing", 24.53], ["hum", 16.33], ["mains hum", 11.87]], null, [["livestock, farm animals, working animals", 15.74], ["moo", 14.28], ["speech", 11.37]], [["speech", 30.11], ["hum", 30.09], ["mains hum", 8.68]], [["music", 56.5], ["throbbing", 17.04], ["hum", 11.66]], null, [["music", 43.18], ["whack, thwack", 14.16], ["breaking", 6.0]], [["music", 47.38], ["hum", 15.2], ["sonar", 8.77]]], "duration": [1.03, 1.0, 2.04, 1.52, 1.69, 0.93, 6.46, 1.01, 0.34, 7.6, 0.99, 0.02, 37.01, 1.3, 7.61, 7.52, 11.51, 1.77, 4.53, 16.57, 2.03, 0.81, 7.5, 11.08]} \ No newline at end of file diff --git a/annotations_filtered/vJzOCmyQY24_filtered.json b/annotations_filtered/vJzOCmyQY24_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..047ad2e9fda14dcba65daf4935000ccb2ba66370 --- /dev/null +++ b/annotations_filtered/vJzOCmyQY24_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[115.0, 118.67], [119.0, 137.69]], "keep_status": [true, true], "silence_prob": [40.73, 46.57], "audiomae_on_audioset": [[["speech", 52.45], ["groan", 3.78], ["music", 3.66]], [["music", 38.73], ["speech", 8.62], ["musical instrument", 3.2]]], "duration": [3.67, 18.69]} \ No newline at end of file diff --git a/annotations_filtered/vK7tEsNZtFs_filtered.json b/annotations_filtered/vK7tEsNZtFs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5187215ce91840e72ee3ecef5a15e0600d60a81a --- /dev/null +++ b/annotations_filtered/vK7tEsNZtFs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.47], [17.0, 17.78], [20.0, 20.9], [22.0, 23.92], [26.0, 26.54], [28.0, 29.42], [33.0, 33.35], [35.0, 37.99], [64.0, 65.5], [74.0, 75.52]], "keep_status": [true, false, false, false, false, false, false, true, false, false], "silence_prob": [32.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.02, 0.0, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 30.69], ["speech", 22.91], ["moo", 13.1]], null, null, null, null, null, null, [["crowd", 24.51], ["speech", 18.6], ["outside, urban or manmade", 15.33]], null, null], "duration": [5.47, 0.78, 0.9, 1.92, 0.54, 1.42, 0.35, 2.99, 1.5, 1.52]} \ No newline at end of file diff --git a/annotations_filtered/vKEWdfB8yo8_filtered.json b/annotations_filtered/vKEWdfB8yo8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ae6eddb91ad57690461cae3e6f90780bd3830a9 --- /dev/null +++ b/annotations_filtered/vKEWdfB8yo8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.88], [9.0, 9.8], [11.0, 11.35], [12.0, 13.53], [19.0, 19.58], [23.0, 23.57], [26.0, 26.28], [30.0, 29.94], [31.0, 31.63], [36.0, 39.09], [43.0, 43.87], [45.0, 45.96], [48.0, 48.47], [52.0, 52.81], [61.0, 61.87], [67.0, 67.14], [72.0, 72.72], [76.0, 77.16], [82.0, 84.16], [87.0, 88.11], [89.0, 89.63], [90.0, 94.36], [96.0, 96.75], [101.0, 101.6], [104.0, 104.23], [105.0, 109.32], [110.0, 113.53], [116.0, 116.06], [117.0, 118.08], [118.0, 118.66], [119.0, 119.94], [122.0, 123.18], [124.0, 124.75], [127.0, 128.41], [130.0, 138.69], [140.0, 142.64], [145.0, 145.62], [146.0, 147.01], [149.0, 148.91], [153.0, 153.82], [155.0, 155.14], [159.0, 159.61], [161.0, 160.98], [162.0, 161.97], [165.0, 166.09], [168.0, 167.86], [168.0, 175.29], [176.0, 176.45], [184.0, 187.08], [188.0, 192.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 79.07, 0.0, 0.0, 0.0, 45.46, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 98.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 98.66, 89.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["explosion", 15.92], ["burst, pop", 12.03], ["synthesizer", 4.5]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.88, 0.8, 0.35, 1.53, 0.58, 0.57, 0.28, -0.06, 0.63, 3.09, 0.87, 0.96, 0.47, 0.81, 0.87, 0.14, 0.72, 1.16, 2.16, 1.11, 0.63, 4.36, 0.75, 0.6, 0.23, 4.32, 3.53, 0.06, 1.08, 0.66, 0.94, 1.18, 0.75, 1.41, 8.69, 2.64, 0.62, 1.01, -0.09, 0.82, 0.14, 0.61, -0.02, -0.03, 1.09, -0.14, 7.29, 0.45, 3.08, 4.28]} \ No newline at end of file diff --git a/annotations_filtered/vKEqdQhX4lo_filtered.json b/annotations_filtered/vKEqdQhX4lo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16545bbc10662377978a40e63a32103e5043062f --- /dev/null +++ b/annotations_filtered/vKEqdQhX4lo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.67], [6.0, 6.71], [8.0, 9.37], [11.0, 13.36], [17.0, 19.09], [25.0, 25.19], [33.0, 34.32], [36.0, 36.46], [38.0, 53.5], [54.0, 55.8], [57.0, 58.21], [59.0, 59.19], [60.0, 61.05], [63.0, 65.42], [68.0, 68.55], [72.0, 74.34], [75.0, 75.52], [76.0, 77.14], [80.0, 82.38], [86.0, 86.48], [88.0, 87.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 50.41, 74.44, 0.0, 0.0, 0.0, 89.9, 0.0, 0.0, 0.0, 0.0, 81.89, 0.0, 88.83, 0.0, 0.0, 44.75, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 58.17], ["hum", 6.11], ["speech", 3.13]], null, null], "duration": [0.67, 0.71, 1.37, 2.36, 2.09, 0.19, 1.32, 0.46, 15.5, 1.8, 1.21, 0.19, 1.05, 2.42, 0.55, 2.34, 0.52, 1.14, 2.38, 0.48, -0.01]} \ No newline at end of file diff --git a/annotations_filtered/vKMMeOLK9Y4_filtered.json b/annotations_filtered/vKMMeOLK9Y4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60f198799d3b535a5c4599d9ad886bdaa697b7f0 --- /dev/null +++ b/annotations_filtered/vKMMeOLK9Y4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.99], [21.0, 26.33], [29.0, 29.15], [31.0, 30.77], [34.0, 45.71], [50.0, 69.55], [73.0, 86.1], [92.0, 92.82], [102.0, 103.86], [105.0, 107.06], [108.0, 110.22], [112.0, 112.85], [114.0, 120.06], [123.0, 130.0]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [29.7, 27.92, 0.0, 0.0, 28.15, 28.16, 28.47, 0.0, 0.0, 33.47, 33.37, 0.0, 29.01, 28.44], "audiomae_on_audioset": [[["music", 51.94], ["speech", 13.57], ["throbbing", 7.0]], [["music", 83.65], ["speech", 2.05], ["house music", 1.32]], null, null, [["music", 77.33], ["speech", 4.68], ["electronic music", 2.95]], [["music", 84.75], ["house music", 3.26], ["electronic music", 2.04]], [["speech", 44.95], ["music", 8.83], ["vehicle", 5.01]], null, null, [["sound effect", 10.58], ["music", 10.38], ["echo", 8.85]], [["civil defense siren", 44.66], ["speech", 19.32], ["siren", 14.61]], null, [["music", 86.36], ["speech", 4.11], ["didgeridoo", 1.14]], [["music", 87.31], ["singing", 2.55], ["beatboxing", 1.97]]], "duration": [2.99, 5.33, 0.15, -0.23, 11.71, 19.55, 13.1, 0.82, 1.86, 2.06, 2.22, 0.85, 6.06, 7.0]} \ No newline at end of file diff --git a/annotations_filtered/vKZhOw3Feo4_filtered.json b/annotations_filtered/vKZhOw3Feo4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5722f67ca1613b8600ed822c5a25b8e32450f09b --- /dev/null +++ b/annotations_filtered/vKZhOw3Feo4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 28.65], [36.0, 44.27], [61.0, 61.47]], "keep_status": [false, false, false], "silence_prob": [0.0, 36.02, 0.0], "audiomae_on_audioset": [null, [["speech", 41.54], ["music", 32.47], ["hum", 4.88]], null], "duration": [0.65, 8.27, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/vKcEalTIwfQ_filtered.json b/annotations_filtered/vKcEalTIwfQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d41b670417ed33f89ed6856537e0856d6d62836f --- /dev/null +++ b/annotations_filtered/vKcEalTIwfQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.33], [4.0, 4.38], [4.0, 5.12], [6.0, 6.52], [11.0, 13.64], [18.0, 28.07], [33.0, 32.93], [35.0, 42.96], [46.0, 46.68], [55.0, 56.2], [57.0, 63.31], [66.0, 67.02], [78.0, 79.46], [83.0, 82.97], [84.0, 85.09], [90.0, 90.91], [96.0, 96.47], [101.0, 100.89]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.72, 30.11, 0.0, 31.13, 0.0, 0.0, 31.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 35.87], ["hum", 12.3], ["music", 10.69]], [["speech", 47.4], ["hum", 16.56], ["music", 9.1]], null, [["music", 41.49], ["hum", 14.87], ["throbbing", 9.89]], null, null, [["sidetone", 42.31], ["speech", 17.52], ["mains hum", 14.15]], null, null, null, null, null, null, null], "duration": [0.33, 0.38, 1.12, 0.52, 2.64, 10.07, -0.07, 7.96, 0.68, 1.2, 6.31, 1.02, 1.46, -0.03, 1.09, 0.91, 0.47, -0.11]} \ No newline at end of file diff --git a/annotations_filtered/vKePn-57zAA_filtered.json b/annotations_filtered/vKePn-57zAA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3302399a6e1312299ee875b6109bac58e6436964 --- /dev/null +++ b/annotations_filtered/vKePn-57zAA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.21], [5.0, 6.47], [7.0, 17.69], [18.0, 19.63], [25.0, 25.22], [30.0, 29.57], [38.0, 38.8], [41.0, 42.01], [44.0, 47.82], [57.0, 57.59], [59.0, 59.27], [61.0, 64.17], [69.0, 69.2], [72.0, 72.87], [77.0, 92.01], [92.0, 93.02], [96.0, 97.58], [104.0, 105.33], [110.0, 118.37], [119.0, 119.85], [122.0, 122.69], [125.0, 128.17], [129.0, 130.65], [131.0, 136.16], [139.0, 140.39], [141.0, 141.08], [141.0, 142.75], [145.0, 150.85], [152.0, 154.14], [170.0, 171.05], [171.0, 198.85], [199.0, 200.91], [201.0, 207.13], [213.0, 214.15], [218.0, 227.87], [231.0, 232.98], [234.0, 234.2], [236.0, 237.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [83.16, 0.0, 97.92, 0.0, 0.0, 0.0, 0.0, 0.0, 88.46, 0.0, 0.0, 75.07, 0.0, 0.0, 91.81, 0.0, 0.0, 0.0, 60.98, 0.0, 0.0, 96.17, 0.0, 84.98, 0.0, 0.0, 0.0, 87.92, 99.94, 0.0, 86.27, 0.0, 32.41, 0.0, 43.51, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.8], ["music", 32.71], ["sidetone", 7.94]], null, [["animal", 31.89], ["livestock, farm animals, working animals", 11.39], ["cattle, bovinae", 8.24]], null, null, null], "duration": [2.21, 1.47, 10.69, 1.63, 0.22, -0.43, 0.8, 1.01, 3.82, 0.59, 0.27, 3.17, 0.2, 0.87, 15.01, 1.02, 1.58, 1.33, 8.37, 0.85, 0.69, 3.17, 1.65, 5.16, 1.39, 0.08, 1.75, 5.85, 2.14, 1.05, 27.85, 1.91, 6.13, 1.15, 9.87, 1.98, 0.2, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/vKhAdR1G9io_filtered.json b/annotations_filtered/vKhAdR1G9io_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44268bac926839ea24b0662c6c2aa1fb42bfd983 --- /dev/null +++ b/annotations_filtered/vKhAdR1G9io_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.24], [3.0, 4.08], [5.0, 8.18], [12.0, 15.5], [17.0, 18.22], [19.0, 19.67], [20.0, 22.01], [23.0, 25.05], [26.0, 27.4], [35.0, 36.75], [39.0, 40.17], [41.0, 42.25], [43.0, 43.88], [49.0, 48.95], [49.0, 49.4], [53.0, 56.22], [59.0, 63.27], [66.0, 67.41], [72.0, 72.27], [75.0, 78.29], [80.0, 83.81], [85.0, 86.0], [89.0, 89.31], [90.0, 90.39], [91.0, 91.77], [93.0, 99.0], [100.0, 100.6], [102.0, 104.18], [109.0, 111.35], [114.0, 114.74], [119.0, 119.57], [127.0, 128.26]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 96.66, 97.92, 0.0, 0.0, 49.54, 45.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.1, 75.72, 0.0, 0.0, 94.95, 97.11, 0.0, 0.0, 0.0, 0.0, 43.18, 0.0, 45.85, 46.64, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["sine wave", 37.95], ["chirp tone", 29.14], ["tuning fork", 9.83]], [["sidetone", 26.79], ["speech", 22.39], ["telephone", 10.27]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.03], ["hum", 12.34], ["mains hum", 5.09]], null, [["speech", 17.51], ["fly, housefly", 13.5], ["mosquito", 8.37]], [["mains hum", 12.89], ["hum", 12.62], ["throbbing", 12.11]], null, null, null], "duration": [0.24, 1.08, 3.18, 3.5, 1.22, 0.67, 2.01, 2.05, 1.4, 1.75, 1.17, 1.25, 0.88, -0.05, 0.4, 3.22, 4.27, 1.41, 0.27, 3.29, 3.81, 1.0, 0.31, 0.39, 0.77, 6.0, 0.6, 2.18, 2.35, 0.74, 0.57, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/vKjBFsyYC0g_filtered.json b/annotations_filtered/vKjBFsyYC0g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcd9963e0e6c98e5cddb8fadb3b6a166bb18ab0d --- /dev/null +++ b/annotations_filtered/vKjBFsyYC0g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.95], [20.0, 20.98], [23.0, 23.5], [29.0, 29.17], [30.0, 33.08], [37.0, 39.21], [41.0, 42.92], [45.0, 46.43], [47.0, 62.16], [63.0, 64.3], [68.0, 68.81], [76.0, 78.24], [84.0, 84.6], [89.0, 89.01], [113.0, 115.64]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 55.89, 45.27, 0.0, 0.0, 44.52, 0.0, 0.0, 63.85, 0.0, 0.0, 59.33], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 31.35], ["whale vocalization", 20.92], ["music", 11.0]], null, null, [["hum", 34.54], ["mains hum", 15.28], ["noise", 10.55]], null, null, null, null, null, null], "duration": [0.95, 0.98, 0.5, 0.17, 3.08, 2.21, 1.92, 1.43, 15.16, 1.3, 0.81, 2.24, 0.6, 0.01, 2.64]} \ No newline at end of file diff --git a/annotations_filtered/vLAQiwEGGKs_filtered.json b/annotations_filtered/vLAQiwEGGKs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..05c5b464e58ec01d62dced0cf85c840d2b79a023 --- /dev/null +++ b/annotations_filtered/vLAQiwEGGKs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 51.49], [53.0, 54.24], [57.0, 57.52], [62.0, 62.87], [66.0, 66.48], [70.0, 71.27], [73.0, 74.28], [76.0, 76.91], [78.0, 79.49], [81.0, 82.32], [83.0, 101.88]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [39.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.34], "audiomae_on_audioset": [[["hum", 23.98], ["eruption", 19.15], ["noise", 9.52]], null, null, null, null, null, null, null, null, null, [["radio", 22.14], ["white noise", 16.12], ["noise", 15.73]]], "duration": [4.49, 1.24, 0.52, 0.87, 0.48, 1.27, 1.28, 0.91, 1.49, 1.32, 18.88]} \ No newline at end of file diff --git a/annotations_filtered/vLXjWGI8sfw_filtered.json b/annotations_filtered/vLXjWGI8sfw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1db5616052b6b83108e7b394fd22dd9400de498 --- /dev/null +++ b/annotations_filtered/vLXjWGI8sfw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.5], [18.0, 24.43], [27.0, 28.05], [29.0, 30.11], [35.0, 35.72], [37.0, 40.22], [42.0, 43.11], [44.0, 44.83], [50.0, 51.21], [53.0, 53.32], [55.0, 55.05], [59.0, 59.41], [61.0, 62.16], [68.0, 69.06], [71.0, 71.98], [73.0, 74.12], [76.0, 78.56], [79.0, 80.86], [84.0, 84.35], [85.0, 91.32], [92.0, 93.04], [99.0, 99.59], [104.0, 103.99], [110.0, 112.94], [116.0, 118.83], [123.0, 128.85], [130.0, 131.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 52.92, 0.0, 0.0, 0.0, 74.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.5, 0.0, 0.0, 46.12, 0.0, 0.0, 0.0, 84.25, 68.67, 43.82, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 42.72], ["bee, wasp, etc.", 18.87], ["insect", 12.02]], null, null, null, null, null, [["speech", 69.39], ["hum", 6.44], ["radio", 1.95]], null], "duration": [0.5, 6.43, 1.05, 1.11, 0.72, 3.22, 1.11, 0.83, 1.21, 0.32, 0.05, 0.41, 1.16, 1.06, 0.98, 1.12, 2.56, 1.86, 0.35, 6.32, 1.04, 0.59, -0.01, 2.94, 2.83, 5.85, 1.97]} \ No newline at end of file diff --git a/annotations_filtered/vLgTWXjMlWI_filtered.json b/annotations_filtered/vLgTWXjMlWI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7a55d490f99089671f89fcb620506f6117d0418 --- /dev/null +++ b/annotations_filtered/vLgTWXjMlWI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.49], [39.0, 40.59], [42.0, 43.28], [49.0, 49.69], [50.0, 54.89], [56.0, 58.55], [60.0, 62.56], [64.0, 68.5], [71.0, 71.22], [72.0, 72.91], [76.0, 77.84], [88.0, 88.5], [89.0, 89.67], [90.0, 90.26], [91.0, 91.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 56.78, 99.96, 99.93, 98.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.49, 1.59, 1.28, 0.69, 4.89, 2.55, 2.56, 4.5, 0.22, 0.91, 1.84, 0.5, 0.67, 0.26, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/vLt5ei598CY_filtered.json b/annotations_filtered/vLt5ei598CY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1a751fedd8269ce0fe114b9c472245fab9567ae --- /dev/null +++ b/annotations_filtered/vLt5ei598CY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 22.32], [23.0, 28.0], [29.0, 30.16], [33.0, 36.1], [37.0, 37.94], [39.0, 40.53], [41.0, 52.2], [53.0, 53.03], [57.0, 57.99], [59.0, 60.88], [61.0, 62.31], [66.0, 69.8], [70.0, 70.78], [74.0, 85.6], [89.0, 89.94], [93.0, 106.42], [107.0, 108.35], [109.0, 109.51], [111.0, 113.54], [114.0, 116.56], [118.0, 119.52], [125.0, 141.35], [141.0, 146.1], [147.0, 153.69], [155.0, 155.53], [156.0, 158.94], [159.0, 159.39], [160.0, 160.78], [161.0, 161.49]], "keep_status": [true, true, false, true, false, false, true, false, false, false, false, true, false, true, false, false, false, false, true, true, false, true, false, true, false, false, false, false, false], "silence_prob": [30.61, 31.24, 0.0, 49.73, 0.0, 0.0, 30.73, 0.0, 0.0, 0.0, 0.0, 31.13, 0.0, 34.51, 0.0, 31.53, 0.0, 0.0, 35.33, 34.08, 0.0, 30.15, 30.78, 29.72, 0.0, 30.62, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["electric shaver, electric razor", 14.07], ["music", 13.61], ["buzz", 5.18]], [["whale vocalization", 14.86], ["sheep", 13.66], ["civil defense siren", 11.77]], null, [["hum", 46.18], ["mains hum", 14.98], ["throbbing", 6.06]], null, null, [["vehicle", 22.98], ["boat, water vehicle", 7.27], ["aircraft", 4.93]], null, null, null, null, [["whack, thwack", 22.11], ["speech", 20.64], ["rumble", 7.53]], null, [["buzz", 36.11], ["hum", 13.22], ["speech", 10.77]], null, [["music", 65.78], ["theremin", 7.02], ["electronic music", 2.93]], null, null, [["mains hum", 16.84], ["whale vocalization", 14.24], ["hum", 10.56]], [["hum", 35.34], ["mains hum", 21.67], ["throbbing", 9.91]], null, [["speech", 26.81], ["music", 13.83], ["breaking", 8.42]], [["speech", 49.7], ["vehicle", 12.35], ["music", 8.85]], [["music", 42.06], ["speech", 18.75], ["buzz", 8.42]], null, [["cattle, bovinae", 32.4], ["livestock, farm animals, working animals", 24.83], ["moo", 13.6]], null, null, null], "duration": [18.32, 5.0, 1.16, 3.1, 0.94, 1.53, 11.2, 0.03, 0.99, 1.88, 1.31, 3.8, 0.78, 11.6, 0.94, 13.42, 1.35, 0.51, 2.54, 2.56, 1.52, 16.35, 5.1, 6.69, 0.53, 2.94, 0.39, 0.78, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/vLw24Xr1zKo_filtered.json b/annotations_filtered/vLw24Xr1zKo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d7a546874128d0735db2f5910f96635d61452eb --- /dev/null +++ b/annotations_filtered/vLw24Xr1zKo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 12.87], [14.0, 17.95], [23.0, 24.81], [26.0, 32.37], [37.0, 37.91], [43.0, 43.41], [46.0, 66.07], [71.0, 86.78], [88.0, 89.13], [119.0, 119.15], [119.0, 120.92], [122.0, 123.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 51.18, 0.0, 30.47, 0.0, 0.0, 30.05, 39.85, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 42.91], ["music", 35.93], ["explosion", 3.97]], null, null, [["speech", 71.6], ["music", 10.37], ["vehicle", 1.69]], [["speech", 46.83], ["music", 28.97], ["hum", 5.64]], null, null, null, null], "duration": [-0.13, 3.95, 1.81, 6.37, 0.91, 0.41, 20.07, 15.78, 1.13, 0.15, 1.92, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/vLxUYa47OXE_filtered.json b/annotations_filtered/vLxUYa47OXE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf13524dc5cbbc61d771582153dad98032ac609a --- /dev/null +++ b/annotations_filtered/vLxUYa47OXE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.08], [4.0, 5.07], [6.0, 7.05], [9.0, 9.04], [10.0, 10.77], [12.0, 12.18], [13.0, 13.66], [22.0, 23.68], [30.0, 31.18], [34.0, 36.36], [40.0, 40.41], [45.0, 45.82], [47.0, 47.56], [48.0, 49.5], [50.0, 51.04], [60.0, 60.44], [62.0, 62.21], [63.0, 81.51], [84.0, 85.99], [86.0, 87.27], [88.0, 90.32], [95.0, 98.86], [100.0, 102.78], [106.0, 107.23], [112.0, 112.35], [113.0, 114.03], [129.0, 129.86], [143.0, 146.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 99.97, 0.0, 0.0, 0.0, 0.0, 91.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.08, 1.07, 1.05, 0.04, 0.77, 0.18, 0.66, 1.68, 1.18, 2.36, 0.41, 0.82, 0.56, 1.5, 1.04, 0.44, 0.21, 18.51, 1.99, 1.27, 2.32, 3.86, 2.78, 1.23, 0.35, 1.03, 0.86, 3.8]} \ No newline at end of file diff --git a/annotations_filtered/vM7QMLTm1so_filtered.json b/annotations_filtered/vM7QMLTm1so_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aae6356d745b18c6f9315b82ca3caac1a3660430 --- /dev/null +++ b/annotations_filtered/vM7QMLTm1so_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.51], [8.0, 11.16], [12.0, 15.25], [22.0, 22.76], [23.0, 22.84], [29.0, 31.36], [34.0, 35.04], [37.0, 37.07], [39.0, 39.19], [45.0, 46.04], [48.0, 48.86], [50.0, 51.34], [55.0, 61.77], [64.0, 65.11], [85.0, 85.85], [94.0, 98.42], [99.0, 99.74], [100.0, 124.09], [125.0, 129.69], [131.0, 142.11], [162.0, 164.24], [166.0, 168.24], [173.0, 177.72], [178.0, 177.75], [178.0, 177.79], [178.0, 177.82], [179.0, 194.34], [207.0, 211.82]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, true, false, true, false, false, false, false, true], "silence_prob": [0.0, 29.36, 39.35, 0.0, 0.0, 52.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.61, 0.0, 0.0, 31.48, 0.0, 30.96, 36.44, 32.6, 32.2, 31.78, 30.1, 0.0, 0.0, 0.0, 30.39, 35.35], "audiomae_on_audioset": [null, [["vehicle", 14.28], ["music", 12.82], ["aircraft", 10.38]], [["speech", 35.72], ["music", 15.67], ["hum", 5.93]], null, null, null, null, null, null, null, null, null, [["music", 30.9], ["explosion", 24.39], ["burst, pop", 12.74]], null, null, [["cattle, bovinae", 50.41], ["moo", 39.11], ["livestock, farm animals, working animals", 8.77]], null, [["music", 44.98], ["throbbing", 10.56], ["smash, crash", 6.63]], [["music", 48.5], ["trombone", 15.65], ["brass instrument", 11.54]], [["music", 40.61], ["groan", 27.33], ["whack, thwack", 11.53]], [["speech", 36.72], ["fart", 12.97], ["grunt", 3.43]], [["hum", 29.73], ["music", 22.83], ["throbbing", 20.38]], [["speech", 31.19], ["music", 26.22], ["throbbing", 2.07]], null, null, null, [["speech", 37.23], ["music", 27.24], ["whack, thwack", 6.78]], [["music", 59.03], ["hum", 4.43], ["electronic music", 3.16]]], "duration": [0.51, 3.16, 3.25, 0.76, -0.16, 2.36, 1.04, 0.07, 0.19, 1.04, 0.86, 1.34, 6.77, 1.11, 0.85, 4.42, 0.74, 24.09, 4.69, 11.11, 2.24, 2.24, 4.72, -0.25, -0.21, -0.18, 15.34, 4.82]} \ No newline at end of file diff --git a/annotations_filtered/vMwfVOf1-vM_filtered.json b/annotations_filtered/vMwfVOf1-vM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c56bb3d121a2297a5d5537831cae716b6d989c25 --- /dev/null +++ b/annotations_filtered/vMwfVOf1-vM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.55], [17.0, 17.79], [34.0, 33.76], [34.0, 38.94], [54.0, 54.9], [58.0, 58.35], [59.0, 59.88], [65.0, 68.64], [76.0, 75.96], [77.0, 77.55], [80.0, 81.72], [84.0, 86.32], [89.0, 89.13], [102.0, 102.44], [102.0, 102.61], [103.0, 102.68], [103.0, 102.73], [103.0, 102.78], [103.0, 104.09], [105.0, 104.7], [105.0, 105.95], [108.0, 109.68], [111.0, 111.54], [113.0, 113.51], [115.0, 116.58]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.68, 0.0, 0.0, 35.34, 0.0, 0.0, 0.0, 39.25, 0.0, 0.0, 0.0, 78.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 73.71], ["thunk", 6.71], ["inside, small room", 4.24]], null, null, [["speech", 65.33], ["music", 15.89], ["boing", 3.32]], null, null, null, [["music", 30.34], ["drum", 13.38], ["percussion", 10.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.55, 0.79, -0.24, 4.94, 0.9, 0.35, 0.88, 3.64, -0.04, 0.55, 1.72, 2.32, 0.13, 0.44, 0.61, -0.32, -0.27, -0.22, 1.09, -0.3, 0.95, 1.68, 0.54, 0.51, 1.58]} \ No newline at end of file diff --git a/annotations_filtered/vNPCXKmF9LI_filtered.json b/annotations_filtered/vNPCXKmF9LI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da3b053ac83ceaf781b20d7140f7ef2d18094b6f --- /dev/null +++ b/annotations_filtered/vNPCXKmF9LI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.53], [3.0, 4.53], [6.0, 6.29], [14.0, 15.08], [16.0, 16.85], [20.0, 20.11], [27.0, 28.39], [37.0, 37.49], [38.0, 38.28], [45.0, 46.57], [47.0, 47.51], [49.0, 50.58], [51.0, 52.22], [55.0, 55.14], [57.0, 57.16], [59.0, 59.59], [60.0, 62.82], [69.0, 69.57], [71.0, 71.88], [75.0, 77.36], [78.0, 78.54], [88.0, 89.36], [91.0, 91.32], [95.0, 99.0], [103.0, 106.81], [114.0, 115.43], [119.0, 119.37], [120.0, 122.77], [123.0, 130.59], [134.0, 135.58], [138.0, 142.3], [144.0, 144.19], [146.0, 169.59], [171.0, 172.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.04, 0.0, 0.0, 99.31, 0.0, 0.0, 0.0, 53.22, 31.14, 0.0, 0.0, 39.57, 32.43, 0.0, 70.58, 0.0, 35.95, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 48.49], ["music", 15.34], ["gunshot, gunfire", 6.84]], null, null, [["music", 20.28], ["hum", 16.32], ["mains hum", 11.43]], [["speech", 42.68], ["music", 30.01], ["whack, thwack", 3.5]], null, null, null, [["music", 63.97], ["grunt", 5.55], ["breaking", 5.38]], null], "duration": [0.53, 1.53, 0.29, 1.08, 0.85, 0.11, 1.39, 0.49, 0.28, 1.57, 0.51, 1.58, 1.22, 0.14, 0.16, 0.59, 2.82, 0.57, 0.88, 2.36, 0.54, 1.36, 0.32, 4.0, 3.81, 1.43, 0.37, 2.77, 7.59, 1.58, 4.3, 0.19, 23.59, 1.64]} \ No newline at end of file diff --git a/annotations_filtered/vN_HrPvTVIk_filtered.json b/annotations_filtered/vN_HrPvTVIk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae2118f7cf1c50a1942c651f17c28b3190a58da7 --- /dev/null +++ b/annotations_filtered/vN_HrPvTVIk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.3], [6.0, 6.98], [9.0, 9.19], [11.0, 11.18], [13.0, 13.22], [14.0, 14.86], [23.0, 22.82], [24.0, 24.33], [25.0, 26.23], [29.0, 29.62], [31.0, 32.73], [33.0, 35.38], [48.0, 51.81], [58.0, 63.19], [68.0, 76.15], [80.0, 81.24], [82.0, 83.81], [85.0, 86.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.89, 30.2, 32.37, 37.47, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 76.5], ["telephone", 7.45], ["busy signal", 2.57]], [["speech", 74.78], ["skateboard", 2.91], ["honk", 1.93]], [["speech", 75.52], ["animal", 2.92], ["dog", 1.74]], [["fly, housefly", 49.44], ["insect", 26.5], ["bee, wasp, etc.", 12.47]], null, null, null], "duration": [0.3, 0.98, 0.19, 0.18, 0.22, 0.86, -0.18, 0.33, 1.23, 0.62, 1.73, 2.38, 3.81, 5.19, 8.15, 1.24, 1.81, 1.64]} \ No newline at end of file diff --git a/annotations_filtered/vO2jvLIyIV4_filtered.json b/annotations_filtered/vO2jvLIyIV4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3473e421d3ba348e34e8db99ed97ef654973f0b7 --- /dev/null +++ b/annotations_filtered/vO2jvLIyIV4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.09], [6.0, 7.1], [9.0, 10.74], [16.0, 16.33], [17.0, 18.37], [28.0, 29.59], [31.0, 32.93], [35.0, 35.83], [41.0, 41.76], [45.0, 46.89], [48.0, 48.78], [50.0, 72.54], [74.0, 76.87], [79.0, 79.05], [84.0, 84.7], [85.0, 90.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.98, 73.21, 0.0, 0.0, 41.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["hum", 56.04], ["throbbing", 17.67], ["mains hum", 11.61]], null, null, null, [["bee, wasp, etc.", 27.5], ["insect", 19.28], ["speech", 14.18]]], "duration": [0.09, 1.1, 1.74, 0.33, 1.37, 1.59, 1.93, 0.83, 0.76, 1.89, 0.78, 22.54, 2.87, 0.05, 0.7, 5.36]} \ No newline at end of file diff --git a/annotations_filtered/vOQ211AFtLU_filtered.json b/annotations_filtered/vOQ211AFtLU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ea773b90a6cd86292bd832bfe8d6627aa29b55d --- /dev/null +++ b/annotations_filtered/vOQ211AFtLU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.71], [25.0, 29.94], [31.0, 36.54], [38.0, 40.66], [41.0, 57.35], [58.0, 59.83], [61.0, 61.65], [65.0, 69.97], [71.0, 75.69], [77.0, 99.54], [101.0, 101.14], [103.0, 104.35], [106.0, 107.42], [109.0, 110.37], [112.0, 112.7], [115.0, 116.41], [117.0, 119.11]], "keep_status": [false, false, false, false, true, false, false, true, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 82.79, 76.37, 89.19, 47.9, 0.0, 0.0, 37.32, 57.09, 32.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.06], "audiomae_on_audioset": [null, null, null, null, [["mains hum", 24.06], ["music", 21.51], ["hum", 20.1]], null, null, [["hum", 38.19], ["music", 19.84], ["mains hum", 8.03]], null, [["music", 15.61], ["explosion", 15.07], ["hum", 8.15]], null, null, null, null, null, null, [["music", 42.88], ["speech", 14.63], ["hum", 12.14]]], "duration": [1.71, 4.94, 5.54, 2.66, 16.35, 1.83, 0.65, 4.97, 4.69, 22.54, 0.14, 1.35, 1.42, 1.37, 0.7, 1.41, 2.11]} \ No newline at end of file diff --git a/annotations_filtered/vOTtCjGqXYo_filtered.json b/annotations_filtered/vOTtCjGqXYo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5998237a51d51266460e919851856383998ae157 --- /dev/null +++ b/annotations_filtered/vOTtCjGqXYo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.76], [27.0, 28.9], [29.0, 29.62], [30.0, 34.74], [40.0, 41.3], [45.0, 46.08], [49.0, 52.91], [53.0, 52.98], [73.0, 76.23], [76.0, 76.27], [77.0, 78.75], [81.0, 83.24], [85.0, 87.66], [90.0, 91.98], [94.0, 96.15], [99.0, 116.85], [117.0, 117.22], [119.0, 119.65], [121.0, 123.7], [139.0, 138.82], [139.0, 144.26], [179.0, 212.33]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 29.36, 0.0, 0.0, 30.71, 0.0, 29.65, 0.0, 0.0, 31.6, 30.55, 0.0, 32.1, 29.72, 0.0, 0.0, 29.53, 0.0, 30.31, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 45.04], ["afrobeat", 7.26], ["moo", 6.51]], null, null, [["music", 60.41], ["didgeridoo", 3.53], ["funk", 2.54]], null, [["music", 59.81], ["musical instrument", 6.31], ["carnatic music", 5.04]], null, null, [["music", 39.25], ["livestock, farm animals, working animals", 16.98], ["cattle, bovinae", 15.34]], [["moo", 37.77], ["cattle, bovinae", 37.62], ["livestock, farm animals, working animals", 15.97]], null, [["music", 41.2], ["guitar", 9.46], ["musical instrument", 7.53]], [["music", 50.25], ["moo", 8.6], ["cattle, bovinae", 7.69]], null, null, [["music", 58.26], ["mantra", 8.74], ["chant", 3.88]], null, [["music", 62.82], ["carnatic music", 11.57], ["musical instrument", 4.79]], null], "duration": [0.76, 1.9, 0.62, 4.74, 1.3, 1.08, 3.91, -0.02, 3.23, 0.27, 1.75, 2.24, 2.66, 1.98, 2.15, 17.85, 0.22, 0.65, 2.7, -0.18, 5.26, 33.33]} \ No newline at end of file diff --git a/annotations_filtered/vOfFVhSiwiA_filtered.json b/annotations_filtered/vOfFVhSiwiA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97a3a27da2d82fe3ca8bc5ce11bb287dac15eaee --- /dev/null +++ b/annotations_filtered/vOfFVhSiwiA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 24.07], [25.0, 26.28], [27.0, 33.61], [35.0, 35.87], [39.0, 43.16], [44.0, 44.86], [45.0, 50.04], [50.0, 63.0], [63.0, 80.3], [82.0, 121.63]], "keep_status": [true, false, true, false, true, false, true, false, false, false], "silence_prob": [37.14, 0.0, 40.36, 0.0, 37.55, 0.0, 34.53, 33.45, 28.6, 0.0], "audiomae_on_audioset": [[["music", 39.89], ["hum", 13.11], ["throbbing", 5.6]], null, [["music", 19.29], ["hum", 13.0], ["mains hum", 12.58]], null, [["music", 39.82], ["didgeridoo", 7.54], ["livestock, farm animals, working animals", 6.43]], null, [["hum", 21.68], ["music", 20.47], ["mains hum", 18.66]], [["music", 48.47], ["hum", 17.22], ["throbbing", 8.95]], [["hum", 36.52], ["music", 23.32], ["throbbing", 22.91]], null], "duration": [5.07, 1.28, 6.61, 0.87, 4.16, 0.86, 5.04, 13.0, 17.3, 39.63]} \ No newline at end of file diff --git a/annotations_filtered/vOnWEmbW3OQ_filtered.json b/annotations_filtered/vOnWEmbW3OQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe1a69952a35c9f9a37194192bd9835dd1a1e7b7 --- /dev/null +++ b/annotations_filtered/vOnWEmbW3OQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.8], [8.0, 10.4], [11.0, 13.69], [15.0, 15.23], [16.0, 32.8], [34.0, 35.51], [49.0, 51.36], [53.0, 54.33], [55.0, 55.48], [62.0, 77.04], [82.0, 98.41], [100.0, 112.11], [115.0, 116.46]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, true, false], "silence_prob": [0.0, 53.53, 56.86, 0.0, 58.64, 0.0, 50.97, 0.0, 0.0, 32.13, 29.83, 29.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 38.27], ["music", 25.04], ["outside, rural or natural", 4.58]], [["music", 17.67], ["mains hum", 17.34], ["hum", 11.98]], [["music", 44.76], ["throbbing", 9.91], ["hum", 6.57]], null], "duration": [0.8, 2.4, 2.69, 0.23, 16.8, 1.51, 2.36, 1.33, 0.48, 15.04, 16.41, 12.11, 1.46]} \ No newline at end of file diff --git a/annotations_filtered/vOoyaqLrZnE_filtered.json b/annotations_filtered/vOoyaqLrZnE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba67ae5e584e01eafdfeb32c3b8c82990aa1939a --- /dev/null +++ b/annotations_filtered/vOoyaqLrZnE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.27], [5.0, 10.79], [12.0, 19.18], [20.0, 21.17], [22.0, 25.02], [27.0, 30.64], [32.0, 32.43], [33.0, 38.4], [39.0, 45.99], [47.0, 47.88], [51.0, 55.49], [58.0, 59.12], [60.0, 61.64], [63.0, 65.45], [68.0, 70.04], [75.0, 75.09], [76.0, 76.52], [78.0, 78.87], [79.0, 79.91], [81.0, 98.49], [104.0, 105.81], [107.0, 108.41], [112.0, 112.62], [113.0, 113.48], [115.0, 115.26], [117.0, 117.53], [122.0, 122.64], [125.0, 125.0], [130.0, 130.44], [136.0, 136.71], [138.0, 140.21], [142.0, 143.63]], "keep_status": [true, true, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.87, 38.43, 50.66, 0.0, 50.76, 61.77, 0.0, 42.28, 34.7, 0.0, 54.1, 0.0, 0.0, 31.73, 33.74, 0.0, 0.0, 0.0, 0.0, 29.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.03, 0.0], "audiomae_on_audioset": [[["speech", 16.46], ["music", 12.65], ["throbbing", 9.63]], [["hum", 20.29], ["speech", 19.26], ["mains hum", 14.86]], null, null, null, null, null, [["speech", 29.15], ["didgeridoo", 24.59], ["music", 15.25]], [["thunk", 51.75], ["clang", 9.55], ["ding", 6.42]], null, null, null, null, [["speech", 54.75], ["dial tone", 29.51], ["busy signal", 3.41]], [["speech", 64.55], ["sine wave", 5.34], ["dial tone", 4.5]], null, null, null, null, [["music", 29.07], ["hum", 22.6], ["mains hum", 13.6]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.27, 5.79, 7.18, 1.17, 3.02, 3.64, 0.43, 5.4, 6.99, 0.88, 4.49, 1.12, 1.64, 2.45, 2.04, 0.09, 0.52, 0.87, 0.91, 17.49, 1.81, 1.41, 0.62, 0.48, 0.26, 0.53, 0.64, 0.0, 0.44, 0.71, 2.21, 1.63]} \ No newline at end of file diff --git a/annotations_filtered/vP7uKAQLwXc_filtered.json b/annotations_filtered/vP7uKAQLwXc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..296a3e7fbf10737fe357978bb908baa93d32808c --- /dev/null +++ b/annotations_filtered/vP7uKAQLwXc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 32.0], [37.0, 43.51], [45.0, 52.05], [54.0, 56.27], [60.0, 86.93]], "keep_status": [false, false, true, true, false], "silence_prob": [28.84, 28.7, 28.39, 28.79, 34.71], "audiomae_on_audioset": [[["music", 38.03], ["vehicle", 26.22], ["car", 19.26]], [["vehicle", 47.55], ["car", 16.4], ["music", 11.21]], [["vehicle", 37.51], ["car", 17.0], ["skidding", 13.39]], [["didgeridoo", 40.15], ["music", 17.69], ["hum", 6.94]], [["music", 46.56], ["hum", 15.29], ["mains hum", 8.68]]], "duration": [23.0, 6.51, 7.05, 2.27, 26.93]} \ No newline at end of file diff --git a/annotations_filtered/vP8C80lIRt0_filtered.json b/annotations_filtered/vP8C80lIRt0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fa3ec126d37c45a3b7f504db6adce5e26366471 --- /dev/null +++ b/annotations_filtered/vP8C80lIRt0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.36], [3.0, 2.93], [6.0, 7.52], [14.0, 14.81], [16.0, 20.39], [24.0, 25.93], [29.0, 29.46], [30.0, 31.82], [34.0, 34.3], [35.0, 38.18], [47.0, 49.89], [55.0, 57.2], [65.0, 65.64], [72.0, 75.39], [78.0, 79.62], [84.0, 85.73], [92.0, 93.51]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 37.36, 0.0, 0.0, 0.0, 0.0, 41.93, 33.95, 35.31, 0.0, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 67.55], ["hum", 12.06], ["throbbing", 8.16]], null, null, null, null, [["music", 32.53], ["speech", 23.07], ["throbbing", 5.49]], [["cattle, bovinae", 39.52], ["moo", 36.79], ["livestock, farm animals, working animals", 23.28]], [["whale vocalization", 16.74], ["noise", 16.24], ["music", 9.88]], null, null, null, null, null], "duration": [0.36, -0.07, 1.52, 0.81, 4.39, 1.93, 0.46, 1.82, 0.3, 3.18, 2.89, 2.2, 0.64, 3.39, 1.62, 1.73, 1.51]} \ No newline at end of file diff --git a/annotations_filtered/vPB2g1y2VFk_filtered.json b/annotations_filtered/vPB2g1y2VFk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0136c68ce94d3162154edd455251bb5bf52aa91 --- /dev/null +++ b/annotations_filtered/vPB2g1y2VFk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.38], [4.0, 6.0], [10.0, 16.21], [18.0, 19.36], [22.0, 24.53], [29.0, 29.15], [33.0, 34.38], [36.0, 36.34], [37.0, 38.16], [43.0, 49.11], [53.0, 53.77], [57.0, 57.43], [61.0, 65.72], [68.0, 68.61], [74.0, 74.73], [76.0, 77.41], [80.0, 80.23], [83.0, 87.12], [89.0, 89.31], [89.0, 89.7], [91.0, 91.47], [102.0, 103.08], [104.0, 105.16], [107.0, 107.45], [109.0, 110.03], [114.0, 114.1]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 52.33, 36.43, 0.0, 80.29, 0.0, 0.0, 0.0, 0.0, 34.93, 0.0, 0.0, 30.88, 0.0, 0.0, 0.0, 0.0, 33.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 30.83], ["throbbing", 19.79], ["music", 14.93]], null, null, null, null, null, null, [["hum", 26.98], ["speech", 18.02], ["noise", 10.05]], null, null, [["speech", 27.48], ["firecracker", 26.44], ["burst, pop", 13.42]], null, null, null, null, [["speech", 52.15], ["fart", 6.72], ["burst, pop", 5.25]], null, null, null, null, null, null, null, null], "duration": [0.38, 2.0, 6.21, 1.36, 2.53, 0.15, 1.38, 0.34, 1.16, 6.11, 0.77, 0.43, 4.72, 0.61, 0.73, 1.41, 0.23, 4.12, 0.31, 0.7, 0.47, 1.08, 1.16, 0.45, 1.03, 0.1]} \ No newline at end of file diff --git a/annotations_filtered/vPTTP3gSLJc_filtered.json b/annotations_filtered/vPTTP3gSLJc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09469e97b1fe4a4e244bbd6a294afb89b0126776 --- /dev/null +++ b/annotations_filtered/vPTTP3gSLJc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 91.25], [93.0, 116.24]], "keep_status": [false, false], "silence_prob": [0.0, 29.91], "audiomae_on_audioset": [null, [["music", 64.63], ["hum", 5.71], ["scary music", 5.3]]], "duration": [60.25, 23.24]} \ No newline at end of file diff --git a/annotations_filtered/vPYiq9JNq_c_filtered.json b/annotations_filtered/vPYiq9JNq_c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee73cbbbf345a89e8371fb87897e53963f2c50f6 --- /dev/null +++ b/annotations_filtered/vPYiq9JNq_c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.38], [26.0, 26.65], [27.0, 28.76], [29.0, 36.31], [40.0, 43.09], [48.0, 48.44], [51.0, 51.76], [53.0, 53.5], [59.0, 60.39], [65.0, 65.55], [72.0, 73.33], [76.0, 76.5], [95.0, 95.34], [100.0, 100.89], [103.0, 111.86], [112.0, 112.68]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.89, 33.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.31, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 67.66], ["music", 7.89], ["fireworks", 5.77]], [["speech", 47.04], ["cheering", 7.45], ["throbbing", 7.31]], null, null, null, null, null, null, null, null, null, [["speech", 53.1], ["hum", 9.56], ["explosion", 7.78]], null], "duration": [0.38, 0.65, 1.76, 7.31, 3.09, 0.44, 0.76, 0.5, 1.39, 0.55, 1.33, 0.5, 0.34, 0.89, 8.86, 0.68]} \ No newline at end of file diff --git a/annotations_filtered/vPs5yv77m9Y_filtered.json b/annotations_filtered/vPs5yv77m9Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/vPs5yv77m9Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/vQLNS3HWfCM_filtered.json b/annotations_filtered/vQLNS3HWfCM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0799ca59ad8e4c841264b8922eb287dbcb689199 --- /dev/null +++ b/annotations_filtered/vQLNS3HWfCM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.61], [5.0, 13.34], [15.0, 15.65], [18.0, 18.66], [19.0, 26.72], [28.0, 28.44], [29.0, 32.93], [34.0, 35.61], [37.0, 44.79], [48.0, 48.1], [49.0, 49.1]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 34.6, 0.0, 0.0, 34.94, 0.0, 30.46, 0.0, 30.48, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 46.8], ["theremin", 34.77], ["whale vocalization", 3.34]], null, null, [["music", 50.96], ["gong", 15.09], ["theremin", 12.54]], null, [["music", 39.85], ["theremin", 19.22], ["foghorn", 8.17]], null, [["theremin", 54.95], ["music", 28.37], ["foghorn", 3.73]], null, null], "duration": [1.61, 8.34, 0.65, 0.66, 7.72, 0.44, 3.93, 1.61, 7.79, 0.1, 0.1]} \ No newline at end of file diff --git a/annotations_filtered/vQSkLuEOdMM_filtered.json b/annotations_filtered/vQSkLuEOdMM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2023f178f0c8f3b1237d6825c3d0d5d4fa314cb --- /dev/null +++ b/annotations_filtered/vQSkLuEOdMM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.56], [8.0, 9.12], [10.0, 11.92], [14.0, 14.39], [15.0, 14.93], [16.0, 17.36], [18.0, 20.09], [21.0, 21.14], [22.0, 22.03], [23.0, 23.09], [24.0, 25.79], [29.0, 29.13], [30.0, 31.9], [33.0, 32.85], [35.0, 35.85], [37.0, 37.52], [38.0, 39.39], [43.0, 44.42], [47.0, 54.72], [56.0, 55.93], [61.0, 63.49], [66.0, 66.21], [67.0, 76.98], [77.0, 80.55], [86.0, 86.63], [88.0, 88.77], [90.0, 91.07], [93.0, 93.12], [95.0, 98.1], [100.0, 99.93], [102.0, 102.24], [103.0, 103.45], [104.0, 105.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.63, 0.0, 51.18, 0.0, 30.87, 47.46, 0.0, 0.0, 0.0, 0.0, 41.1, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 16.83], ["speech", 11.91], ["smash, crash", 9.88]], [["speech", 30.09], ["sine wave", 20.15], ["chirp tone", 12.83]], null, null, null, null, [["noise", 18.04], ["smash, crash", 10.23], ["hum", 8.33]], null, null, null, null], "duration": [0.56, 1.12, 1.92, 0.39, -0.07, 1.36, 2.09, 0.14, 0.03, 0.09, 1.79, 0.13, 1.9, -0.15, 0.85, 0.52, 1.39, 1.42, 7.72, -0.07, 2.49, 0.21, 9.98, 3.55, 0.63, 0.77, 1.07, 0.12, 3.1, -0.07, 0.24, 0.45, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/vQWmd8REdaE_filtered.json b/annotations_filtered/vQWmd8REdaE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3945dfc58c26f594268cfbf64886dba1dc7a200 --- /dev/null +++ b/annotations_filtered/vQWmd8REdaE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.68], [6.0, 6.62], [7.0, 21.14], [23.0, 26.15], [26.0, 34.84], [35.0, 38.65], [39.0, 105.33]], "keep_status": [false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 30.44, 33.16, 30.75, 34.05, 0.0], "audiomae_on_audioset": [null, null, [["speech", 35.32], ["music", 33.16], ["musical instrument", 6.67]], [["hum", 38.7], ["throbbing", 20.82], ["speech", 6.4]], [["music", 50.47], ["speech", 32.22], ["hum", 2.38]], [["music", 42.18], ["speech", 27.36], ["whale vocalization", 6.76]], null], "duration": [0.68, 0.62, 14.14, 3.15, 8.84, 3.65, 66.33]} \ No newline at end of file diff --git a/annotations_filtered/vQdFnS_u8UM_filtered.json b/annotations_filtered/vQdFnS_u8UM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aba7094d8cd25054fc8a964d00bcf5ef64e9172d --- /dev/null +++ b/annotations_filtered/vQdFnS_u8UM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.45], [4.0, 5.61], [7.0, 8.5], [10.0, 11.23], [15.0, 15.53], [19.0, 19.9], [23.0, 24.71], [28.0, 28.58], [32.0, 33.81], [35.0, 35.73], [37.0, 37.93], [39.0, 39.78], [43.0, 45.15], [46.0, 48.66], [52.0, 52.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.6, 63.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 29.41], ["quack", 20.92], ["duck", 16.31]], null, null], "duration": [0.45, 1.61, 1.5, 1.23, 0.53, 0.9, 1.71, 0.58, 1.81, 0.73, 0.93, 0.78, 2.15, 2.66, 0.86]} \ No newline at end of file diff --git a/annotations_filtered/vQyK7Re2-Jc_filtered.json b/annotations_filtered/vQyK7Re2-Jc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad36a40c7c2adb695d6e956f02b986a8248dcf04 --- /dev/null +++ b/annotations_filtered/vQyK7Re2-Jc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.51], [8.0, 8.07], [11.0, 10.98], [11.0, 20.38], [22.0, 26.0], [32.0, 39.19], [39.0, 56.78], [57.0, 65.6], [66.0, 75.57], [76.0, 77.75], [79.0, 84.06], [88.0, 94.44], [98.0, 102.51], [104.0, 110.69], [112.0, 126.12]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [37.17, 0.0, 0.0, 38.4, 39.58, 34.92, 31.59, 31.91, 30.43, 0.0, 30.25, 33.23, 43.69, 33.37, 32.51], "audiomae_on_audioset": [[["cattle, bovinae", 17.02], ["moo", 15.71], ["music", 11.23]], null, null, [["music", 70.64], ["didgeridoo", 9.71], ["musical instrument", 5.74]], [["music", 75.11], ["musical instrument", 6.49], ["didgeridoo", 3.2]], [["music", 53.99], ["speech", 6.22], ["animal", 3.96]], [["music", 70.36], ["musical instrument", 7.22], ["guitar", 6.53]], [["music", 83.47], ["didgeridoo", 1.16], ["song", 1.12]], [["music", 74.94], ["singing", 3.18], ["musical instrument", 2.71]], null, [["music", 70.47], ["singing", 8.1], ["musical instrument", 3.51]], [["music", 88.09], ["musical instrument", 3.29], ["guitar", 1.57]], [["music", 49.33], ["boing", 31.98], ["speech", 1.58]], [["music", 82.94], ["synthesizer", 2.7], ["singing", 2.08]], [["music", 85.24], ["singing", 3.74], ["musical instrument", 1.33]]], "duration": [3.51, 0.07, -0.02, 9.38, 4.0, 7.19, 17.78, 8.6, 9.57, 1.75, 5.06, 6.44, 4.51, 6.69, 14.12]} \ No newline at end of file diff --git a/annotations_filtered/vR1WPNzcXHE_filtered.json b/annotations_filtered/vR1WPNzcXHE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d181f5faab93ba8a4460168c81fbf1a7c67e3fcc --- /dev/null +++ b/annotations_filtered/vR1WPNzcXHE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.33], [16.0, 16.77], [21.0, 20.75], [50.0, 51.09], [60.0, 60.37], [74.0, 74.53], [82.0, 82.71], [88.0, 88.03], [101.0, 101.01], [103.0, 103.54], [106.0, 106.22], [111.0, 111.23], [113.0, 113.16], [125.0, 125.41], [126.0, 126.98], [129.0, 130.33], [131.0, 136.02], [136.0, 138.81], [146.0, 149.93], [152.0, 154.48], [156.0, 157.81], [163.0, 163.19], [169.0, 171.27], [173.0, 174.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.1, 83.52, 76.04, 54.1, 0.0, 0.0, 60.32, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.33, 0.77, -0.25, 1.09, 0.37, 0.53, 0.71, 0.03, 0.01, 0.54, 0.22, 0.23, 0.16, 0.41, 0.98, 1.33, 5.02, 2.81, 3.93, 2.48, 1.81, 0.19, 2.27, 1.72]} \ No newline at end of file diff --git a/annotations_filtered/vR3FPplcJGg_filtered.json b/annotations_filtered/vR3FPplcJGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c38068bc552e936728ad295a2f3d571180ee7b5 --- /dev/null +++ b/annotations_filtered/vR3FPplcJGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 65.48], [66.0, 65.55], [66.0, 72.25], [73.0, 74.88], [76.0, 106.51], [107.0, 122.13]], "keep_status": [false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 38.28, 0.0, 0.0, 43.03], "audiomae_on_audioset": [null, null, [["hum", 38.9], ["mains hum", 26.23], ["music", 10.43]], null, null, [["noise", 22.31], ["radio", 13.88], ["animal", 8.89]]], "duration": [63.48, -0.45, 6.25, 1.88, 30.51, 15.13]} \ No newline at end of file diff --git a/annotations_filtered/vRJ5cCP0ZPE_filtered.json b/annotations_filtered/vRJ5cCP0ZPE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..975771e20a63dc84b7396846c6c488403ee1956f --- /dev/null +++ b/annotations_filtered/vRJ5cCP0ZPE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.08], [5.0, 5.63], [8.0, 8.68], [11.0, 11.5], [14.0, 15.36], [17.0, 20.07], [22.0, 23.79], [29.0, 30.4], [32.0, 33.13], [36.0, 37.08], [40.0, 40.41], [41.0, 43.21], [46.0, 46.65], [50.0, 51.29], [55.0, 55.44], [58.0, 58.89], [61.0, 61.7], [66.0, 66.97], [71.0, 73.4], [75.0, 76.6], [81.0, 82.02], [84.0, 85.77], [91.0, 92.31], [94.0, 95.08], [97.0, 97.98], [99.0, 99.45], [101.0, 102.57], [103.0, 105.31], [106.0, 107.13], [108.0, 109.07], [111.0, 112.04], [114.0, 114.1], [115.0, 116.4], [116.0, 118.07], [119.0, 121.49], [122.0, 125.15], [126.0, 126.86], [128.0, 131.87], [134.0, 137.39], [143.0, 144.54], [147.0, 148.74], [150.0, 152.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 49.92, 0.0, 0.0, 0.0, 0.0, 0.0, 52.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.03, 0.0, 0.0, 0.0, 0.0, 0.0, 46.72, 42.79, 37.53, 0.0, 52.62, 57.01, 0.0, 0.0, 48.56], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 59.96], ["mains hum", 9.62], ["eruption", 4.87]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 24.09], ["fly, housefly", 11.62], ["hum", 6.57]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 53.82], ["speech", 12.93], ["fly, housefly", 9.15]], [["hum", 41.41], ["mains hum", 25.61], ["throbbing", 13.64]], [["hum", 20.95], ["speech", 15.8], ["sidetone", 15.14]], null, null, null, null, null, [["music", 8.96], ["rain on surface", 8.87], ["rain", 8.81]]], "duration": [0.08, 0.63, 0.68, 0.5, 1.36, 3.07, 1.79, 1.4, 1.13, 1.08, 0.41, 2.21, 0.65, 1.29, 0.44, 0.89, 0.7, 0.97, 2.4, 1.6, 1.02, 1.77, 1.31, 1.08, 0.98, 0.45, 1.57, 2.31, 1.13, 1.07, 1.04, 0.1, 1.4, 2.07, 2.49, 3.15, 0.86, 3.87, 3.39, 1.54, 1.74, 2.34]} \ No newline at end of file diff --git a/annotations_filtered/vRUQ_q5mivc_filtered.json b/annotations_filtered/vRUQ_q5mivc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7e2ffb10a50468499dd711810f042376b7bb5f0 --- /dev/null +++ b/annotations_filtered/vRUQ_q5mivc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.1], [10.0, 12.48], [13.0, 22.94], [24.0, 30.35], [40.0, 42.06], [44.0, 45.23], [46.0, 62.78], [70.0, 83.3], [84.0, 87.34], [88.0, 88.94], [90.0, 94.29], [96.0, 96.52], [100.0, 120.61], [122.0, 131.13], [133.0, 173.85]], "keep_status": [false, false, true, true, true, false, false, true, true, false, false, false, true, true, false], "silence_prob": [0.0, 35.0, 30.08, 29.79, 32.15, 0.0, 30.63, 31.61, 32.84, 0.0, 44.93, 0.0, 35.42, 32.97, 0.0], "audiomae_on_audioset": [null, [["mains hum", 37.51], ["hum", 33.43], ["music", 10.78]], [["sidetone", 24.17], ["fly, housefly", 18.8], ["insect", 11.14]], [["speech", 44.71], ["music", 16.7], ["hum", 7.53]], [["moo", 25.9], ["cattle, bovinae", 21.39], ["livestock, farm animals, working animals", 16.19]], null, [["music", 57.72], ["speech", 14.65], ["theremin", 9.55]], [["fly, housefly", 22.24], ["music", 19.62], ["speech", 6.89]], [["speech", 33.67], ["music", 25.56], ["synthesizer", 4.68]], null, [["whale vocalization", 51.76], ["hum", 9.54], ["music", 9.41]], null, [["music", 50.71], ["ambient music", 7.09], ["hum", 6.78]], [["music", 40.33], ["didgeridoo", 14.01], ["throbbing", 13.27]], null], "duration": [0.1, 2.48, 9.94, 6.35, 2.06, 1.23, 16.78, 13.3, 3.34, 0.94, 4.29, 0.52, 20.61, 9.13, 40.85]} \ No newline at end of file diff --git a/annotations_filtered/vRXk74BCp-Q_filtered.json b/annotations_filtered/vRXk74BCp-Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1deb39b749994ac83ef588cc3c44d51d0ad719d0 --- /dev/null +++ b/annotations_filtered/vRXk74BCp-Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.43], [93.0, 98.2], [102.0, 103.74], [120.0, 120.58]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 30.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["fart", 66.06], ["music", 21.11], ["speech", 2.77]], null, null], "duration": [1.43, 5.2, 1.74, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/vR_L-yH_3jY_filtered.json b/annotations_filtered/vR_L-yH_3jY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da0cc36d8a090dd37a8a59419edb89a73edf4ae4 --- /dev/null +++ b/annotations_filtered/vR_L-yH_3jY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.95], [16.0, 16.5], [18.0, 18.55], [24.0, 24.54], [31.0, 30.81], [33.0, 33.69], [37.0, 37.45], [39.0, 40.19], [42.0, 42.31], [49.0, 51.14], [53.0, 53.08], [54.0, 55.0], [58.0, 58.36], [59.0, 65.13], [67.0, 70.95], [76.0, 76.96], [80.0, 81.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.51, 0.0, 0.0, 0.0, 70.02, 67.63, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.95, 0.5, 0.55, 0.54, -0.19, 0.69, 0.45, 1.19, 0.31, 2.14, 0.08, 1.0, 0.36, 6.13, 3.95, 0.96, 1.36]} \ No newline at end of file diff --git a/annotations_filtered/vRaCv5oNQ3w_filtered.json b/annotations_filtered/vRaCv5oNQ3w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f3557bb1073f308201132f2920d7fc9690eb19e --- /dev/null +++ b/annotations_filtered/vRaCv5oNQ3w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.57], [10.0, 10.34], [11.0, 15.53], [22.0, 25.2], [42.0, 42.55], [51.0, 53.67], [64.0, 64.76], [69.0, 72.52], [73.0, 72.57], [73.0, 74.24], [74.0, 80.37], [82.0, 83.47], [86.0, 86.81], [88.0, 88.21], [89.0, 90.29], [94.0, 95.17], [96.0, 103.89], [106.0, 105.8], [109.0, 115.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.5, 32.01, 0.0, 33.21, 0.0, 30.46, 0.0, 0.0, 79.59, 0.0, 0.0, 0.0, 0.0, 0.0, 33.71, 0.0, 33.7], "audiomae_on_audioset": [null, null, [["music", 84.18], ["speech", 6.5], ["synthesizer", 1.75]], [["music", 61.11], ["hum", 9.84], ["throbbing", 6.15]], null, [["music", 38.94], ["throbbing", 23.2], ["hum", 12.09]], null, [["music", 60.29], ["musical instrument", 6.79], ["percussion", 5.09]], null, null, null, null, null, null, null, null, [["music", 63.88], ["musical instrument", 6.94], ["speech", 5.95]], null, [["music", 55.67], ["speech", 16.84], ["synthesizer", 4.39]]], "duration": [0.57, 0.34, 4.53, 3.2, 0.55, 2.67, 0.76, 3.52, -0.43, 1.24, 6.37, 1.47, 0.81, 0.21, 1.29, 1.17, 7.89, -0.2, 6.16]} \ No newline at end of file diff --git a/annotations_filtered/vSBQt-6fDr8_filtered.json b/annotations_filtered/vSBQt-6fDr8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..365b5e5fe06a02b8e0c7092401420bb6d65defe8 --- /dev/null +++ b/annotations_filtered/vSBQt-6fDr8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[54.0, 54.36], [55.0, 55.46], [62.0, 62.01], [65.0, 65.5], [66.0, 67.05], [68.0, 68.17], [69.0, 70.51], [72.0, 72.44], [74.0, 76.11], [77.0, 79.05], [81.0, 81.63], [83.0, 85.02], [102.0, 109.04], [111.0, 111.35], [112.0, 114.61], [117.0, 121.66], [122.0, 121.69], [122.0, 121.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.28, 64.18, 0.0, 59.96, 58.55, 0.0, 71.29, 51.6, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.36, 0.46, 0.01, 0.5, 1.05, 0.17, 1.51, 0.44, 2.11, 2.05, 0.63, 2.02, 7.04, 0.35, 2.61, 4.66, -0.31, -0.14]} \ No newline at end of file diff --git a/annotations_filtered/vSjkkQ6Bfc4_filtered.json b/annotations_filtered/vSjkkQ6Bfc4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f8736bfcda82154eaa16e3a2fb3dcb9301b50ac --- /dev/null +++ b/annotations_filtered/vSjkkQ6Bfc4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.23], [12.0, 13.14], [14.0, 15.11], [20.0, 22.44], [27.0, 40.44], [42.0, 53.42], [54.0, 58.09], [64.0, 64.99], [69.0, 71.39], [82.0, 84.97], [85.0, 85.65], [86.0, 88.05], [90.0, 92.7]], "keep_status": [false, false, false, false, false, true, false, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 42.98, 37.4, 36.71, 38.11, 0.0, 35.64, 34.85, 0.0, 35.44, 36.02], "audiomae_on_audioset": [null, null, null, [["music", 60.2], ["guitar", 8.87], ["effects unit", 6.08]], [["music", 38.17], ["speech", 32.37], ["inside, small room", 4.96]], [["music", 23.59], ["mechanisms", 22.66], ["gears", 14.02]], [["music", 55.44], ["theremin", 19.74], ["speech", 4.36]], null, [["frog", 23.29], ["music", 17.45], ["mains hum", 16.42]], [["mains hum", 24.61], ["speech", 19.75], ["music", 19.53]], null, [["mains hum", 42.89], ["hum", 25.34], ["music", 10.39]], [["music", 54.6], ["scary music", 7.37], ["gong", 5.19]]], "duration": [0.23, 1.14, 1.11, 2.44, 13.44, 11.42, 4.09, 0.99, 2.39, 2.97, 0.65, 2.05, 2.7]} \ No newline at end of file diff --git a/annotations_filtered/vSt6OezOAwg_filtered.json b/annotations_filtered/vSt6OezOAwg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb8daf9909a7723841f9275c509e5249f267783e --- /dev/null +++ b/annotations_filtered/vSt6OezOAwg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 15.72], [16.0, 17.25], [18.0, 24.53], [32.0, 35.87], [36.0, 38.38], [39.0, 43.01], [45.0, 48.44], [50.0, 50.87]], "keep_status": [false, false, false, false, true, true, false, false], "silence_prob": [32.85, 0.0, 67.76, 88.28, 36.7, 39.31, 60.05, 0.0], "audiomae_on_audioset": [[["speech", 58.66], ["hum", 9.29], ["hiccup", 6.91]], null, null, null, [["speech", 34.23], ["whale vocalization", 10.65], ["wail, moan", 6.16]], [["pant", 29.09], ["groan", 12.22], ["grunt", 10.36]], null, null], "duration": [6.72, 1.25, 6.53, 3.87, 2.38, 4.01, 3.44, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/vT3QXNKoZKw_filtered.json b/annotations_filtered/vT3QXNKoZKw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1abeda8a16fd7a29ca6042bb27e562c7fbf786db --- /dev/null +++ b/annotations_filtered/vT3QXNKoZKw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 14.55], [15.0, 21.14], [22.0, 22.79], [25.0, 28.88], [30.0, 30.65], [34.0, 39.45], [48.0, 50.63], [53.0, 57.94], [61.0, 63.26], [64.0, 65.4], [66.0, 69.48], [73.0, 73.4], [75.0, 91.94], [93.0, 95.62], [96.0, 102.56], [104.0, 105.26]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, false], "silence_prob": [100.0, 99.36, 0.0, 100.0, 0.0, 100.0, 98.27, 48.74, 94.37, 0.0, 79.94, 0.0, 37.0, 38.67, 35.15, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 47.25], ["speech", 19.66], ["singing bowl", 2.2]], null, null, null, null, [["music", 53.08], ["synthesizer", 15.47], ["musical instrument", 3.99]], [["music", 57.38], ["didgeridoo", 6.68], ["synthesizer", 5.05]], [["music", 58.41], ["theremin", 6.15], ["ambient music", 5.27]], null], "duration": [8.55, 6.14, 0.79, 3.88, 0.65, 5.45, 2.63, 4.94, 2.26, 1.4, 3.48, 0.4, 16.94, 2.62, 6.56, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/vT4HrbzMVgI_filtered.json b/annotations_filtered/vT4HrbzMVgI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87717d048953fe357256a5d0bc48532bac50f8df --- /dev/null +++ b/annotations_filtered/vT4HrbzMVgI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 94.73]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [93.73]} \ No newline at end of file diff --git a/annotations_filtered/vT6xS0mRapg_filtered.json b/annotations_filtered/vT6xS0mRapg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1cbebe6b4edafa08c6e69d0bbbe1f3a5c2415b64 --- /dev/null +++ b/annotations_filtered/vT6xS0mRapg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.38], [7.0, 8.41], [34.0, 34.3], [45.0, 46.16], [49.0, 49.45], [54.0, 55.19], [70.0, 77.33], [85.0, 85.31], [88.0, 88.7], [93.0, 93.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.87, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.38, 1.41, 0.3, 1.16, 0.45, 1.19, 7.33, 0.31, 0.7, 0.41]} \ No newline at end of file diff --git a/annotations_filtered/vTSmbMm7MDg_filtered.json b/annotations_filtered/vTSmbMm7MDg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f19eeb81ebb586a382835ed15a3be1e0856ba622 --- /dev/null +++ b/annotations_filtered/vTSmbMm7MDg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.26], [11.0, 10.96], [11.0, 11.5], [13.0, 13.88], [15.0, 16.5], [51.0, 51.07], [56.0, 56.39], [94.0, 94.14], [114.0, 114.17], [153.0, 153.47], [162.0, 162.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.26, -0.04, 0.5, 0.88, 1.5, 0.07, 0.39, 0.14, 0.17, 0.47, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/vTTzWRdAN4M_filtered.json b/annotations_filtered/vTTzWRdAN4M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26ff529c41c5e086332535c56c4bb79eaeeefca2 --- /dev/null +++ b/annotations_filtered/vTTzWRdAN4M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.86], [11.0, 11.5], [16.0, 17.52], [24.0, 24.63], [26.0, 26.42], [27.0, 49.6], [55.0, 55.81], [61.0, 65.57], [68.0, 69.53], [73.0, 74.9], [78.0, 79.54], [80.0, 80.22], [85.0, 85.24], [90.0, 95.86], [97.0, 97.66], [100.0, 100.75], [109.0, 109.58], [111.0, 111.5], [114.0, 121.17], [135.0, 135.18], [143.0, 146.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [55.46, 0.0, 0.0, 0.0, 0.0, 56.03, 0.0, 56.93, 0.0, 0.0, 0.0, 0.0, 0.0, 31.29, 0.0, 0.0, 0.0, 0.0, 91.3, 0.0, 52.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 54.77], ["fart", 10.43], ["creak", 8.47]], null, null, null, null, null, null, null], "duration": [5.86, 0.5, 1.52, 0.63, 0.42, 22.6, 0.81, 4.57, 1.53, 1.9, 1.54, 0.22, 0.24, 5.86, 0.66, 0.75, 0.58, 0.5, 7.17, 0.18, 3.96]} \ No newline at end of file diff --git a/annotations_filtered/vTeY6H581pg_filtered.json b/annotations_filtered/vTeY6H581pg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0ffef94218a8361be9a8b8b0a986b13039da7ef --- /dev/null +++ b/annotations_filtered/vTeY6H581pg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.8], [5.0, 6.91], [7.0, 12.99], [14.0, 15.52], [33.0, 33.0], [33.0, 36.61], [37.0, 38.92], [45.0, 44.88], [54.0, 54.9], [57.0, 56.88], [62.0, 63.12], [70.0, 71.31], [79.0, 78.97], [84.0, 87.83], [95.0, 95.98], [98.0, 99.18], [104.0, 104.36], [105.0, 105.54], [108.0, 108.4], [109.0, 110.05], [111.0, 114.29], [136.0, 135.94], [142.0, 142.69], [143.0, 144.8], [164.0, 170.21], [171.0, 173.08], [178.0, 178.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 85.17, 0.0, 0.0, 76.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.89, 0.0, 0.0, 0.0, 75.39, 69.47, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.8, 1.91, 5.99, 1.52, 0.0, 3.61, 1.92, -0.12, 0.9, -0.12, 1.12, 1.31, -0.03, 3.83, 0.98, 1.18, 0.36, 0.54, 0.4, 1.05, 3.29, -0.06, 0.69, 1.8, 6.21, 2.08, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/vTy2bx3jmrs_filtered.json b/annotations_filtered/vTy2bx3jmrs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8ea7065068ce7546b57271ce5c783143aab26f4 --- /dev/null +++ b/annotations_filtered/vTy2bx3jmrs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.47], [15.0, 15.87], [17.0, 20.97], [22.0, 22.55], [23.0, 25.44], [26.0, 27.46], [28.0, 28.9], [30.0, 31.21], [32.0, 33.78], [35.0, 35.75], [36.0, 38.5], [39.0, 41.66], [43.0, 43.61], [44.0, 44.42], [45.0, 44.96], [45.0, 47.6], [49.0, 51.56], [54.0, 56.39], [57.0, 58.35], [60.0, 73.35], [74.0, 75.81], [78.0, 79.78], [80.0, 79.86], [80.0, 79.93], [80.0, 80.74], [85.0, 85.53], [87.0, 87.69], [92.0, 92.23], [93.0, 93.26], [93.0, 93.43], [93.0, 93.46], [93.0, 96.5], [98.0, 103.55], [107.0, 107.82], [111.0, 119.08], [120.0, 124.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.9, 0.0, 99.99, 0.0, 99.1, 0.0, 0.0, 0.0, 0.0, 0.0, 96.04, 99.91, 0.0, 0.0, 0.0, 92.31, 99.71, 99.82, 0.0, 99.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.11, 99.95, 0.0, 91.47, 98.73], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.47, 0.87, 3.97, 0.55, 2.44, 1.46, 0.9, 1.21, 1.78, 0.75, 2.5, 2.66, 0.61, 0.42, -0.04, 2.6, 2.56, 2.39, 1.35, 13.35, 1.81, 1.78, -0.14, -0.07, 0.74, 0.53, 0.69, 0.23, 0.26, 0.43, 0.46, 3.5, 5.55, 0.82, 8.08, 4.46]} \ No newline at end of file diff --git a/annotations_filtered/vU1_EJh6Atc_filtered.json b/annotations_filtered/vU1_EJh6Atc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79d40a76a535738eb5b8f63a1dbd670b6b1eb1bd --- /dev/null +++ b/annotations_filtered/vU1_EJh6Atc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 43.17]], "keep_status": [false], "silence_prob": [33.22], "audiomae_on_audioset": [[["music", 70.28], ["hum", 4.58], ["electronic music", 4.49]]], "duration": [7.17]} \ No newline at end of file diff --git a/annotations_filtered/vUbnqySPN8E_filtered.json b/annotations_filtered/vUbnqySPN8E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fedca087910de4860dc17240d4fca622da160e5 --- /dev/null +++ b/annotations_filtered/vUbnqySPN8E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.65], [6.0, 7.21], [11.0, 14.84], [15.0, 16.92], [18.0, 19.72], [22.0, 23.25], [24.0, 25.51], [27.0, 27.06], [28.0, 29.27], [30.0, 35.88], [37.0, 40.81], [43.0, 54.73], [55.0, 57.75], [58.0, 63.53], [65.0, 71.31], [74.0, 76.74], [78.0, 100.84], [106.0, 105.71], [106.0, 109.02], [111.0, 117.32], [122.0, 126.98], [133.0, 133.37], [135.0, 140.75], [143.0, 143.26], [145.0, 153.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 97.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 100.0, 100.0, 100.0, 100.0, 100.0, 100.0, 65.67, 0.0, 46.57, 59.42, 58.3, 0.0, 59.15, 0.0, 60.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.33], ["speech", 11.86], ["ambient music", 2.97]], null, null, null, null, null, null], "duration": [0.65, 1.21, 3.84, 1.92, 1.72, 1.25, 1.51, 0.06, 1.27, 5.88, 3.81, 11.73, 2.75, 5.53, 6.31, 2.74, 22.84, -0.29, 3.02, 6.32, 4.98, 0.37, 5.75, 0.26, 8.94]} \ No newline at end of file diff --git a/annotations_filtered/vUgs2O7Okqc_filtered.json b/annotations_filtered/vUgs2O7Okqc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aebf7077ad4938dfa1744094ecc741cd8eef92f3 --- /dev/null +++ b/annotations_filtered/vUgs2O7Okqc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.99], [8.0, 9.37], [10.0, 11.75], [13.0, 14.55], [17.0, 19.89], [22.0, 22.49], [25.0, 26.52], [27.0, 29.13], [36.0, 37.71], [38.0, 40.98], [42.0, 42.6], [45.0, 48.61], [54.0, 56.34], [61.0, 63.15], [64.0, 67.12], [70.0, 71.29], [73.0, 73.4], [74.0, 76.18], [78.0, 79.44], [80.0, 81.97], [85.0, 87.59], [91.0, 92.16], [95.0, 95.77], [97.0, 98.58], [100.0, 101.71]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 72.46, 0.0, 0.0, 34.72, 0.0, 62.17, 0.0, 95.78, 59.42, 59.96, 51.82, 0.0, 0.0, 74.44, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 31.47], ["didgeridoo", 22.45], ["boing", 9.84]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.99, 1.37, 1.75, 1.55, 2.89, 0.49, 1.52, 2.13, 1.71, 2.98, 0.6, 3.61, 2.34, 2.15, 3.12, 1.29, 0.4, 2.18, 1.44, 1.97, 2.59, 1.16, 0.77, 1.58, 1.71]} \ No newline at end of file diff --git a/annotations_filtered/vUrgn1Vm86I_filtered.json b/annotations_filtered/vUrgn1Vm86I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a1bd1de1cd973b1d1577153b787e83e25af5b0e --- /dev/null +++ b/annotations_filtered/vUrgn1Vm86I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.3], [4.0, 5.86], [10.0, 15.97], [17.0, 19.99], [20.0, 20.44], [22.0, 22.47], [26.0, 28.83], [31.0, 34.32], [35.0, 35.61], [37.0, 36.83], [37.0, 38.74], [40.0, 49.08], [50.0, 80.35], [86.0, 110.47], [117.0, 119.18], [120.0, 123.6], [124.0, 124.92], [126.0, 126.99], [128.0, 129.03], [130.0, 131.25], [132.0, 132.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [85.35, 0.0, 79.76, 52.68, 0.0, 0.0, 97.11, 93.76, 0.0, 0.0, 0.0, 71.14, 0.0, 32.78, 32.28, 42.86, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["electric shaver, electric razor", 25.03], ["mains hum", 19.98], ["music", 14.31]], [["music", 54.16], ["throbbing", 11.69], ["speech", 5.45]], [["speech", 65.24], ["music", 7.26], ["hum", 5.49]], null, null, null, null, null], "duration": [2.3, 1.86, 5.97, 2.99, 0.44, 0.47, 2.83, 3.32, 0.61, -0.17, 1.74, 9.08, 30.35, 24.47, 2.18, 3.6, 0.92, 0.99, 1.03, 1.25, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/vUuAbRVVZwA_filtered.json b/annotations_filtered/vUuAbRVVZwA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75c9c1595a226dc14b31e1745dc2e6faf958ca21 --- /dev/null +++ b/annotations_filtered/vUuAbRVVZwA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 9.27], [10.0, 12.6], [16.0, 16.87], [18.0, 21.83], [25.0, 26.45], [29.0, 31.35], [36.0, 36.14], [38.0, 39.58], [44.0, 49.54], [50.0, 50.8], [52.0, 52.76], [55.0, 55.71], [58.0, 62.36], [63.0, 65.37], [66.0, 67.54], [69.0, 72.69], [74.0, 79.14], [83.0, 92.23], [94.0, 95.71], [98.0, 98.24], [100.0, 105.66], [107.0, 109.09], [110.0, 116.24], [117.0, 118.23], [119.0, 121.34], [122.0, 130.84], [133.0, 148.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [97.33, 79.76, 0.0, 92.31, 0.0, 91.64, 0.0, 0.0, 84.98, 0.0, 0.0, 0.0, 78.21, 72.46, 0.0, 96.66, 100.0, 99.91, 0.0, 0.0, 40.79, 99.98, 45.11, 0.0, 98.66, 56.25, 70.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 45.7], ["musical instrument", 19.08], ["synthesizer", 5.86]], null, [["sonar", 43.69], ["music", 20.59], ["electronic music", 5.5]], null, null, null, null], "duration": [8.27, 2.6, 0.87, 3.83, 1.45, 2.35, 0.14, 1.58, 5.54, 0.8, 0.76, 0.71, 4.36, 2.37, 1.54, 3.69, 5.14, 9.23, 1.71, 0.24, 5.66, 2.09, 6.24, 1.23, 2.34, 8.84, 15.14]} \ No newline at end of file diff --git a/annotations_filtered/vUzF61mtilA_filtered.json b/annotations_filtered/vUzF61mtilA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fd3547092448d027435301e1cde33c2756a8765 --- /dev/null +++ b/annotations_filtered/vUzF61mtilA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 29.59], [32.0, 43.63], [47.0, 48.03], [49.0, 50.5], [53.0, 53.65], [54.0, 57.54], [58.0, 59.1], [62.0, 63.34], [65.0, 74.22], [77.0, 89.88], [91.0, 95.01], [95.0, 95.27], [95.0, 101.68], [104.0, 117.76], [124.0, 124.53], [125.0, 125.64], [127.0, 138.1], [141.0, 141.62], [145.0, 154.94], [159.0, 172.08], [175.0, 175.05], [176.0, 177.79], [181.0, 182.02]], "keep_status": [true, true, false, false, false, false, false, false, true, true, true, false, false, true, false, false, true, false, false, true, false, false, false], "silence_prob": [32.51, 30.04, 0.0, 0.0, 0.0, 37.3, 0.0, 0.0, 30.52, 31.97, 30.49, 0.0, 30.23, 29.58, 0.0, 0.0, 29.93, 0.0, 30.78, 30.1, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 42.73], ["speech", 20.78], ["electronic music", 4.51]], [["music", 25.5], ["buzz", 18.66], ["speech", 8.9]], null, null, null, [["music", 53.77], ["speech", 12.18], ["synthesizer", 6.19]], null, null, [["livestock, farm animals, working animals", 39.61], ["cattle, bovinae", 14.18], ["vehicle", 10.29]], [["music", 25.17], ["livestock, farm animals, working animals", 23.74], ["throbbing", 13.51]], [["music", 33.03], ["hum", 20.16], ["throbbing", 16.67]], null, [["speech", 52.12], ["music", 24.83], ["noise", 4.49]], [["speech", 22.13], ["hum", 20.52], ["music", 17.22]], null, null, [["hum", 21.68], ["music", 18.55], ["mains hum", 14.75]], null, [["music", 77.09], ["fly, housefly", 4.06], ["speech", 2.0]], [["speech", 28.07], ["music", 24.9], ["hum", 12.76]], null, null, null], "duration": [2.59, 11.63, 1.03, 1.5, 0.65, 3.54, 1.1, 1.34, 9.22, 12.88, 4.01, 0.27, 6.68, 13.76, 0.53, 0.64, 11.1, 0.62, 9.94, 13.08, 0.05, 1.79, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/vV30irsal-w_filtered.json b/annotations_filtered/vV30irsal-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab139bd736ce85627af832322724fc5cb03ceab9 --- /dev/null +++ b/annotations_filtered/vV30irsal-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 30.43], [31.0, 37.67], [46.0, 46.45], [47.0, 48.15], [60.0, 60.35], [66.0, 65.85], [91.0, 90.93], [95.0, 95.67], [103.0, 106.71], [107.0, 107.99], [109.0, 109.63], [111.0, 111.77], [112.0, 114.96], [128.0, 130.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 32.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.15, 0.0, 0.0, 0.0, 43.66, 88.1], "audiomae_on_audioset": [null, [["music", 72.42], ["speech", 9.55], ["boing", 4.08]], null, null, null, null, null, null, null, null, null, null, [["music", 53.08], ["guitar", 4.73], ["chirp tone", 4.09]], null], "duration": [0.43, 6.67, 0.45, 1.15, 0.35, -0.15, -0.07, 0.67, 3.71, 0.99, 0.63, 0.77, 2.96, 2.3]} \ No newline at end of file diff --git a/annotations_filtered/vV3RTL40nmw_filtered.json b/annotations_filtered/vV3RTL40nmw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd18ced690dce8b48e29228d4e6a5e9ca9031525 --- /dev/null +++ b/annotations_filtered/vV3RTL40nmw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.93], [16.0, 17.46], [19.0, 19.75], [20.0, 30.55], [37.0, 36.78], [39.0, 41.84], [42.0, 43.44], [45.0, 47.24], [49.0, 53.18], [54.0, 54.13], [63.0, 64.1], [65.0, 66.12], [67.0, 68.39], [70.0, 70.87], [71.0, 78.36], [82.0, 82.85], [83.0, 83.94], [88.0, 88.59], [90.0, 90.37], [91.0, 92.08], [95.0, 95.44], [96.0, 103.27], [104.0, 106.51], [108.0, 118.47], [119.0, 137.62], [138.0, 138.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [62.17, 0.0, 0.0, 69.47, 0.0, 68.28, 0.0, 72.16, 63.74, 0.0, 0.0, 0.0, 0.0, 0.0, 64.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.51, 68.02, 66.88, 66.63, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.93, 1.46, 0.75, 10.55, -0.22, 2.84, 1.44, 2.24, 4.18, 0.13, 1.1, 1.12, 1.39, 0.87, 7.36, 0.85, 0.94, 0.59, 0.37, 1.08, 0.44, 7.27, 2.51, 10.47, 18.62, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/vVPtQKHiWwM_filtered.json b/annotations_filtered/vVPtQKHiWwM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c46aef5a446da71163a0a161e25e2e98c146b90 --- /dev/null +++ b/annotations_filtered/vVPtQKHiWwM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.51], [19.0, 19.89], [25.0, 26.11], [27.0, 29.25], [30.0, 31.6], [33.0, 33.35], [35.0, 35.8], [36.0, 36.58], [37.0, 38.01], [38.0, 38.99], [39.0, 41.32], [42.0, 42.8], [44.0, 44.19], [46.0, 47.46], [49.0, 49.5], [52.0, 53.69], [55.0, 56.27], [58.0, 59.17], [61.0, 62.94], [64.0, 65.31], [68.0, 70.71], [75.0, 79.07], [81.0, 83.39], [84.0, 84.11], [85.0, 86.54], [87.0, 88.13], [88.0, 102.49], [105.0, 107.35], [109.0, 111.35], [113.0, 114.45], [116.0, 117.09], [119.0, 120.93], [122.0, 129.25]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [47.05, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 60.23, 99.56, 0.0, 0.0, 0.0, 32.62, 82.25, 67.13, 0.0, 0.0, 0.0, 43.05], "audiomae_on_audioset": [[["music", 55.48], ["speech", 10.42], ["musical instrument", 3.08]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 50.41], ["music", 6.24], ["buzz", 2.81]], null, null, null, null, null, [["music", 69.44], ["theremin", 6.6], ["cello", 3.79]]], "duration": [3.51, 0.89, 1.11, 2.25, 1.6, 0.35, 0.8, 0.58, 1.01, 0.99, 2.32, 0.8, 0.19, 1.46, 0.5, 1.69, 1.27, 1.17, 1.94, 1.31, 2.71, 4.07, 2.39, 0.11, 1.54, 1.13, 14.49, 2.35, 2.35, 1.45, 1.09, 1.93, 7.25]} \ No newline at end of file diff --git a/annotations_filtered/vVRPMleD1SI_filtered.json b/annotations_filtered/vVRPMleD1SI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e4c6da06cbd15e3746c0b2383af2efbab781819 --- /dev/null +++ b/annotations_filtered/vVRPMleD1SI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.31], [13.0, 20.61], [22.0, 32.91], [35.0, 40.39], [40.0, 53.15], [55.0, 56.42], [59.0, 59.9], [61.0, 61.32], [63.0, 63.1], [66.0, 66.55], [67.0, 67.71], [68.0, 69.45], [73.0, 73.87], [74.0, 78.71], [80.0, 83.24], [85.0, 86.97], [88.0, 89.45], [91.0, 92.18], [95.0, 98.68], [99.0, 100.04], [102.0, 104.79], [107.0, 114.72], [117.0, 120.95], [121.0, 126.52], [129.0, 132.93], [136.0, 147.34]], "keep_status": [true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [46.22, 46.4, 41.74, 41.03, 50.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.16, 63.96, 0.0, 0.0, 0.0, 58.55, 0.0, 97.0, 57.64, 64.07, 49.31, 45.27, 38.5], "audiomae_on_audioset": [[["music", 43.24], ["speech", 18.3], ["theremin", 6.68]], [["music", 39.93], ["theremin", 18.11], ["bird", 7.75]], [["music", 48.29], ["theremin", 7.63], ["bird", 6.09]], [["theremin", 37.79], ["music", 17.37], ["speech", 9.32]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.89], ["speech", 23.31], ["animal", 6.32]], [["music", 41.68], ["speech", 14.77], ["keyboard (musical)", 9.26]], [["music", 46.69], ["theremin", 9.19], ["keyboard (musical)", 6.77]]], "duration": [2.31, 7.61, 10.91, 5.39, 13.15, 1.42, 0.9, 0.32, 0.1, 0.55, 0.71, 1.45, 0.87, 4.71, 3.24, 1.97, 1.45, 1.18, 3.68, 1.04, 2.79, 7.72, 3.95, 5.52, 3.93, 11.34]} \ No newline at end of file diff --git a/annotations_filtered/vVjfW-P5yZY_filtered.json b/annotations_filtered/vVjfW-P5yZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..032115d3dba65037a7d6b3b11baa44000d1b683e --- /dev/null +++ b/annotations_filtered/vVjfW-P5yZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.89], [17.0, 17.56], [19.0, 21.15], [22.0, 22.82], [27.0, 27.48], [29.0, 28.61], [31.0, 31.55], [32.0, 35.01], [35.0, 45.23], [46.0, 48.15], [48.0, 56.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 69.07, 0.0, 0.0, 0.0, 0.0, 59.33, 66.39, 67.25, 57.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.89, 0.56, 2.15, 0.82, 0.48, -0.39, 0.55, 3.01, 10.23, 2.15, 8.94]} \ No newline at end of file diff --git a/annotations_filtered/vVmZO3W0I1A_filtered.json b/annotations_filtered/vVmZO3W0I1A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5d530ba03d214ae8099d8566773192dfd1788c7 --- /dev/null +++ b/annotations_filtered/vVmZO3W0I1A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.42], [18.0, 18.77], [20.0, 21.1], [23.0, 23.43], [25.0, 25.22], [27.0, 27.33], [28.0, 42.8], [44.0, 47.43], [48.0, 53.03], [54.0, 58.28], [59.0, 68.89], [76.0, 77.77], [79.0, 80.96], [83.0, 86.83], [88.0, 89.7], [92.0, 95.79], [98.0, 99.2], [101.0, 101.73], [116.0, 118.05], [123.0, 124.66], [127.0, 127.18], [128.0, 140.44], [140.0, 140.51]], "keep_status": [true, false, false, false, false, false, false, true, true, true, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [49.31, 0.0, 0.0, 0.0, 0.0, 0.0, 33.6, 39.47, 30.32, 32.5, 31.37, 0.0, 0.0, 30.9, 0.0, 31.48, 0.0, 0.0, 33.36, 0.0, 0.0, 30.37, 0.0], "audiomae_on_audioset": [[["music", 26.05], ["throbbing", 12.83], ["speech", 7.55]], null, null, null, null, null, [["hum", 44.5], ["throbbing", 20.49], ["music", 13.34]], [["music", 24.73], ["hum", 18.96], ["throbbing", 10.69]], [["breaking", 42.29], ["music", 12.5], ["smash, crash", 10.31]], [["boing", 26.66], ["thunk", 13.04], ["speech", 12.39]], [["throbbing", 44.51], ["music", 30.47], ["hum", 18.83]], null, null, [["speech", 47.1], ["music", 17.42], ["explosion", 5.46]], null, [["speech", 37.83], ["breaking", 34.62], ["smash, crash", 9.84]], null, null, [["foghorn", 50.7], ["music", 17.34], ["hum", 8.89]], null, null, [["music", 37.02], ["throbbing", 31.29], ["speech", 15.18]], null], "duration": [2.42, 0.77, 1.1, 0.43, 0.22, 0.33, 14.8, 3.43, 5.03, 4.28, 9.89, 1.77, 1.96, 3.83, 1.7, 3.79, 1.2, 0.73, 2.05, 1.66, 0.18, 12.44, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/vVqCU0iWlFM_filtered.json b/annotations_filtered/vVqCU0iWlFM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fa867295e4f26ef6a37036d5007a1023a4813cb --- /dev/null +++ b/annotations_filtered/vVqCU0iWlFM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.78], [2.0, 34.06], [36.0, 67.85], [69.0, 138.65], [139.0, 152.39], [163.0, 164.0], [175.0, 189.46]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 99.9], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [1.78, 32.06, 31.85, 69.65, 13.39, 1.0, 14.46]} \ No newline at end of file diff --git a/annotations_filtered/vW4TOsL7e3M_filtered.json b/annotations_filtered/vW4TOsL7e3M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3992a749b7b9274fe95b6f642d1243e4056c4afb --- /dev/null +++ b/annotations_filtered/vW4TOsL7e3M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.11], [33.0, 33.64], [38.0, 45.89], [47.0, 49.99], [51.0, 53.52], [55.0, 55.63], [57.0, 56.94], [60.0, 62.34], [66.0, 68.27], [69.0, 69.6], [71.0, 72.03], [73.0, 74.11], [81.0, 82.07], [84.0, 85.65], [89.0, 90.91], [92.0, 92.55], [96.0, 97.6], [98.0, 99.54], [102.0, 104.45], [105.0, 108.21], [111.0, 114.13]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 30.78, 44.55, 74.13, 0.0, 0.0, 81.89, 76.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.14, 36.28, 51.18], "audiomae_on_audioset": [null, null, [["music", 75.97], ["musical instrument", 7.54], ["guitar", 3.82]], [["fly, housefly", 22.14], ["insect", 16.25], ["music", 13.9]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.79], ["hum", 16.59], ["mains hum", 6.99]], null], "duration": [1.11, 0.64, 7.89, 2.99, 2.52, 0.63, -0.06, 2.34, 2.27, 0.6, 1.03, 1.11, 1.07, 1.65, 1.91, 0.55, 1.6, 1.54, 2.45, 3.21, 3.13]} \ No newline at end of file diff --git a/annotations_filtered/vW7-H-GGYwk_filtered.json b/annotations_filtered/vW7-H-GGYwk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8282f8aee7c58a380f6bb49924db86dd412602f7 --- /dev/null +++ b/annotations_filtered/vW7-H-GGYwk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 21.74], [25.0, 25.3], [25.0, 38.47], [40.0, 40.83], [47.0, 53.22], [57.0, 71.19], [75.0, 81.24], [82.0, 121.54], [122.0, 122.25]], "keep_status": [false, false, true, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 32.1, 0.0, 31.74, 31.64, 32.77, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 36.41], ["hum", 13.7], ["speech", 11.75]], null, [["music", 36.5], ["hum", 18.92], ["mains hum", 14.66]], [["music", 27.86], ["speech", 15.74], ["vehicle", 13.16]], [["hum", 27.03], ["music", 19.09], ["speech", 16.08]], null, null], "duration": [-0.26, 0.3, 13.47, 0.83, 6.22, 14.19, 6.24, 39.54, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/vWZapP8b11s_filtered.json b/annotations_filtered/vWZapP8b11s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20022c58ffbaf7dbecb3a3e153a43362c2bfa881 --- /dev/null +++ b/annotations_filtered/vWZapP8b11s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.92], [7.0, 9.04], [11.0, 17.0], [18.0, 20.11], [22.0, 23.7], [26.0, 27.48], [41.0, 40.76], [48.0, 51.34], [52.0, 53.49], [55.0, 55.63], [58.0, 58.4], [69.0, 69.82], [75.0, 77.01], [82.0, 83.94], [85.0, 86.95], [89.0, 94.36], [97.0, 100.25], [101.0, 102.54], [105.0, 108.06], [108.0, 114.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.01, 88.28, 76.7, 0.0, 0.0, 0.0, 83.88, 0.0, 0.0, 0.0, 0.0, 95.51, 0.0, 0.0, 72.16, 81.35, 0.0, 75.39, 84.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.92, 2.04, 6.0, 2.11, 1.7, 1.48, -0.24, 3.34, 1.49, 0.63, 0.4, 0.82, 2.01, 1.94, 1.95, 5.36, 3.25, 1.54, 3.06, 6.94]} \ No newline at end of file diff --git a/annotations_filtered/vWkJPL2Dt9A_filtered.json b/annotations_filtered/vWkJPL2Dt9A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8154a3c75e0149f1c24b225aa0e0dc26900a8dcf --- /dev/null +++ b/annotations_filtered/vWkJPL2Dt9A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.01], [3.0, 4.8], [5.0, 6.86], [8.0, 10.12], [13.0, 14.59], [19.0, 21.36], [23.0, 24.63], [26.0, 28.56], [32.0, 33.74], [37.0, 40.69], [46.0, 47.7], [49.0, 53.6], [54.0, 56.91], [58.0, 89.28], [92.0, 93.14], [95.0, 97.33], [100.0, 100.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 73.82, 0.0, 100.0, 0.0, 100.0, 0.0, 94.37, 0.0, 99.62, 100.0, 0.0, 0.0, 99.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.01, 1.8, 1.86, 2.12, 1.59, 2.36, 1.63, 2.56, 1.74, 3.69, 1.7, 4.6, 2.91, 31.28, 1.14, 2.33, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/vWyPfvAbUOQ_filtered.json b/annotations_filtered/vWyPfvAbUOQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4677d78e6b95f92e69723bd783bc337b4f3b2a94 --- /dev/null +++ b/annotations_filtered/vWyPfvAbUOQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.03], [7.0, 8.04], [10.0, 10.39], [12.0, 12.8], [16.0, 16.44], [20.0, 21.09], [25.0, 26.2], [29.0, 29.27], [29.0, 29.86], [31.0, 34.06], [37.0, 37.37], [38.0, 38.62], [40.0, 44.54], [47.0, 48.57], [49.0, 52.39]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.84, 0.0, 0.0, 88.28, 0.0, 46.15], "audiomae_on_audioset": [[["mosquito", 19.57], ["insect", 15.01], ["fly, housefly", 13.89]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 37.13], ["mosquito", 26.05], ["fly, housefly", 7.95]]], "duration": [2.03, 1.04, 0.39, 0.8, 0.44, 1.09, 1.2, 0.27, 0.86, 3.06, 0.37, 0.62, 4.54, 1.57, 3.39]} \ No newline at end of file diff --git a/annotations_filtered/vXLLH1eSOZE_filtered.json b/annotations_filtered/vXLLH1eSOZE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd4cb354517ce15fe4f3ff4ebcc3049e1efb59ae --- /dev/null +++ b/annotations_filtered/vXLLH1eSOZE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 24.85], [25.0, 24.95], [25.0, 25.41], [27.0, 27.36], [30.0, 42.72], [44.0, 66.34], [68.0, 68.81], [71.0, 71.91], [81.0, 85.24]], "keep_status": [true, false, false, false, true, false, false, false, true], "silence_prob": [30.75, 0.0, 0.0, 0.0, 32.25, 30.44, 0.0, 0.0, 30.01], "audiomae_on_audioset": [[["speech", 25.66], ["music", 21.38], ["didgeridoo", 21.08]], null, null, null, [["speech", 37.68], ["noise", 14.7], ["music", 10.6]], [["music", 31.07], ["speech", 30.73], ["hum", 9.38]], null, null, [["explosion", 15.49], ["jet engine", 10.09], ["vehicle", 7.02]]], "duration": [2.85, -0.05, 0.41, 0.36, 12.72, 22.34, 0.81, 0.91, 4.24]} \ No newline at end of file diff --git a/annotations_filtered/vXNr2xtv09Y_filtered.json b/annotations_filtered/vXNr2xtv09Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4673d42a126ad1aa8031ab3343cf16aebc47a329 --- /dev/null +++ b/annotations_filtered/vXNr2xtv09Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.88], [16.0, 17.36], [20.0, 21.84], [23.0, 22.77], [24.0, 31.06], [36.0, 36.86], [38.0, 39.75], [41.0, 42.8], [43.0, 50.77], [52.0, 58.09], [61.0, 62.41], [64.0, 65.55], [67.0, 67.64], [70.0, 71.34], [72.0, 73.57], [76.0, 76.81], [80.0, 81.5], [83.0, 84.08], [86.0, 85.94], [87.0, 91.12], [94.0, 97.61], [100.0, 100.18], [101.0, 101.43], [103.0, 102.96], [106.0, 106.52], [107.0, 108.31], [111.0, 111.52], [113.0, 116.92], [118.0, 118.79], [120.0, 121.49], [122.0, 123.28], [124.0, 126.27]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 47.66, 0.0, 0.0, 0.0, 99.99, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.44, 97.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.13, 0.0, 0.0, 0.0, 99.52], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 26.79], ["chirp tone", 24.87], ["sine wave", 10.87]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.88, 1.36, 1.84, -0.23, 7.06, 0.86, 1.75, 1.8, 7.77, 6.09, 1.41, 1.55, 0.64, 1.34, 1.57, 0.81, 1.5, 1.08, -0.06, 4.12, 3.61, 0.18, 0.43, -0.04, 0.52, 1.31, 0.52, 3.92, 0.79, 1.49, 1.28, 2.27]} \ No newline at end of file diff --git a/annotations_filtered/vXQlXYcAksI_filtered.json b/annotations_filtered/vXQlXYcAksI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7baa237a980bc10f4ff5669138932cdbc28597cc --- /dev/null +++ b/annotations_filtered/vXQlXYcAksI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.78], [8.0, 15.89], [16.0, 16.01], [16.0, 17.14], [20.0, 20.97], [23.0, 23.73], [27.0, 27.43], [31.0, 30.91], [32.0, 61.15], [69.0, 69.2], [70.0, 70.77], [79.0, 79.57], [81.0, 81.57], [84.0, 84.15], [102.0, 101.82]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 38.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 40.17], ["hum", 15.1], ["throbbing", 8.76]], null, null, null, null, null, null, [["music", 26.77], ["hum", 22.87], ["throbbing", 10.95]], null, null, null, null, null, null], "duration": [0.78, 7.89, 0.01, 1.14, 0.97, 0.73, 0.43, -0.09, 29.15, 0.2, 0.77, 0.57, 0.57, 0.15, -0.18]} \ No newline at end of file diff --git a/annotations_filtered/vXXDqjLe4Ls_filtered.json b/annotations_filtered/vXXDqjLe4Ls_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f819ee69bde2940340a4f2c4aaa314caee9e75c8 --- /dev/null +++ b/annotations_filtered/vXXDqjLe4Ls_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.7], [5.0, 5.85], [6.0, 6.37], [9.0, 9.58], [11.0, 11.25], [14.0, 14.35], [15.0, 15.84], [16.0, 18.28], [20.0, 20.29], [20.0, 22.18], [24.0, 23.85], [29.0, 29.96], [31.0, 36.46], [38.0, 37.71], [46.0, 47.78], [49.0, 54.89], [56.0, 56.13], [62.0, 63.27], [67.0, 69.04], [70.0, 70.75], [76.0, 83.76], [89.0, 90.64], [91.0, 155.93], [157.0, 159.78], [164.0, 165.21], [166.0, 170.26], [172.0, 180.98], [181.0, 184.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.76, 0.0, 51.82, 0.0, 0.0, 57.97, 0.0, 0.0, 46.15, 0.0, 0.0, 64.41, 0.0, 99.05, 0.0, 0.0, 47.62, 0.0, 76.04, 90.25, 61.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mouse", 20.68], ["speech", 16.12], ["animal", 12.98]], null, null, null, null, null, null, null, [["music", 46.79], ["theremin", 11.92], ["musical instrument", 4.04]], null, null, null, null], "duration": [0.7, 0.85, 0.37, 0.58, 0.25, 0.35, 0.84, 2.28, 0.29, 2.18, -0.15, 0.96, 5.46, -0.29, 1.78, 5.89, 0.13, 1.27, 2.04, 0.75, 7.76, 1.64, 64.93, 2.78, 1.21, 4.26, 8.98, 3.05]} \ No newline at end of file diff --git a/annotations_filtered/vXsKVaJTQCA_filtered.json b/annotations_filtered/vXsKVaJTQCA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd8be79e5d46c4b5d0dbe412446987f2f918e2de --- /dev/null +++ b/annotations_filtered/vXsKVaJTQCA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.89], [11.0, 11.6], [12.0, 14.05], [15.0, 15.18], [20.0, 20.55], [21.0, 22.15], [23.0, 23.31], [27.0, 27.28], [33.0, 33.39], [45.0, 46.9], [49.0, 49.64], [55.0, 56.91], [58.0, 58.31], [60.0, 60.99], [63.0, 62.95], [69.0, 69.35], [73.0, 73.11], [76.0, 76.67], [79.0, 79.15], [81.0, 80.89], [82.0, 83.39], [85.0, 87.94], [90.0, 89.9], [90.0, 90.88], [93.0, 93.51], [95.0, 95.81], [96.0, 96.85], [100.0, 100.52], [101.0, 101.61], [102.0, 103.4], [107.0, 107.76], [111.0, 111.06], [119.0, 122.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 90.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 0.6, 2.05, 0.18, 0.55, 1.15, 0.31, 0.28, 0.39, 1.9, 0.64, 1.91, 0.31, 0.99, -0.05, 0.35, 0.11, 0.67, 0.15, -0.11, 1.39, 2.94, -0.1, 0.88, 0.51, 0.81, 0.85, 0.52, 0.61, 1.4, 0.76, 0.06, 3.84]} \ No newline at end of file diff --git a/annotations_filtered/vY04JLQa1MQ_filtered.json b/annotations_filtered/vY04JLQa1MQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..358bddc2dc23e2bbc292613ded2c6a0433d36c9c --- /dev/null +++ b/annotations_filtered/vY04JLQa1MQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.57], [8.0, 8.72], [15.0, 15.36], [22.0, 24.14], [25.0, 26.37], [31.0, 31.36], [32.0, 32.22], [32.0, 37.67], [39.0, 59.21], [64.0, 64.45], [68.0, 68.27], [74.0, 74.48], [76.0, 75.88], [77.0, 77.06], [78.0, 78.39], [83.0, 82.95], [85.0, 85.01], [91.0, 91.25], [97.0, 97.68], [102.0, 102.02], [109.0, 109.02], [114.0, 113.85], [115.0, 115.23], [121.0, 121.78], [125.0, 124.7], [128.0, 128.53], [129.0, 129.59], [130.0, 131.36], [132.0, 132.44], [135.0, 137.29], [139.0, 143.55], [145.0, 145.17], [146.0, 146.18], [147.0, 147.19], [148.0, 150.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 70.72, 87.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 100.0, 0.0, 0.0, 0.0, 98.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.57, 0.72, 0.36, 2.14, 1.37, 0.36, 0.22, 5.67, 20.21, 0.45, 0.27, 0.48, -0.12, 0.06, 0.39, -0.05, 0.01, 0.25, 0.68, 0.02, 0.02, -0.15, 0.23, 0.78, -0.3, 0.53, 0.59, 1.36, 0.44, 2.29, 4.55, 0.17, 0.18, 0.19, 2.69]} \ No newline at end of file diff --git a/annotations_filtered/vYH5urNq1Ao_filtered.json b/annotations_filtered/vYH5urNq1Ao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c12148993523f5235da56689d07d43bc61e57b34 --- /dev/null +++ b/annotations_filtered/vYH5urNq1Ao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.68], [9.0, 9.91], [13.0, 14.69], [16.0, 20.53], [23.0, 23.75], [24.0, 25.27], [32.0, 33.22], [34.0, 35.6], [37.0, 37.76], [40.0, 40.49], [44.0, 53.91], [57.0, 58.58], [70.0, 71.83], [75.0, 74.76], [78.0, 79.83], [82.0, 82.51], [85.0, 88.16], [89.0, 89.83], [94.0, 95.0], [98.0, 98.27], [102.0, 102.51], [104.0, 106.78], [110.0, 116.24], [120.0, 121.1], [122.0, 122.12], [123.0, 123.48], [125.0, 128.8], [133.0, 133.1], [135.0, 145.25], [146.0, 149.99], [151.0, 154.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 54.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.78, 0.0, 0.0, 0.0, 0.0, 0.0, 51.99, 0.0, 0.0, 0.0, 0.0, 52.56, 98.36, 0.0, 0.0, 0.0, 54.9, 0.0, 48.35, 83.52, 81.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 44.39], ["music", 17.79], ["mains hum", 12.76]], null, null], "duration": [1.68, 0.91, 1.69, 4.53, 0.75, 1.27, 1.22, 1.6, 0.76, 0.49, 9.91, 1.58, 1.83, -0.24, 1.83, 0.51, 3.16, 0.83, 1.0, 0.27, 0.51, 2.78, 6.24, 1.1, 0.12, 0.48, 3.8, 0.1, 10.25, 3.99, 3.01]} \ No newline at end of file diff --git a/annotations_filtered/vYafR-6wNGE_filtered.json b/annotations_filtered/vYafR-6wNGE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3d02f549cb6386a053ab5a212b10b10ab7fbf8a --- /dev/null +++ b/annotations_filtered/vYafR-6wNGE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.12], [2.0, 2.78], [4.0, 4.01], [5.0, 6.78], [10.0, 11.96], [14.0, 15.75], [17.0, 17.12], [18.0, 19.48], [21.0, 22.94], [23.0, 24.17], [25.0, 26.65], [28.0, 28.7], [31.0, 32.44], [33.0, 33.4], [35.0, 35.28], [37.0, 38.79], [40.0, 40.73], [41.0, 65.47], [67.0, 67.54], [71.0, 71.68], [72.0, 73.4], [75.0, 75.95], [77.0, 77.84], [83.0, 84.69], [90.0, 92.37], [94.0, 96.23], [103.0, 103.3], [104.0, 105.51], [112.0, 113.21], [113.0, 114.37], [115.0, 116.58], [119.0, 120.16], [124.0, 124.6], [125.0, 125.42], [127.0, 128.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.12, 0.78, 0.01, 1.78, 1.96, 1.75, 0.12, 1.48, 1.94, 1.17, 1.65, 0.7, 1.44, 0.4, 0.28, 1.79, 0.73, 24.47, 0.54, 0.68, 1.4, 0.95, 0.84, 1.69, 2.37, 2.23, 0.3, 1.51, 1.21, 1.37, 1.58, 1.16, 0.6, 0.42, 1.9]} \ No newline at end of file diff --git a/annotations_filtered/vYm_2A_cg0Y_filtered.json b/annotations_filtered/vYm_2A_cg0Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43369ed4fd6b5dd89c6cf3a09021706fbfc9c199 --- /dev/null +++ b/annotations_filtered/vYm_2A_cg0Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.13], [6.0, 6.81], [10.0, 12.16], [16.0, 27.41], [28.0, 46.5], [47.0, 47.48], [50.0, 49.99], [52.0, 99.35], [101.0, 101.19]], "keep_status": [false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 90.08, 40.48, 38.82, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 30.61], ["sidetone", 24.74], ["music", 11.49]], [["music", 32.14], ["throbbing", 23.87], ["electronic music", 13.12]], null, null, null, null], "duration": [1.13, 0.81, 2.16, 11.41, 18.5, 0.48, -0.01, 47.35, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/vYtc_bS47oM_filtered.json b/annotations_filtered/vYtc_bS47oM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..928641d69acaa1d4085ec96f43b010e589345988 --- /dev/null +++ b/annotations_filtered/vYtc_bS47oM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 15.72], [17.0, 25.68], [27.0, 28.8], [31.0, 31.43], [34.0, 36.31], [41.0, 42.06], [45.0, 45.47], [46.0, 46.99], [48.0, 48.07], [49.0, 49.77], [53.0, 55.61], [60.0, 61.5], [64.0, 64.27], [65.0, 66.97], [80.0, 80.57], [85.0, 86.22], [87.0, 87.81], [90.0, 90.96], [95.0, 94.83], [97.0, 97.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [87.37, 97.43, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 60.62], ["fart", 3.77], ["inside, small room", 3.44]], null, null, null, null, null, null, null, null, null], "duration": [6.72, 8.68, 1.8, 0.43, 2.31, 1.06, 0.47, 0.99, 0.07, 0.77, 2.61, 1.5, 0.27, 1.97, 0.57, 1.22, 0.81, 0.96, -0.17, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/vZ3nHOtlQiU_filtered.json b/annotations_filtered/vZ3nHOtlQiU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..939ed6a0844082a2f05e8ee9ddfef0f8105ea351 --- /dev/null +++ b/annotations_filtered/vZ3nHOtlQiU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.88], [12.0, 13.76], [15.0, 17.39], [18.0, 22.84], [27.0, 42.65], [43.0, 43.95], [46.0, 90.61], [92.0, 95.52], [97.0, 102.39], [104.0, 114.93], [118.0, 118.67], [120.0, 121.12], [122.0, 128.51], [129.0, 129.95], [131.0, 130.94]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 58.38, 62.89, 37.26, 0.0, 0.0, 36.69, 35.79, 28.49, 0.0, 0.0, 30.31, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 29.39], ["speech", 13.9], ["fly, housefly", 10.26]], null, null, [["music", 54.32], ["throbbing", 16.14], ["hum", 10.06]], [["music", 52.89], ["hum", 17.17], ["throbbing", 14.95]], [["music", 50.12], ["rumble", 7.83], ["hum", 4.99]], null, null, [["speech", 55.78], ["fart", 11.77], ["groan", 6.05]], null, null], "duration": [1.88, 1.76, 2.39, 4.84, 15.65, 0.95, 44.61, 3.52, 5.39, 10.93, 0.67, 1.12, 6.51, 0.95, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/vZHS1nXJaGU_filtered.json b/annotations_filtered/vZHS1nXJaGU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76678287cc892954e70af1b6693093dcd44167d7 --- /dev/null +++ b/annotations_filtered/vZHS1nXJaGU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 17.88], [22.0, 22.05], [32.0, 35.63], [38.0, 43.68], [46.0, 46.31], [47.0, 47.01], [48.0, 48.91], [55.0, 55.68], [59.0, 59.98], [64.0, 65.37], [65.0, 65.5], [66.0, 66.97], [68.0, 68.59], [87.0, 87.51], [91.0, 95.3], [97.0, 98.37]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 40.34, 39.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.52, 0.0], "audiomae_on_audioset": [null, null, [["whale vocalization", 24.41], ["speech", 16.8], ["rumble", 15.63]], [["whale vocalization", 70.8], ["hum", 8.21], ["noise", 6.56]], null, null, null, null, null, null, null, null, null, null, [["chirp tone", 18.34], ["sine wave", 13.58], ["music", 9.81]], null], "duration": [-0.12, 0.05, 3.63, 5.68, 0.31, 0.01, 0.91, 0.68, 0.98, 1.37, 0.5, 0.97, 0.59, 0.51, 4.3, 1.37]} \ No newline at end of file diff --git a/annotations_filtered/vZKaVV0ZyFs_filtered.json b/annotations_filtered/vZKaVV0ZyFs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f291517f8a9fb0cb49afba9c3c66405b74b815ba --- /dev/null +++ b/annotations_filtered/vZKaVV0ZyFs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.41], [16.0, 17.32], [22.0, 45.08], [48.0, 63.44], [63.0, 64.35], [66.0, 77.53], [78.0, 79.98], [85.0, 85.04], [89.0, 98.46], [103.0, 104.97], [105.0, 106.61], [118.0, 130.44], [133.0, 133.62], [134.0, 141.98], [149.0, 148.83], [150.0, 157.1], [159.0, 181.13], [187.0, 187.15], [188.0, 188.35], [191.0, 195.4], [197.0, 200.6], [201.0, 207.33], [208.0, 208.2]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, true, false, false, false, false, false, true, true, true, false], "silence_prob": [0.0, 0.0, 30.6, 29.12, 0.0, 31.45, 0.0, 0.0, 31.87, 0.0, 0.0, 31.64, 0.0, 30.57, 0.0, 34.64, 33.09, 0.0, 0.0, 31.45, 31.1, 31.26, 0.0], "audiomae_on_audioset": [null, null, [["music", 62.95], ["hum", 5.15], ["synthesizer", 4.65]], [["music", 36.56], ["hum", 22.94], ["mains hum", 14.78]], null, [["groan", 27.14], ["whack, thwack", 26.86], ["music", 10.47]], null, null, [["whack, thwack", 47.87], ["speech", 33.02], ["thunk", 5.86]], null, null, [["mosquito", 23.52], ["fly, housefly", 15.81], ["noise", 14.8]], null, [["whack, thwack", 54.55], ["music", 8.95], ["speech", 6.19]], null, [["whack, thwack", 49.83], ["smash, crash", 10.38], ["music", 10.1]], [["music", 57.81], ["boing", 8.07], ["fart", 6.67]], null, null, [["fly, housefly", 17.51], ["music", 14.0], ["speech", 9.35]], [["speech", 35.88], ["vehicle", 10.6], ["music", 9.97]], [["electric shaver, electric razor", 34.33], ["speech", 20.23], ["vehicle", 5.75]], null], "duration": [1.41, 1.32, 23.08, 15.44, 1.35, 11.53, 1.98, 0.04, 9.46, 1.97, 1.61, 12.44, 0.62, 7.98, -0.17, 7.1, 22.13, 0.15, 0.35, 4.4, 3.6, 6.33, 0.2]} \ No newline at end of file diff --git a/annotations_filtered/vZlWLj1-eC4_filtered.json b/annotations_filtered/vZlWLj1-eC4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50a25ef4af449c05055ed18ac04d9899f396ac00 --- /dev/null +++ b/annotations_filtered/vZlWLj1-eC4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.64], [7.0, 7.6], [11.0, 11.4], [12.0, 15.08], [23.0, 23.73], [29.0, 30.16], [32.0, 34.32], [41.0, 44.88], [46.0, 47.51], [51.0, 52.2], [68.0, 71.95], [72.0, 72.05], [76.0, 83.32], [109.0, 109.07], [111.0, 111.77], [113.0, 113.93], [116.0, 116.82], [125.0, 128.68], [130.0, 131.35], [133.0, 133.81], [139.0, 138.74], [140.0, 145.61], [149.0, 150.9], [152.0, 154.55], [159.0, 158.87], [173.0, 173.38], [175.0, 177.18]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.66, 0.0, 0.0, 36.34, 37.77, 0.0, 0.0, 34.14, 0.0, 33.44, 0.0, 0.0, 0.0, 0.0, 91.64, 0.0, 0.0, 0.0, 96.89, 0.0, 77.2, 0.0, 0.0, 74.13], "audiomae_on_audioset": [null, null, null, [["music", 38.04], ["musical instrument", 17.24], ["guitar", 14.78]], null, null, [["music", 71.97], ["guitar", 6.94], ["musical instrument", 5.06]], [["speech", 37.7], ["music", 14.82], ["musical instrument", 10.67]], null, null, [["music", 44.29], ["zither", 15.74], ["musical instrument", 6.63]], null, [["music", 47.13], ["zither", 8.57], ["pizzicato", 7.61]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.64, 0.6, 0.4, 3.08, 0.73, 1.16, 2.32, 3.88, 1.51, 1.2, 3.95, 0.05, 7.32, 0.07, 0.77, 0.93, 0.82, 3.68, 1.35, 0.81, -0.26, 5.61, 1.9, 2.55, -0.13, 0.38, 2.18]} \ No newline at end of file diff --git a/annotations_filtered/vZqr-1GJIAk_filtered.json b/annotations_filtered/vZqr-1GJIAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abe11393b41ecfc5fe0cc17982859ab4e5ddb690 --- /dev/null +++ b/annotations_filtered/vZqr-1GJIAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.43], [3.0, 3.43], [6.0, 6.62], [11.0, 11.4], [16.0, 16.48], [17.0, 17.36], [19.0, 19.55], [20.0, 20.68], [26.0, 27.6], [29.0, 30.72], [33.0, 33.18], [35.0, 38.21], [40.0, 41.59], [43.0, 44.46], [47.0, 48.68], [52.0, 53.28], [55.0, 55.51], [57.0, 57.59], [59.0, 60.07], [62.0, 63.59], [72.0, 71.9], [73.0, 74.33], [76.0, 76.55], [77.0, 77.26], [78.0, 80.2], [82.0, 82.11], [83.0, 93.06], [96.0, 110.0], [113.0, 119.57], [122.0, 127.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.55, 0.0, 58.22, 32.35, 31.93, 31.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 32.72], ["fly, housefly", 18.41], ["noise", 11.88]], [["cattle, bovinae", 48.85], ["moo", 22.57], ["livestock, farm animals, working animals", 8.18]], [["livestock, farm animals, working animals", 31.45], ["cattle, bovinae", 20.89], ["moo", 12.98]]], "duration": [0.43, 0.43, 0.62, 0.4, 0.48, 0.36, 0.55, 0.68, 1.6, 1.72, 0.18, 3.21, 1.59, 1.46, 1.68, 1.28, 0.51, 0.59, 1.07, 1.59, -0.1, 1.33, 0.55, 0.26, 2.2, 0.11, 10.06, 14.0, 6.57, 5.35]} \ No newline at end of file diff --git a/annotations_filtered/vZyIBlDO-E8_filtered.json b/annotations_filtered/vZyIBlDO-E8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf2e8ca2d684a165d14beecd0f7a5fd9c7b2304b --- /dev/null +++ b/annotations_filtered/vZyIBlDO-E8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 31.9], [33.0, 33.72], [40.0, 41.62], [43.0, 44.31], [64.0, 81.94], [88.0, 102.32], [108.0, 108.19], [110.0, 109.95], [110.0, 110.93], [115.0, 115.53], [116.0, 122.61], [128.0, 128.66]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [29.79, 0.0, 0.0, 0.0, 30.53, 29.39, 0.0, 0.0, 0.0, 0.0, 29.93, 0.0], "audiomae_on_audioset": [[["music", 62.94], ["throbbing", 6.61], ["electronic music", 2.62]], null, null, null, [["music", 43.54], ["theremin", 10.37], ["mosquito", 10.03]], [["music", 60.24], ["boing", 17.03], ["fart", 8.99]], null, null, null, null, [["cattle, bovinae", 42.79], ["livestock, farm animals, working animals", 26.0], ["moo", 22.47]], null], "duration": [7.9, 0.72, 1.62, 1.31, 17.94, 14.32, 0.19, -0.05, 0.93, 0.53, 6.61, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/v_R9dxNFKWY_filtered.json b/annotations_filtered/v_R9dxNFKWY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79c10cc13f0f8abb8803f4e6d955b92965029fe5 --- /dev/null +++ b/annotations_filtered/v_R9dxNFKWY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[75.0, 77.67], [79.0, 79.22], [82.0, 99.93], [101.0, 107.52], [108.0, 108.18], [111.0, 110.81], [112.0, 114.62], [115.0, 120.23], [121.0, 170.45], [171.0, 170.58], [171.0, 182.06]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [97.0, 0.0, 66.15, 54.36, 0.0, 0.0, 80.29, 31.29, 0.0, 0.0, 62.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["explosion", 22.46], ["sidetone", 16.4], ["music", 12.4]], null, null, null], "duration": [2.67, 0.22, 17.93, 6.52, 0.18, -0.19, 2.62, 5.23, 49.45, -0.42, 11.06]} \ No newline at end of file diff --git a/annotations_filtered/va6nRaZ9eRg_filtered.json b/annotations_filtered/va6nRaZ9eRg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d6852e6b37c9cd27f7aa66ea9a50aa9c09b0a23 --- /dev/null +++ b/annotations_filtered/va6nRaZ9eRg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.17], [6.0, 7.18], [8.0, 9.41], [12.0, 13.9], [18.0, 19.52], [23.0, 24.22], [25.0, 26.64], [27.0, 28.27], [36.0, 36.83], [50.0, 51.22], [70.0, 70.9], [81.0, 81.8], [89.0, 89.31], [113.0, 115.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [88.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.17, 1.18, 1.41, 1.9, 1.52, 1.22, 1.64, 1.27, 0.83, 1.22, 0.9, 0.8, 0.31, 2.87]} \ No newline at end of file diff --git a/annotations_filtered/vaCI48KHW1k_filtered.json b/annotations_filtered/vaCI48KHW1k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52f9476e9d27c39fd7b9db70811c88675de726d9 --- /dev/null +++ b/annotations_filtered/vaCI48KHW1k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 60.22]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [47.22]} \ No newline at end of file diff --git a/annotations_filtered/vaJ2yQC_ktY_filtered.json b/annotations_filtered/vaJ2yQC_ktY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..337a7cac4a4b0d3dee7ddfbef90d64f55d44cc26 --- /dev/null +++ b/annotations_filtered/vaJ2yQC_ktY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.24], [17.0, 17.58], [30.0, 31.99], [36.0, 39.75], [41.0, 43.38], [44.0, 45.52], [46.0, 46.57], [47.0, 49.08], [49.0, 50.06], [52.0, 56.03], [61.0, 61.59], [62.0, 63.56], [66.0, 71.9], [79.0, 86.46], [87.0, 87.35], [89.0, 90.37], [115.0, 118.69], [127.0, 130.37], [134.0, 134.7], [136.0, 138.32], [141.0, 142.52], [145.0, 145.2], [148.0, 148.96], [152.0, 154.85], [156.0, 158.14], [159.0, 160.62], [163.0, 163.26], [169.0, 169.62], [191.0, 192.82], [195.0, 202.44], [204.0, 205.58], [216.0, 220.65], [223.0, 222.67], [233.0, 232.88], [245.0, 246.1], [246.0, 255.88], [266.0, 269.27]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.7, 31.75, 0.0, 0.0, 39.89, 0.0, 38.03, 0.0, 0.0, 42.74, 46.15, 0.0, 0.0, 73.67, 99.8, 0.0, 80.64, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 77.03, 0.0, 59.15, 0.0, 0.0, 0.0, 95.64, 52.86], "audiomae_on_audioset": [null, null, null, [["moo", 28.24], ["cattle, bovinae", 20.63], ["livestock, farm animals, working animals", 12.16]], [["speech", 40.36], ["music", 33.03], ["boing", 4.54]], null, null, [["music", 30.19], ["speech", 16.47], ["musical instrument", 5.93]], null, [["boing", 56.26], ["ding", 15.87], ["clang", 12.33]], null, null, [["speech", 15.58], ["moo", 9.73], ["cattle, bovinae", 8.6]], [["grunt", 61.83], ["speech", 6.59], ["groan", 6.29]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, 0.58, 1.99, 3.75, 2.38, 1.52, 0.57, 2.08, 1.06, 4.03, 0.59, 1.56, 5.9, 7.46, 0.35, 1.37, 3.69, 3.37, 0.7, 2.32, 1.52, 0.2, 0.96, 2.85, 2.14, 1.62, 0.26, 0.62, 1.82, 7.44, 1.58, 4.65, -0.33, -0.12, 1.1, 9.88, 3.27]} \ No newline at end of file diff --git a/annotations_filtered/va_wuPBP5kA_filtered.json b/annotations_filtered/va_wuPBP5kA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0838448894bbf4d341df350fbf5297cb70b2cee --- /dev/null +++ b/annotations_filtered/va_wuPBP5kA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.72], [5.0, 4.95], [5.0, 12.02], [12.0, 13.34], [14.0, 15.57], [16.0, 17.42], [20.0, 21.37], [23.0, 23.52], [24.0, 25.47], [28.0, 27.94], [31.0, 32.49], [35.0, 35.45], [36.0, 41.08], [48.0, 48.84], [54.0, 55.38], [62.0, 62.72], [64.0, 64.74], [67.0, 68.5], [71.0, 73.84], [77.0, 77.01], [81.0, 81.36], [84.0, 87.05], [93.0, 152.78], [170.0, 174.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 0.0, 46.47, 0.0, 42.79], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 83.84], ["musical instrument", 5.69], ["plucked string instrument", 1.03]], null, [["music", 61.56], ["carnatic music", 11.01], ["musical instrument", 6.66]]], "duration": [0.72, -0.05, 7.02, 1.34, 1.57, 1.42, 1.37, 0.52, 1.47, -0.06, 1.49, 0.45, 5.08, 0.84, 1.38, 0.72, 0.74, 1.5, 2.84, 0.01, 0.36, 3.05, 59.78, 4.39]} \ No newline at end of file diff --git a/annotations_filtered/vagva7xKyE8_filtered.json b/annotations_filtered/vagva7xKyE8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c1f21c3a28c9cf8835e5a30ba579ed2e74e525a --- /dev/null +++ b/annotations_filtered/vagva7xKyE8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 25.91], [27.0, 41.4], [42.0, 42.13], [49.0, 49.23], [58.0, 58.02], [71.0, 70.97], [72.0, 72.5], [77.0, 79.62], [92.0, 94.36], [100.0, 100.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.93, 30.04, 0.0, 0.0, 0.0, 0.0, 0.0, 78.89, 97.73, 0.0], "audiomae_on_audioset": [[["music", 62.5], ["house music", 10.95], ["dance music", 5.59]], [["music", 83.39], ["house music", 6.86], ["dance music", 2.13]], null, null, null, null, null, null, null, null], "duration": [3.91, 14.4, 0.13, 0.23, 0.02, -0.03, 0.5, 2.62, 2.36, 0.11]} \ No newline at end of file diff --git a/annotations_filtered/vb2GzRckU9s_filtered.json b/annotations_filtered/vb2GzRckU9s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8a8b93708cd84124d1e0202f8a3036689af7ae2 --- /dev/null +++ b/annotations_filtered/vb2GzRckU9s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.53], [14.0, 13.93], [18.0, 21.44], [23.0, 27.87], [34.0, 35.34], [36.0, 38.03], [41.0, 42.55], [44.0, 50.16], [50.0, 51.22], [58.0, 59.34], [71.0, 71.91], [76.0, 76.6], [79.0, 79.96], [82.0, 82.68], [87.0, 88.3], [91.0, 90.75], [93.0, 93.43], [95.0, 95.44], [97.0, 97.01], [100.0, 100.25], [111.0, 111.69]], "keep_status": [true, false, true, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.37, 0.0, 37.43, 31.86, 0.0, 48.82, 0.0, 42.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["rumble", 19.49], ["hum", 17.91], ["mains hum", 17.14]], null, [["music", 20.12], ["hum", 16.98], ["rumble", 13.63]], [["speech", 75.92], ["music", 7.05], ["vehicle", 4.63]], null, [["buzz", 16.71], ["hum", 9.16], ["vehicle", 8.39]], null, [["hum", 28.94], ["speech", 24.54], ["mains hum", 10.67]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.53, -0.07, 3.44, 4.87, 1.34, 2.03, 1.55, 6.16, 1.22, 1.34, 0.91, 0.6, 0.96, 0.68, 1.3, -0.25, 0.43, 0.44, 0.01, 0.25, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/vbF4qz_-PCM_filtered.json b/annotations_filtered/vbF4qz_-PCM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7a07cc6e192f66f8765eb2ca12dee2e265cfa87 --- /dev/null +++ b/annotations_filtered/vbF4qz_-PCM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.49], [9.0, 12.63], [15.0, 19.31], [21.0, 20.92], [23.0, 26.43], [33.0, 33.84], [35.0, 36.15], [39.0, 39.24], [42.0, 42.28], [44.0, 45.2], [51.0, 50.63], [51.0, 51.56], [52.0, 52.79], [57.0, 60.12], [66.0, 67.31], [69.0, 69.33], [75.0, 74.76], [75.0, 75.91], [87.0, 87.45], [90.0, 90.58], [105.0, 105.51], [107.0, 107.87], [109.0, 113.02], [115.0, 115.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 100.0, 72.75, 0.0, 53.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.49, 3.63, 4.31, -0.08, 3.43, 0.84, 1.15, 0.24, 0.28, 1.2, -0.37, 0.56, 0.79, 3.12, 1.31, 0.33, -0.24, 0.91, 0.45, 0.58, 0.51, 0.87, 4.02, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/vbJsLuL2YzQ_filtered.json b/annotations_filtered/vbJsLuL2YzQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e77501ccf97047a4e00be4df5fb9076e59e6f80a --- /dev/null +++ b/annotations_filtered/vbJsLuL2YzQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.49], [15.0, 22.99], [24.0, 28.05], [29.0, 30.1], [34.0, 42.3], [43.0, 43.19], [44.0, 44.91], [48.0, 53.33], [54.0, 54.7], [56.0, 65.77], [67.0, 70.9], [75.0, 75.29], [76.0, 77.77], [79.0, 79.81], [82.0, 110.0], [111.0, 112.01], [114.0, 114.24], [119.0, 119.7], [123.0, 127.06]], "keep_status": [true, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [42.58, 44.01, 65.67, 0.0, 49.27, 0.0, 0.0, 40.61, 0.0, 34.3, 33.3, 0.0, 0.0, 0.0, 31.73, 0.0, 0.0, 0.0, 70.58], "audiomae_on_audioset": [[["music", 40.44], ["wild animals", 9.56], ["musical instrument", 9.01]], [["music", 61.21], ["speech", 5.36], ["synthesizer", 3.87]], null, null, [["frog", 60.75], ["croak", 12.52], ["music", 11.17]], null, null, [["frog", 82.23], ["music", 4.71], ["croak", 4.0]], null, [["music", 29.36], ["livestock, farm animals, working animals", 19.61], ["animal", 9.62]], [["music", 38.29], ["frog", 13.05], ["animal", 6.64]], null, null, null, [["music", 51.9], ["frog", 20.52], ["groan", 4.77]], null, null, null, null], "duration": [5.49, 7.99, 4.05, 1.1, 8.3, 0.19, 0.91, 5.33, 0.7, 9.77, 3.9, 0.29, 1.77, 0.81, 28.0, 1.01, 0.24, 0.7, 4.06]} \ No newline at end of file diff --git a/annotations_filtered/vbUTbqwKtEE_filtered.json b/annotations_filtered/vbUTbqwKtEE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74996ca678013700df6b026841818368c366f35d --- /dev/null +++ b/annotations_filtered/vbUTbqwKtEE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.81], [6.0, 7.08], [9.0, 12.73], [14.0, 15.4], [21.0, 21.56], [24.0, 30.05], [32.0, 42.63], [45.0, 46.8], [47.0, 49.05], [50.0, 53.92], [55.0, 69.99], [71.0, 82.07], [85.0, 89.5], [91.0, 92.2], [99.0, 107.37], [129.0, 129.37], [145.0, 144.9], [151.0, 154.21], [156.0, 157.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 99.87, 0.0, 0.0, 98.99, 71.87, 0.0, 62.58, 60.89, 32.82, 32.9, 29.66, 0.0, 35.37, 0.0, 0.0, 41.4, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 57.1], ["sonar", 16.11], ["hum", 4.4]], [["hum", 27.9], ["mains hum", 16.8], ["rumble", 15.87]], [["music", 20.85], ["gong", 7.79], ["synthesizer", 5.89]], null, [["music", 33.71], ["synthesizer", 23.52], ["musical instrument", 8.7]], null, null, [["music", 27.64], ["theremin", 13.32], ["synthesizer", 11.33]], null], "duration": [0.81, 1.08, 3.73, 1.4, 0.56, 6.05, 10.63, 1.8, 2.05, 3.92, 14.99, 11.07, 4.5, 1.2, 8.37, 0.37, -0.1, 3.21, 1.89]} \ No newline at end of file diff --git a/annotations_filtered/vcURIKX8710_filtered.json b/annotations_filtered/vcURIKX8710_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8595b42ec0d65cc415b4a6d5c38c6bb51d77185c --- /dev/null +++ b/annotations_filtered/vcURIKX8710_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 16.95], [18.0, 18.67], [26.0, 44.25], [48.0, 51.19], [57.0, 64.49], [66.0, 66.36], [69.0, 70.6], [72.0, 72.67], [73.0, 78.02], [89.0, 91.18], [92.0, 92.94], [100.0, 103.42], [108.0, 108.55], [113.0, 113.32], [122.0, 123.62]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [58.05, 0.0, 30.7, 30.26, 30.42, 0.0, 0.0, 0.0, 58.72, 59.51, 0.0, 73.51, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["throbbing", 22.38], ["speech", 21.92], ["hum", 16.58]], [["music", 44.95], ["speech", 14.06], ["throbbing", 12.93]], [["hum", 24.08], ["music", 20.05], ["speech", 15.78]], null, null, null, null, null, null, null, null, null, null], "duration": [2.95, 0.67, 18.25, 3.19, 7.49, 0.36, 1.6, 0.67, 5.02, 2.18, 0.94, 3.42, 0.55, 0.32, 1.62]} \ No newline at end of file diff --git a/annotations_filtered/vcdDRblTOmM_filtered.json b/annotations_filtered/vcdDRblTOmM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97a31888dc04ade63bd81a4867f4180b24100f87 --- /dev/null +++ b/annotations_filtered/vcdDRblTOmM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 17.88], [20.0, 27.53], [28.0, 47.31], [47.0, 85.48], [86.0, 85.72], [86.0, 115.99], [118.0, 124.93], [125.0, 128.16], [129.0, 129.0], [133.0, 133.76], [134.0, 138.65]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [29.5, 29.75, 29.42, 0.0, 0.0, 30.17, 28.89, 29.9, 0.0, 0.0, 29.87], "audiomae_on_audioset": [[["hum", 55.74], ["throbbing", 20.43], ["mains hum", 11.48]], [["throbbing", 48.16], ["hum", 40.92], ["music", 5.25]], [["music", 70.42], ["throbbing", 11.69], ["hum", 3.77]], null, null, [["hum", 52.25], ["mains hum", 39.36], ["throbbing", 2.53]], [["whip", 65.98], ["speech", 5.79], ["whoosh, swoosh, swish", 4.38]], [["music", 23.98], ["throbbing", 21.66], ["hum", 15.02]], null, null, [["hum", 51.73], ["mains hum", 20.44], ["throbbing", 4.16]]], "duration": [16.88, 7.53, 19.31, 38.48, -0.28, 29.99, 6.93, 3.16, 0.0, 0.76, 4.65]} \ No newline at end of file diff --git a/annotations_filtered/vcw4b2U_0nU_filtered.json b/annotations_filtered/vcw4b2U_0nU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/vcw4b2U_0nU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/vcxEgyiu16Q_filtered.json b/annotations_filtered/vcxEgyiu16Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d39409e84ac2fb3ddef79be81ebf2323e874d9c --- /dev/null +++ b/annotations_filtered/vcxEgyiu16Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.05], [10.0, 12.53], [13.0, 20.49], [21.0, 20.7], [21.0, 20.73], [21.0, 21.37], [22.0, 22.6], [25.0, 33.0], [35.0, 35.63], [36.0, 37.84], [40.0, 40.47], [41.0, 44.1], [45.0, 45.74], [51.0, 51.43], [53.0, 53.37], [54.0, 55.29], [56.0, 56.57], [58.0, 58.13], [60.0, 62.23], [64.0, 66.04], [67.0, 71.66], [72.0, 72.49], [74.0, 74.34], [76.0, 76.64], [78.0, 78.68], [79.0, 80.72], [83.0, 84.87], [86.0, 87.54], [89.0, 93.45], [100.0, 99.93], [103.0, 103.0], [103.0, 103.13], [103.0, 104.04], [108.0, 108.33], [112.0, 112.9], [118.0, 118.12], [121.0, 121.37], [125.0, 126.03], [128.0, 128.07], [129.0, 133.54], [135.0, 136.17]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.28, 32.0, 0.0, 0.0, 0.0, 0.0, 56.25, 0.0, 0.0, 0.0, 47.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.96, 50.41, 67.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.9, 0.0], "audiomae_on_audioset": [null, [["music", 21.76], ["whale vocalization", 12.35], ["didgeridoo", 11.31]], [["fly, housefly", 30.77], ["sine wave", 9.14], ["mosquito", 7.61]], null, null, null, null, null, null, null, null, [["whale vocalization", 42.16], ["sidetone", 19.62], ["speech", 13.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 48.52], ["throbbing", 25.11], ["mains hum", 11.44]], null], "duration": [0.05, 2.53, 7.49, -0.3, -0.27, 0.37, 0.6, 8.0, 0.63, 1.84, 0.47, 3.1, 0.74, 0.43, 0.37, 1.29, 0.57, 0.13, 2.23, 2.04, 4.66, 0.49, 0.34, 0.64, 0.68, 1.72, 1.87, 1.54, 4.45, -0.07, 0.0, 0.13, 1.04, 0.33, 0.9, 0.12, 0.37, 1.03, 0.07, 4.54, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/vdED1lRQ-N8_filtered.json b/annotations_filtered/vdED1lRQ-N8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f321cdffbb5c6def47d4a56f7c2620fa526e769e --- /dev/null +++ b/annotations_filtered/vdED1lRQ-N8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.96], [9.0, 9.31], [14.0, 14.27], [15.0, 15.42], [17.0, 17.79], [22.0, 23.03], [25.0, 26.06], [27.0, 30.37], [30.0, 30.47], [31.0, 32.56], [33.0, 33.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.04, 0.31, 0.27, 0.42, 0.79, 1.03, 1.06, 3.37, 0.47, 1.56, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/vdHBsWXaHN8_filtered.json b/annotations_filtered/vdHBsWXaHN8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3db45bfbe59fa279bc84cbfa6d266a72f1faa759 --- /dev/null +++ b/annotations_filtered/vdHBsWXaHN8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.18], [7.0, 8.9], [10.0, 16.73], [19.0, 20.58], [25.0, 25.76], [30.0, 32.76], [35.0, 40.22]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [31.77, 0.0, 34.61, 0.0, 0.0, 34.56, 30.76], "audiomae_on_audioset": [[["music", 75.34], ["musical instrument", 2.4], ["hum", 1.89]], null, [["music", 88.51], ["guitar", 2.54], ["musical instrument", 1.71]], null, null, [["music", 88.11], ["synthesizer", 0.93], ["throbbing", 0.88]], [["music", 88.62], ["hum", 2.27], ["throbbing", 1.64]]], "duration": [2.18, 1.9, 6.73, 1.58, 0.76, 2.76, 5.22]} \ No newline at end of file diff --git a/annotations_filtered/vdMEu03CjTk_filtered.json b/annotations_filtered/vdMEu03CjTk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5920e0e82fd7165e44ed3eaf3f43216a9335583e --- /dev/null +++ b/annotations_filtered/vdMEu03CjTk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 27.03], [28.0, 65.15], [67.0, 82.22], [84.0, 85.08], [86.0, 87.61], [89.0, 90.69], [93.0, 93.38], [99.0, 100.14], [102.0, 102.32], [104.0, 105.09], [106.0, 106.95], [109.0, 111.15], [113.0, 114.08], [115.0, 116.9], [119.0, 120.46], [122.0, 124.39], [128.0, 127.63], [130.0, 130.99], [133.0, 134.05], [135.0, 136.59], [137.0, 138.05], [141.0, 140.8], [149.0, 155.6], [156.0, 157.65], [159.0, 161.76]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.67, 0.0, 0.0, 0.0, 66.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.37, 0.0, 84.98], "audiomae_on_audioset": [null, null, [["music", 17.53], ["hum", 16.68], ["breaking", 9.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.03, 37.15, 15.22, 1.08, 1.61, 1.69, 0.38, 1.14, 0.32, 1.09, 0.95, 2.15, 1.08, 1.9, 1.46, 2.39, -0.37, 0.99, 1.05, 1.59, 1.05, -0.2, 6.6, 1.65, 2.76]} \ No newline at end of file diff --git a/annotations_filtered/vdbQpDHAq5U_filtered.json b/annotations_filtered/vdbQpDHAq5U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4516d98d2580c8a839375ce842a3df7691f46b73 --- /dev/null +++ b/annotations_filtered/vdbQpDHAq5U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.81], [8.0, 9.27], [12.0, 13.66], [16.0, 16.66], [27.0, 28.11]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.81, 1.27, 1.66, 0.66, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/vdnA-ESWcPs_filtered.json b/annotations_filtered/vdnA-ESWcPs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4d74bb780ed3de30e07bfca3c642317461406d0 --- /dev/null +++ b/annotations_filtered/vdnA-ESWcPs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[63.0, 81.36], [83.0, 82.61], [84.0, 102.76], [104.0, 122.12]], "keep_status": [true, false, false, true], "silence_prob": [39.43, 0.0, 37.27, 36.63], "audiomae_on_audioset": [[["music", 56.76], ["musical instrument", 7.31], ["clarinet", 4.47]], null, [["music", 42.64], ["brass instrument", 16.8], ["musical instrument", 10.86]], [["music", 48.16], ["speech", 9.59], ["musical instrument", 6.02]]], "duration": [18.36, -0.39, 18.76, 18.12]} \ No newline at end of file diff --git a/annotations_filtered/vdpUDOxQ0ao_filtered.json b/annotations_filtered/vdpUDOxQ0ao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..768fba300d3fba996413e59c2492f38883912775 --- /dev/null +++ b/annotations_filtered/vdpUDOxQ0ao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.29], [10.0, 12.29], [13.0, 15.84], [19.0, 19.43], [20.0, 20.95], [23.0, 25.14], [28.0, 28.59], [30.0, 31.82], [40.0, 39.77], [42.0, 43.11], [44.0, 47.04], [48.0, 48.56], [49.0, 49.5], [51.0, 51.75], [53.0, 52.86], [54.0, 55.09]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.24, 35.59, 0.0, 0.0, 46.75, 0.0, 0.0, 0.0, 0.0, 57.32, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 28.99], ["speech", 8.38], ["civil defense siren", 6.9]], [["music", 71.92], ["guitar", 7.0], ["plucked string instrument", 3.68]], null, null, [["speech", 14.96], ["music", 10.02], ["sheep", 8.11]], null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 2.29, 2.84, 0.43, 0.95, 2.14, 0.59, 1.82, -0.23, 1.11, 3.04, 0.56, 0.5, 0.75, -0.14, 1.09]} \ No newline at end of file diff --git a/annotations_filtered/vdq609Xci-g_filtered.json b/annotations_filtered/vdq609Xci-g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..376ab5ef2c2d5849e06bb1add97d9ceac0427d03 --- /dev/null +++ b/annotations_filtered/vdq609Xci-g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.94], [14.0, 14.72], [28.0, 28.66], [35.0, 35.77], [40.0, 39.95], [43.0, 43.53], [45.0, 44.81], [48.0, 47.75], [59.0, 60.1], [61.0, 66.23], [67.0, 73.67], [74.0, 77.28], [80.0, 80.42], [82.0, 84.4], [86.0, 89.11], [90.0, 101.04], [103.0, 105.41], [107.0, 109.66], [113.0, 117.68], [119.0, 120.48], [121.0, 122.35], [123.0, 123.97], [125.0, 126.69]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, false, true, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.72, 46.68, 38.1, 0.0, 38.23, 45.65, 52.92, 59.68, 46.97, 39.93, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 26.44], ["throbbing", 23.68], ["hum", 13.48]], [["hum", 46.12], ["speech", 15.42], ["mains hum", 11.56]], [["music", 34.37], ["throbbing", 14.16], ["hum", 12.36]], null, [["music", 69.41], ["electronic music", 3.75], ["synthesizer", 2.26]], [["music", 49.04], ["throbbing", 10.36], ["hum", 9.16]], null, null, [["hum", 17.76], ["music", 16.13], ["thunk", 6.24]], [["music", 22.02], ["whack, thwack", 12.84], ["thunk", 10.18]], null, null, null, null], "duration": [-0.06, 0.72, 0.66, 0.77, -0.05, 0.53, -0.19, -0.25, 1.1, 5.23, 6.67, 3.28, 0.42, 2.4, 3.11, 11.04, 2.41, 2.66, 4.68, 1.48, 1.35, 0.97, 1.69]} \ No newline at end of file diff --git a/annotations_filtered/vdyYR85RNkk_filtered.json b/annotations_filtered/vdyYR85RNkk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10ea20dc44d2a88cad0bb658606d270aad589a8c --- /dev/null +++ b/annotations_filtered/vdyYR85RNkk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 13.0], [15.0, 18.25], [21.0, 23.68], [32.0, 34.16], [36.0, 36.61], [37.0, 58.19], [60.0, 59.7], [60.0, 72.99], [74.0, 75.27], [79.0, 80.28], [83.0, 82.9], [84.0, 86.12], [88.0, 88.42], [90.0, 96.58], [100.0, 101.24], [105.0, 120.01]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [87.55, 82.07, 99.91, 98.36, 0.0, 64.52, 0.0, 34.11, 0.0, 0.0, 0.0, 77.53, 0.0, 96.04, 0.0, 89.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 26.63], ["mains hum", 17.09], ["music", 11.56]], null, null, null, null, null, null, null, null], "duration": [6.0, 3.25, 2.68, 2.16, 0.61, 21.19, -0.3, 12.99, 1.27, 1.28, -0.1, 2.12, 0.42, 6.58, 1.24, 15.01]} \ No newline at end of file diff --git a/annotations_filtered/vejLIHky2HE_filtered.json b/annotations_filtered/vejLIHky2HE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b8f3de0e329697585a37964c0f6f7f094c682cb --- /dev/null +++ b/annotations_filtered/vejLIHky2HE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.62], [8.0, 10.96], [13.0, 14.07], [16.0, 17.07], [19.0, 28.66], [30.0, 31.53], [33.0, 34.4], [35.0, 37.07], [39.0, 40.29], [47.0, 47.51], [55.0, 55.56], [67.0, 69.89]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 49.97, 0.0, 0.0, 57.09, 0.0, 0.0, 60.79, 0.0, 0.0, 0.0, 58.72], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 13.97], ["moo", 12.77], ["music", 11.52]], null, null, null, null, null, null, null, null, null, null], "duration": [1.62, 2.96, 1.07, 1.07, 9.66, 1.53, 1.4, 2.07, 1.29, 0.51, 0.56, 2.89]} \ No newline at end of file diff --git a/annotations_filtered/veztNJQyRJg_filtered.json b/annotations_filtered/veztNJQyRJg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab3ae74db7288b82c8519006564603198479540e --- /dev/null +++ b/annotations_filtered/veztNJQyRJg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.4], [8.0, 12.56], [16.0, 16.17], [17.0, 18.37], [20.0, 23.14], [25.0, 36.09], [36.0, 36.12], [36.0, 36.37], [36.0, 38.15], [40.0, 44.39], [46.0, 69.97], [72.0, 72.79], [82.0, 82.71], [84.0, 85.48], [86.0, 86.8], [90.0, 120.19], [120.0, 120.43], [120.0, 120.46], [121.0, 122.01], [124.0, 124.19], [127.0, 127.62], [131.0, 136.49], [143.0, 143.73], [148.0, 149.47], [152.0, 176.34]], "keep_status": [false, true, false, false, false, true, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 40.31, 0.0, 0.0, 51.44, 37.42, 0.0, 0.0, 34.11, 36.44, 31.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.73, 0.0, 0.0, 32.91], "audiomae_on_audioset": [null, [["crushing", 15.45], ["fly, housefly", 14.05], ["insect", 5.71]], null, null, null, [["speech", 34.47], ["music", 17.09], ["microwave oven", 8.58]], null, null, [["creak", 25.08], ["chink, clink", 5.92], ["breaking", 5.33]], [["hum", 26.69], ["mains hum", 17.94], ["music", 15.13]], [["hammer", 30.1], ["music", 18.07], ["synthesizer", 17.42]], null, null, null, null, null, null, null, null, null, null, [["hum", 36.74], ["mains hum", 14.09], ["throbbing", 8.98]], null, null, [["speech", 58.79], ["knock", 4.11], ["glass", 3.49]]], "duration": [0.4, 4.56, 0.17, 1.37, 3.14, 11.09, 0.12, 0.37, 2.15, 4.39, 23.97, 0.79, 0.71, 1.48, 0.8, 30.19, 0.43, 0.46, 1.01, 0.19, 0.62, 5.49, 0.73, 1.47, 24.34]} \ No newline at end of file diff --git a/annotations_filtered/vf6PZfksmfg_filtered.json b/annotations_filtered/vf6PZfksmfg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..311e1be868c7ed1907620249433ce0f67e76422d --- /dev/null +++ b/annotations_filtered/vf6PZfksmfg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.31], [9.0, 9.17], [11.0, 11.31], [16.0, 15.84], [17.0, 17.66], [20.0, 20.7], [30.0, 30.77], [32.0, 32.36], [41.0, 41.89], [49.0, 50.08], [53.0, 54.23], [58.0, 58.11], [61.0, 62.14], [75.0, 75.25], [78.0, 79.83], [82.0, 82.7], [87.0, 87.47], [89.0, 89.65], [91.0, 92.1], [93.0, 94.26], [98.0, 98.36], [100.0, 100.6], [102.0, 103.05], [105.0, 106.02], [109.0, 110.2], [112.0, 113.21], [114.0, 114.88], [116.0, 116.67], [117.0, 125.36], [127.0, 127.67], [128.0, 129.36], [130.0, 132.92], [136.0, 138.27], [143.0, 148.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.99, 0.0, 0.0, 41.22, 33.7, 33.67], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 40.85], ["theremin", 33.83], ["foghorn", 6.19]], null, null, [["speech", 43.8], ["music", 23.0], ["hum", 4.14]], [["music", 67.65], ["effects unit", 7.3], ["musical instrument", 4.48]], [["music", 57.4], ["foghorn", 9.82], ["brass instrument", 6.68]]], "duration": [0.31, 0.17, 0.31, -0.16, 0.66, 0.7, 0.77, 0.36, 0.89, 1.08, 1.23, 0.11, 1.14, 0.25, 1.83, 0.7, 0.47, 0.65, 1.1, 1.26, 0.36, 0.6, 1.05, 1.02, 1.2, 1.21, 0.88, 0.67, 8.36, 0.67, 1.36, 2.92, 2.27, 5.12]} \ No newline at end of file diff --git a/annotations_filtered/vf6nfEZgorY_filtered.json b/annotations_filtered/vf6nfEZgorY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08bb61ac16d5d692068fc66d8a87a912733452d8 --- /dev/null +++ b/annotations_filtered/vf6nfEZgorY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 32.31], [33.0, 38.69]], "keep_status": [false, true], "silence_prob": [32.43, 30.9], "audiomae_on_audioset": [[["throbbing", 50.09], ["hum", 27.21], ["music", 9.53]], [["music", 17.39], ["vehicle", 13.05], ["hum", 6.56]]], "duration": [18.31, 5.69]} \ No newline at end of file diff --git a/annotations_filtered/vfIUYDjo8WM_filtered.json b/annotations_filtered/vfIUYDjo8WM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e6c1845229d751d8aeecd3c07a8b927d67dcb5f --- /dev/null +++ b/annotations_filtered/vfIUYDjo8WM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 46.47], [51.0, 59.51], [61.0, 61.23], [62.0, 72.23], [74.0, 90.48], [92.0, 134.69], [137.0, 138.65]], "keep_status": [false, false, false, true, true, false, false], "silence_prob": [0.0, 30.06, 0.0, 30.29, 30.47, 0.0, 0.0], "audiomae_on_audioset": [null, [["eruption", 46.0], ["speech", 14.62], ["explosion", 14.41]], null, [["speech", 45.17], ["music", 9.71], ["hum", 8.65]], [["music", 19.39], ["field recording", 12.42], ["buzz", 11.5]], null, null], "duration": [35.47, 8.51, 0.23, 10.23, 16.48, 42.69, 1.65]} \ No newline at end of file diff --git a/annotations_filtered/vfc3TGvcjEY_filtered.json b/annotations_filtered/vfc3TGvcjEY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7bbb0e807669657f5e3f5be9b8f71ef8f9bd134d --- /dev/null +++ b/annotations_filtered/vfc3TGvcjEY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[98.0, 104.14], [106.0, 108.14], [109.0, 110.17], [112.0, 113.27], [115.0, 116.46], [119.0, 120.33], [123.0, 123.3], [124.0, 132.49], [140.0, 169.53], [173.0, 184.5], [188.0, 195.91], [201.0, 202.63]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [35.52, 37.07, 0.0, 0.0, 0.0, 0.0, 0.0, 35.97, 30.28, 30.32, 31.46, 0.0], "audiomae_on_audioset": [[["music", 60.14], ["throbbing", 10.42], ["electronic music", 3.98]], [["music", 62.68], ["electronic music", 5.48], ["dubstep", 4.73]], null, null, null, null, null, [["music", 55.37], ["electronic music", 9.05], ["throbbing", 7.99]], [["music", 41.37], ["fart", 8.58], ["groan", 5.51]], [["music", 36.64], ["speech", 11.27], ["electronic music", 11.0]], [["music", 55.82], ["moo", 8.05], ["livestock, farm animals, working animals", 6.81]], null], "duration": [6.14, 2.14, 1.17, 1.27, 1.46, 1.33, 0.3, 8.49, 29.53, 11.5, 7.91, 1.63]} \ No newline at end of file diff --git a/annotations_filtered/vfutImUbN7M_filtered.json b/annotations_filtered/vfutImUbN7M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..653e9c58a52959cbd621e98940c512e39d380298 --- /dev/null +++ b/annotations_filtered/vfutImUbN7M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.48], [7.0, 8.28], [14.0, 15.26], [19.0, 20.97], [22.0, 23.45], [24.0, 24.66], [29.0, 29.76], [33.0, 33.64], [35.0, 35.4], [36.0, 36.96], [41.0, 41.37], [47.0, 47.55], [52.0, 53.05], [70.0, 71.29], [72.0, 76.45], [82.0, 83.1], [91.0, 93.82], [100.0, 100.36], [103.0, 102.93], [105.0, 107.43], [108.0, 108.62], [109.0, 110.76], [113.0, 113.16], [114.0, 114.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.72, 0.0, 38.98, 0.0, 0.0, 43.87, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.83], ["music", 15.24], ["mains hum", 5.2]], null, [["music", 66.96], ["musical instrument", 5.63], ["guitar", 3.42]], null, null, [["speech", 51.7], ["music", 9.25], ["keys jangling", 7.86]], null, null, null, null], "duration": [1.48, 1.28, 1.26, 1.97, 1.45, 0.66, 0.76, 0.64, 0.4, 0.96, 0.37, 0.55, 1.05, 1.29, 4.45, 1.1, 2.82, 0.36, -0.07, 2.43, 0.62, 1.76, 0.16, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/vg6-AbLe5nM_filtered.json b/annotations_filtered/vg6-AbLe5nM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a09c3c328d2f8fc1052794c11168f3a3396e2547 --- /dev/null +++ b/annotations_filtered/vg6-AbLe5nM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.74], [14.0, 14.77], [19.0, 19.6], [22.0, 22.1], [23.0, 24.06], [25.0, 25.12], [26.0, 27.24], [32.0, 33.02], [36.0, 41.88], [43.0, 43.98], [46.0, 48.74], [49.0, 51.63], [52.0, 53.0], [54.0, 55.05], [56.0, 57.75], [59.0, 59.88], [66.0, 66.24], [75.0, 75.54], [79.0, 79.74], [89.0, 90.24], [92.0, 92.57], [97.0, 97.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [54.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.74, 0.0, 71.72, 63.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.74, 0.77, 0.6, 0.1, 1.06, 0.12, 1.24, 1.02, 5.88, 0.98, 2.74, 2.63, 1.0, 1.05, 1.75, 0.88, 0.24, 0.54, 0.74, 1.24, 0.57, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/vgEq476aHxk_filtered.json b/annotations_filtered/vgEq476aHxk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a110e6267c89c7461e03892205b5f175e518e1f --- /dev/null +++ b/annotations_filtered/vgEq476aHxk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.45], [7.0, 16.95], [21.0, 35.63], [36.0, 64.07], [79.0, 79.51], [80.0, 79.61], [82.0, 85.28], [86.0, 110.35], [115.0, 119.3], [124.0, 130.01], [133.0, 133.32], [133.0, 152.93]], "keep_status": [false, true, false, true, false, false, true, true, false, false, false, true], "silence_prob": [0.0, 28.8, 28.79, 28.66, 0.0, 0.0, 29.35, 28.77, 28.47, 28.56, 0.0, 28.46], "audiomae_on_audioset": [null, [["music", 30.0], ["mains hum", 19.73], ["hum", 16.69]], [["speech", 66.75], ["music", 9.21], ["vehicle", 7.09]], [["music", 47.49], ["vehicle", 8.46], ["buzz", 6.04]], null, null, [["vehicle", 26.59], ["music", 25.65], ["buzz", 7.74]], [["buzz", 24.82], ["hum", 19.54], ["music", 14.12]], [["vehicle", 33.74], ["buzz", 27.57], ["car", 9.91]], [["hum", 32.77], ["throbbing", 19.82], ["music", 18.53]], null, [["speech", 45.09], ["music", 19.01], ["whack, thwack", 5.25]]], "duration": [0.45, 9.95, 14.63, 28.07, 0.51, -0.39, 3.28, 24.35, 4.3, 6.01, 0.32, 19.93]} \ No newline at end of file diff --git a/annotations_filtered/vgGb9tSOKbs_filtered.json b/annotations_filtered/vgGb9tSOKbs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/vgGb9tSOKbs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/vh-mdPoc92Y_filtered.json b/annotations_filtered/vh-mdPoc92Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4608dd4276e81d4fb04811e93645e1278af30bb --- /dev/null +++ b/annotations_filtered/vh-mdPoc92Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.37], [7.0, 8.56], [11.0, 11.03], [12.0, 24.71], [30.0, 35.92], [36.0, 37.17], [39.0, 39.9], [41.0, 41.18], [42.0, 43.14], [44.0, 127.25], [129.0, 130.82], [132.0, 135.9], [137.0, 138.28], [139.0, 143.36], [144.0, 156.02]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.29, 30.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.0, 0.0, 37.42, 34.64], "audiomae_on_audioset": [null, null, null, [["fart", 24.29], ["music", 16.86], ["noise", 10.21]], [["fart", 22.83], ["speech", 11.5], ["whack, thwack", 10.86]], null, null, null, null, null, null, null, null, [["didgeridoo", 61.74], ["music", 24.06], ["musical instrument", 6.1]], [["didgeridoo", 36.59], ["music", 36.37], ["musical instrument", 3.8]]], "duration": [0.37, 1.56, 0.03, 12.71, 5.92, 1.17, 0.9, 0.18, 1.14, 83.25, 1.82, 3.9, 1.28, 4.36, 12.02]} \ No newline at end of file diff --git a/annotations_filtered/vh7_WKODlE8_filtered.json b/annotations_filtered/vh7_WKODlE8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..085cfc36998c1e29b1ea9405e0d3176a07d8c2f2 --- /dev/null +++ b/annotations_filtered/vh7_WKODlE8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.04], [2.0, 2.98], [7.0, 8.63], [10.0, 18.42], [20.0, 21.86], [22.0, 31.08], [33.0, 44.39], [45.0, 47.87], [50.0, 50.8], [51.0, 54.53], [55.0, 60.84], [63.0, 68.28], [69.0, 71.0], [72.0, 76.45], [83.0, 85.23], [87.0, 87.52], [90.0, 90.05], [93.0, 94.0], [98.0, 98.69], [106.0, 106.71], [107.0, 111.1], [112.0, 112.99], [116.0, 116.43], [120.0, 124.78], [129.0, 130.76], [131.0, 134.1], [134.0, 134.18], [135.0, 135.28], [137.0, 138.33], [139.0, 145.12], [146.0, 148.49], [150.0, 151.87], [156.0, 162.97], [164.0, 166.21], [167.0, 169.91], [171.0, 171.93], [173.0, 181.95], [184.0, 184.01]], "keep_status": [false, false, false, false, false, true, true, false, false, true, false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 45.46, 0.0, 41.68, 45.85, 73.82, 0.0, 40.79, 55.96, 44.57, 36.49, 52.51, 56.7, 0.0, 0.0, 0.0, 0.0, 0.0, 33.9, 0.0, 0.0, 33.69, 0.0, 32.83, 0.0, 0.0, 0.0, 35.97, 39.38, 0.0, 71.57, 96.29, 96.29, 0.0, 49.68, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 36.36], ["mains hum", 24.82], ["speech", 8.92]], null, [["speech", 31.27], ["music", 5.49], ["hum", 5.49]], [["speech", 34.65], ["music", 12.12], ["hum", 8.47]], null, null, [["music", 44.18], ["speech", 10.16], ["whale vocalization", 7.42]], null, [["speech", 27.02], ["music", 26.25], ["whale vocalization", 15.58]], [["music", 23.48], ["didgeridoo", 13.95], ["boing", 6.95]], null, null, null, null, null, null, null, [["speech", 21.9], ["sine wave", 19.33], ["chirp tone", 11.7]], null, null, [["music", 32.21], ["beatboxing", 26.68], ["speech", 16.44]], null, [["speech", 57.59], ["gong", 13.01], ["singing bowl", 5.66]], null, null, null, [["speech", 36.92], ["music", 16.96], ["didgeridoo", 5.23]], [["music", 27.61], ["didgeridoo", 17.15], ["speech", 12.61]], null, null, null, null, null, [["speech", 67.34], ["animal", 6.84], ["inside, small room", 3.26]], null], "duration": [0.04, 0.98, 1.63, 8.42, 1.86, 9.08, 11.39, 2.87, 0.8, 3.53, 5.84, 5.28, 2.0, 4.45, 2.23, 0.52, 0.05, 1.0, 0.69, 0.71, 4.1, 0.99, 0.43, 4.78, 1.76, 3.1, 0.18, 0.28, 1.33, 6.12, 2.49, 1.87, 6.97, 2.21, 2.91, 0.93, 8.95, 0.01]} \ No newline at end of file diff --git a/annotations_filtered/vhEOInyNr54_filtered.json b/annotations_filtered/vhEOInyNr54_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1265e5e660b760d934eeb2c2de4a19d6a062e05e --- /dev/null +++ b/annotations_filtered/vhEOInyNr54_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.88], [6.0, 9.24], [13.0, 13.26], [14.0, 13.78], [14.0, 19.55], [21.0, 23.23], [24.0, 24.76], [25.0, 25.69], [27.0, 27.62], [30.0, 31.46], [33.0, 35.45], [37.0, 37.94], [38.0, 40.12], [41.0, 42.13], [43.0, 43.44], [45.0, 45.39], [46.0, 46.18], [47.0, 47.75], [49.0, 49.54], [51.0, 53.32], [54.0, 55.78], [59.0, 59.58], [64.0, 64.25], [67.0, 70.34], [72.0, 74.11], [80.0, 80.4], [83.0, 84.84], [85.0, 86.26], [88.0, 88.7], [90.0, 90.19], [95.0, 95.07], [96.0, 97.29], [100.0, 118.69], [126.0, 126.57], [128.0, 131.6], [133.0, 133.64], [137.0, 136.9], [140.0, 141.27], [142.0, 142.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [78.89, 79.41, 0.0, 0.0, 93.13, 97.83, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 43.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.92, 0.0, 0.0, 0.0, 76.7, 71.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.55, 0.0, 46.36, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 28.48], ["sidetone", 20.29], ["sine wave", 8.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 53.7], ["musical instrument", 2.91], ["theremin", 2.8]], null, null, null, null], "duration": [2.88, 3.24, 0.26, -0.22, 5.55, 2.23, 0.76, 0.69, 0.62, 1.46, 2.45, 0.94, 2.12, 1.13, 0.44, 0.39, 0.18, 0.75, 0.54, 2.32, 1.78, 0.58, 0.25, 3.34, 2.11, 0.4, 1.84, 1.26, 0.7, 0.19, 0.07, 1.29, 18.69, 0.57, 3.6, 0.64, -0.1, 1.27, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/vhQ4S5ajwDQ_filtered.json b/annotations_filtered/vhQ4S5ajwDQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fef6128aed6ffa52ca56ac7be78d3b6f2edd6da7 --- /dev/null +++ b/annotations_filtered/vhQ4S5ajwDQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.01], [17.0, 22.91], [26.0, 26.57], [32.0, 32.43], [40.0, 40.49], [52.0, 52.3], [56.0, 57.03], [59.0, 58.56], [78.0, 78.41], [98.0, 98.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 60.36], ["musical instrument", 6.55], ["guitar", 4.41]], null, null, null, null, null, null, null, null], "duration": [1.01, 5.91, 0.57, 0.43, 0.49, 0.3, 1.03, -0.44, 0.41, 0.36]} \ No newline at end of file diff --git a/annotations_filtered/vhfk-aOAgIE_filtered.json b/annotations_filtered/vhfk-aOAgIE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..477e7a580a72d7d9ac6203bfea5b9085700354be --- /dev/null +++ b/annotations_filtered/vhfk-aOAgIE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 41.15], [47.0, 47.19], [48.0, 70.68]], "keep_status": [false, false, false], "silence_prob": [32.84, 0.0, 33.1], "audiomae_on_audioset": [[["music", 80.27], ["boing", 3.1], ["sampler", 1.62]], null, [["music", 54.47], ["cattle, bovinae", 10.56], ["moo", 10.06]]], "duration": [3.15, 0.19, 22.68]} \ No newline at end of file diff --git a/annotations_filtered/vhhiJqQBMMY_filtered.json b/annotations_filtered/vhhiJqQBMMY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1dbb693a209c5c041e155a21c4f78e464e4b7625 --- /dev/null +++ b/annotations_filtered/vhhiJqQBMMY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.56], [9.0, 10.22], [20.0, 21.63], [23.0, 22.91], [23.0, 24.02], [25.0, 25.56], [27.0, 27.35], [28.0, 28.9], [30.0, 31.38], [33.0, 33.96], [35.0, 37.29], [43.0, 42.87], [44.0, 46.28], [49.0, 49.57], [53.0, 53.72], [54.0, 55.49], [63.0, 68.25], [73.0, 75.07], [75.0, 76.25], [78.0, 78.75], [85.0, 85.78], [100.0, 100.16], [101.0, 101.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.98, 0.0, 37.4, 0.0, 0.0, 0.0, 37.35, 40.82, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 19.35], ["didgeridoo", 9.35], ["speech", 8.65]], null, [["music", 59.02], ["speech", 7.05], ["theremin", 2.88]], null, null, null, [["music", 67.65], ["didgeridoo", 5.53], ["animal", 2.95]], [["speech", 36.2], ["music", 16.15], ["sidetone", 8.13]], null, null, null, null, null], "duration": [1.56, 1.22, 1.63, -0.09, 1.02, 0.56, 0.35, 0.9, 1.38, 0.96, 2.29, -0.13, 2.28, 0.57, 0.72, 1.49, 5.25, 2.07, 1.25, 0.75, 0.78, 0.16, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/vhmFJKHhdw4_filtered.json b/annotations_filtered/vhmFJKHhdw4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..136db0bfca957966643c7758fe90e37db9cb2990 --- /dev/null +++ b/annotations_filtered/vhmFJKHhdw4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.95], [3.0, 3.48], [5.0, 9.37], [11.0, 14.93], [18.0, 18.57], [22.0, 22.62], [29.0, 30.16], [37.0, 37.54], [46.0, 47.53], [59.0, 59.53], [73.0, 73.82], [76.0, 77.06], [77.0, 80.11], [87.0, 87.62], [94.0, 95.37], [110.0, 135.55], [138.0, 138.57], [142.0, 142.79], [153.0, 153.39], [155.0, 156.88], [166.0, 168.76], [182.0, 182.97], [186.0, 185.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 31.42, 32.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.77, 0.0, 0.0, 47.74, 0.0, 0.0, 0.0, 0.0, 30.5, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 58.15], ["music", 21.28], ["fart", 6.11]], [["music", 67.14], ["musical instrument", 10.89], ["synthesizer", 7.78]], null, null, null, null, null, null, null, null, [["music", 51.77], ["speech", 6.55], ["didgeridoo", 3.75]], null, null, [["music", 58.6], ["musical instrument", 4.78], ["effects unit", 3.32]], null, null, null, null, [["music", 30.0], ["carnatic music", 16.96], ["moo", 6.45]], null, null], "duration": [-0.05, 0.48, 4.37, 3.93, 0.57, 0.62, 1.16, 0.54, 1.53, 0.53, 0.82, 1.06, 3.11, 0.62, 1.37, 25.55, 0.57, 0.79, 0.39, 1.88, 2.76, 0.97, -0.01]} \ No newline at end of file diff --git a/annotations_filtered/vi9m0JRo71I_filtered.json b/annotations_filtered/vi9m0JRo71I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2e0d38701aae2a13207d543137eaf60a4a54fa0 --- /dev/null +++ b/annotations_filtered/vi9m0JRo71I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.0], [14.0, 17.86], [22.0, 22.42], [24.0, 72.52], [73.0, 75.71], [80.0, 101.38], [110.0, 111.69], [112.0, 112.26], [112.0, 112.29], [113.0, 122.84], [125.0, 139.01]], "keep_status": [true, true, false, false, false, true, false, false, false, true, false], "silence_prob": [46.12, 47.46, 0.0, 0.0, 56.7, 29.41, 0.0, 0.0, 0.0, 29.32, 29.74], "audiomae_on_audioset": [[["rumble", 37.13], ["hum", 11.02], ["throbbing", 9.41]], [["fly, housefly", 20.77], ["bee, wasp, etc.", 15.89], ["speech", 10.08]], null, null, null, [["vehicle", 20.55], ["whale vocalization", 13.26], ["buzz", 12.51]], null, null, null, [["grunt", 35.18], ["whale vocalization", 19.55], ["music", 12.63]], [["speech", 64.06], ["music", 28.4], ["animal", 0.81]]], "duration": [3.0, 3.86, 0.42, 48.52, 2.71, 21.38, 1.69, 0.26, 0.29, 9.84, 14.01]} \ No newline at end of file diff --git a/annotations_filtered/viCosY2u6YU_filtered.json b/annotations_filtered/viCosY2u6YU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff89114752c36164142f730b266aef0867a05f28 --- /dev/null +++ b/annotations_filtered/viCosY2u6YU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.62], [19.0, 19.87], [40.0, 51.09], [57.0, 57.2], [58.0, 58.48], [61.0, 62.4], [70.0, 73.23], [96.0, 97.01], [98.0, 97.83], [102.0, 103.01], [104.0, 105.95], [106.0, 106.47], [111.0, 111.69], [113.0, 112.95], [115.0, 115.06], [116.0, 116.72], [118.0, 126.4]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 30.18, 0.0, 0.0, 0.0, 31.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.47], "audiomae_on_audioset": [null, null, [["speech", 45.49], ["sidetone", 16.54], ["music", 6.7]], null, null, null, [["music", 20.68], ["throbbing", 8.7], ["rumble", 8.5]], null, null, null, null, null, null, null, null, null, [["speech", 50.63], ["fart", 9.37], ["inside, small room", 9.03]]], "duration": [1.62, 0.87, 11.09, 0.2, 0.48, 1.4, 3.23, 1.01, -0.17, 1.01, 1.95, 0.47, 0.69, -0.05, 0.06, 0.72, 8.4]} \ No newline at end of file diff --git a/annotations_filtered/vj3mnCSJq7E_filtered.json b/annotations_filtered/vj3mnCSJq7E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5112a2e5397a31043ed88984fec7b944f294da20 --- /dev/null +++ b/annotations_filtered/vj3mnCSJq7E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.64], [35.0, 35.06], [39.0, 38.6], [43.0, 42.72], [43.0, 43.53], [46.0, 46.99], [53.0, 56.66], [58.0, 59.71], [61.0, 61.16], [62.0, 62.51], [64.0, 65.97], [70.0, 69.9], [71.0, 73.6], [75.0, 77.21], [78.0, 78.49], [80.0, 81.68], [82.0, 85.43], [87.0, 88.75], [95.0, 95.3], [98.0, 104.35], [105.0, 106.41], [108.0, 110.15], [110.0, 112.19], [112.0, 114.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.51, 100.0, 0.0, 0.0, 98.44, 0.0, 0.0, 93.13, 0.0, 100.0, 96.42, 69.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.64, 0.06, -0.4, -0.28, 0.53, 0.99, 3.66, 1.71, 0.16, 0.51, 1.97, -0.1, 2.6, 2.21, 0.49, 1.68, 3.43, 1.75, 0.3, 6.35, 1.41, 2.15, 2.19, 2.39]} \ No newline at end of file diff --git a/annotations_filtered/vj6kMfad_2E_filtered.json b/annotations_filtered/vj6kMfad_2E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2c4cd136c9f0cf757793a0091eb6db9cdd1ce49 --- /dev/null +++ b/annotations_filtered/vj6kMfad_2E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.48], [9.0, 9.0], [9.0, 9.73], [12.0, 13.19], [15.0, 15.79], [16.0, 18.08], [18.0, 23.38], [29.0, 28.73], [29.0, 30.47], [40.0, 44.71], [45.0, 47.11], [49.0, 51.49], [53.0, 54.03], [56.0, 63.49], [68.0, 68.3], [70.0, 75.86], [76.0, 76.4], [77.0, 78.92], [80.0, 79.74], [86.0, 86.64], [87.0, 87.91], [94.0, 97.48], [103.0, 102.84], [103.0, 105.63], [106.0, 106.37], [107.0, 109.05], [109.0, 110.44], [113.0, 113.98], [114.0, 114.35], [117.0, 131.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 96.66, 96.29, 0.0, 0.0, 94.37, 99.9, 94.07, 0.0, 89.01, 0.0, 82.61, 0.0, 0.0, 0.0, 0.0, 0.0, 99.05, 0.0, 99.95, 0.0, 94.22, 0.0, 0.0, 0.0, 61.08], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 0.0, 0.73, 1.19, 0.79, 2.08, 5.38, -0.27, 1.47, 4.71, 2.11, 2.49, 1.03, 7.49, 0.3, 5.86, 0.4, 1.92, -0.26, 0.64, 0.91, 3.48, -0.16, 2.63, 0.37, 2.05, 1.44, 0.98, 0.35, 14.19]} \ No newline at end of file diff --git a/annotations_filtered/vjDxkz5LO7A_filtered.json b/annotations_filtered/vjDxkz5LO7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9dcc632db877e3e88e7d175a533ab265436fc8c --- /dev/null +++ b/annotations_filtered/vjDxkz5LO7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.78], [9.0, 10.2], [14.0, 14.66], [16.0, 16.88], [18.0, 18.72], [19.0, 20.34], [21.0, 21.96], [23.0, 25.19], [28.0, 43.41], [46.0, 48.49], [51.0, 51.41], [53.0, 55.19], [56.0, 56.64], [58.0, 59.07], [61.0, 65.11], [71.0, 72.44], [85.0, 133.76], [136.0, 138.67], [140.0, 158.95]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.25, 57.72, 52.74, 0.0, 53.1, 0.0, 0.0, 31.26, 0.0, 0.0, 31.83, 30.26], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["theremin", 24.28], ["music", 21.12], ["foghorn", 17.67]], null, null, null, null, null, null, [["music", 33.21], ["sonar", 7.74], ["creak", 5.99]], null, null, [["thunk", 28.17], ["mains hum", 18.88], ["whack, thwack", 12.15]], [["music", 83.35], ["didgeridoo", 1.98], ["electronic music", 1.7]]], "duration": [-0.22, 1.2, 0.66, 0.88, 0.72, 1.34, 0.96, 2.19, 15.41, 2.49, 0.41, 2.19, 0.64, 1.07, 4.11, 1.44, 48.76, 2.67, 18.95]} \ No newline at end of file diff --git a/annotations_filtered/vjFG-4Ge668_filtered.json b/annotations_filtered/vjFG-4Ge668_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e1b6925219edf48f6d27f180a79046cd23a39dc --- /dev/null +++ b/annotations_filtered/vjFG-4Ge668_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 33.25], [35.0, 55.88]], "keep_status": [false, true], "silence_prob": [0.0, 35.31], "audiomae_on_audioset": [null, [["music", 30.06], ["speech", 12.8], ["hum", 4.5]]], "duration": [0.25, 20.88]} \ No newline at end of file diff --git a/annotations_filtered/vjKoaNcefSU_filtered.json b/annotations_filtered/vjKoaNcefSU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9931fe8990e4fafdf65cad7abf6daa66df4636f6 --- /dev/null +++ b/annotations_filtered/vjKoaNcefSU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.55], [20.0, 20.56], [23.0, 23.55], [31.0, 31.18], [35.0, 35.13], [38.0, 40.15], [41.0, 42.9], [47.0, 47.56], [51.0, 51.07], [53.0, 60.08], [71.0, 71.19], [75.0, 78.07], [81.0, 81.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 0.0, 0.0, 0.0, 52.45, 0.0, 82.79, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.55, 0.56, 0.55, 0.18, 0.13, 2.15, 1.9, 0.56, 0.07, 7.08, 0.19, 3.07, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/vj_NmzJ0mMA_filtered.json b/annotations_filtered/vj_NmzJ0mMA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84559c537f58b5b593df732aab6d705b07bb6f0a --- /dev/null +++ b/annotations_filtered/vj_NmzJ0mMA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 58.6], [61.0, 61.55], [62.0, 98.66], [104.0, 104.4], [105.0, 105.34], [107.0, 124.78], [125.0, 125.73]], "keep_status": [false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 36.9, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["noise", 28.1], ["music", 24.22], ["fly, housefly", 8.58]], null], "duration": [35.6, 0.55, 36.66, 0.4, 0.34, 17.78, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/vjmHq57MZso_filtered.json b/annotations_filtered/vjmHq57MZso_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f952b8528cb53b6f866ffe77a3806c84894cae8 --- /dev/null +++ b/annotations_filtered/vjmHq57MZso_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.8], [17.0, 17.52], [20.0, 20.76], [33.0, 33.44], [36.0, 37.98], [39.0, 40.02], [41.0, 41.74], [52.0, 52.24], [60.0, 68.72], [74.0, 75.03], [76.0, 78.31], [81.0, 81.58], [84.0, 84.65], [85.0, 85.77], [87.0, 87.02], [89.0, 92.91], [93.0, 93.88], [95.0, 95.49], [99.0, 99.82], [102.0, 103.2], [107.0, 107.82], [112.0, 118.57], [119.0, 121.09], [123.0, 124.12], [125.0, 126.62], [127.0, 131.36], [134.0, 136.56], [138.0, 147.24], [156.0, 156.78], [158.0, 158.11], [159.0, 159.38], [161.0, 162.85], [163.0, 165.1], [170.0, 174.24], [174.0, 176.49], [178.0, 178.55], [180.0, 180.64], [181.0, 183.24], [184.0, 185.7], [187.0, 189.5], [190.0, 191.3], [193.0, 192.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.25, 0.0, 41.72, 0.0, 0.0, 0.0, 0.0, 53.78, 0.0, 0.0, 0.0, 0.0, 0.0, 74.13, 72.6, 0.0, 0.0, 62.89, 52.51, 33.07, 0.0, 0.0, 0.0, 0.0, 88.46, 61.27, 70.3, 0.0, 0.0, 47.7, 0.0, 51.88, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 61.44], ["music", 6.57], ["boing", 3.01]], null, [["sidetone", 22.4], ["music", 20.79], ["speech", 18.04]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 31.34], ["music", 23.2], ["synthesizer", 10.74]], null, null, null, null, null, null, null, null, null, [["speech", 35.05], ["music", 14.25], ["ping", 4.61]], null, null, null, null], "duration": [0.8, 0.52, 0.76, 0.44, 1.98, 1.02, 0.74, 0.24, 8.72, 1.03, 2.31, 0.58, 0.65, 0.77, 0.02, 3.91, 0.88, 0.49, 0.82, 1.2, 0.82, 6.57, 2.09, 1.12, 1.62, 4.36, 2.56, 9.24, 0.78, 0.11, 0.38, 1.85, 2.1, 4.24, 2.49, 0.55, 0.64, 2.24, 1.7, 2.5, 1.3, -0.03]} \ No newline at end of file diff --git a/annotations_filtered/vjvHNXSWvPs_filtered.json b/annotations_filtered/vjvHNXSWvPs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5a06d5d111f91503a51b053505c311113c705bf --- /dev/null +++ b/annotations_filtered/vjvHNXSWvPs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.64], [10.0, 9.98], [11.0, 12.21], [14.0, 15.53], [17.0, 18.03], [19.0, 18.76], [20.0, 24.65], [25.0, 27.7], [29.0, 29.86], [32.0, 32.49], [33.0, 34.38], [39.0, 39.48], [43.0, 44.49], [48.0, 49.03], [50.0, 50.62], [52.0, 52.89], [60.0, 61.15], [68.0, 68.25], [70.0, 70.29], [73.0, 73.28], [73.0, 73.4], [80.0, 81.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.94, 0.0, 0.0, 0.0, 0.0, 0.0, 50.81, 85.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["gong", 54.44], ["music", 12.79], ["singing bowl", 8.13]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.64, -0.02, 1.21, 1.53, 1.03, -0.24, 4.65, 2.7, 0.86, 0.49, 1.38, 0.48, 1.49, 1.03, 0.62, 0.89, 1.15, 0.25, 0.29, 0.28, 0.4, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/vk5Kr-zV8AE_filtered.json b/annotations_filtered/vk5Kr-zV8AE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38425bc167aa171449bb533e8fafc1e34fba0491 --- /dev/null +++ b/annotations_filtered/vk5Kr-zV8AE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.51], [12.0, 11.84], [34.0, 34.11], [44.0, 44.83], [59.0, 59.21], [60.0, 61.23], [66.0, 66.43], [69.0, 68.81], [73.0, 73.8], [78.0, 80.32], [82.0, 83.54], [86.0, 104.75], [105.0, 106.27], [127.0, 127.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.55, 0.0, 30.36, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["hum", 35.18], ["music", 25.32], ["throbbing", 13.08]], null, null], "duration": [0.51, -0.16, 0.11, 0.83, 0.21, 1.23, 0.43, -0.19, 0.8, 2.32, 1.54, 18.75, 1.27, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/vkFKHF9Fs_s_filtered.json b/annotations_filtered/vkFKHF9Fs_s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30b3f4f81f9590a38870953601dac0e35b309d2c --- /dev/null +++ b/annotations_filtered/vkFKHF9Fs_s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.37], [8.0, 9.05], [10.0, 11.85], [13.0, 13.68], [14.0, 14.64], [15.0, 28.59], [32.0, 35.14], [38.0, 39.65], [40.0, 41.69], [43.0, 43.28], [44.0, 44.85], [46.0, 46.38], [47.0, 49.64], [51.0, 55.97], [57.0, 56.91], [59.0, 59.05], [60.0, 61.72], [62.0, 63.39], [66.0, 66.36], [67.0, 67.91], [69.0, 69.79], [70.0, 71.19], [72.0, 77.26], [78.0, 79.29], [81.0, 81.45], [84.0, 83.98], [85.0, 89.21], [89.0, 89.31], [89.0, 89.36], [89.0, 89.41], [89.0, 89.48], [90.0, 102.37], [103.0, 106.03], [107.0, 108.7], [109.0, 109.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.15, 0.0, 0.0, 0.0, 0.0, 79.59, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.41, 0.0, 0.0, 0.0, 68.28, 0.0, 0.0, 0.0, 0.0, 86.64, 98.73, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.37, 1.05, 1.85, 0.68, 0.64, 13.59, 3.14, 1.65, 1.69, 0.28, 0.85, 0.38, 2.64, 4.97, -0.09, 0.05, 1.72, 1.39, 0.36, 0.91, 0.79, 1.19, 5.26, 1.29, 0.45, -0.02, 4.21, 0.31, 0.36, 0.41, 0.48, 12.37, 3.03, 1.7, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/vkX9jHBsmwM_filtered.json b/annotations_filtered/vkX9jHBsmwM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..211188441473f005bb4d7e9330750eecefeb3b2f --- /dev/null +++ b/annotations_filtered/vkX9jHBsmwM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 23.4], [26.0, 42.57], [56.0, 56.67], [59.0, 66.09], [71.0, 72.1], [73.0, 73.84], [77.0, 87.24], [103.0, 118.22]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [30.69, 31.15, 0.0, 30.86, 0.0, 0.0, 31.51, 30.81], "audiomae_on_audioset": [[["music", 79.91], ["didgeridoo", 7.49], ["throbbing", 1.63]], [["music", 78.09], ["throbbing", 10.36], ["electronic music", 2.05]], null, [["music", 52.27], ["whack, thwack", 9.64], ["smash, crash", 9.53]], null, null, [["music", 53.4], ["didgeridoo", 23.55], ["throbbing", 5.68]], [["whack, thwack", 25.97], ["music", 22.99], ["throbbing", 21.79]]], "duration": [9.4, 16.57, 0.67, 7.09, 1.1, 0.84, 10.24, 15.22]} \ No newline at end of file diff --git a/annotations_filtered/vkXY0EqahbY_filtered.json b/annotations_filtered/vkXY0EqahbY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1587958981c7f41ce349836e54f65394a7347315 --- /dev/null +++ b/annotations_filtered/vkXY0EqahbY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.51], [7.0, 6.74], [10.0, 10.29], [15.0, 15.6], [19.0, 19.48], [22.0, 23.16], [25.0, 26.59], [30.0, 30.7], [33.0, 33.71], [35.0, 38.35], [42.0, 42.33], [43.0, 43.06], [47.0, 47.98], [51.0, 50.79], [51.0, 51.98], [54.0, 54.58], [57.0, 58.06], [62.0, 61.94], [63.0, 63.81], [66.0, 66.39], [67.0, 67.04], [71.0, 71.59], [74.0, 76.05], [81.0, 81.04], [84.0, 84.43], [85.0, 85.68], [87.0, 87.39], [91.0, 91.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.51, -0.26, 0.29, 0.6, 0.48, 1.16, 1.59, 0.7, 0.71, 3.35, 0.33, 0.06, 0.98, -0.21, 0.98, 0.58, 1.06, -0.06, 0.81, 0.39, 0.04, 0.59, 2.05, 0.04, 0.43, 0.68, 0.39, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/vkdH0nuDWX4_filtered.json b/annotations_filtered/vkdH0nuDWX4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bfc7297b48339714ae7230ca783dd3c6d7de5780 --- /dev/null +++ b/annotations_filtered/vkdH0nuDWX4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.23], [7.0, 7.91], [9.0, 9.24], [11.0, 11.21], [13.0, 14.39], [16.0, 17.39], [18.0, 32.43], [34.0, 36.39], [37.0, 43.01], [44.0, 45.27], [48.0, 54.04], [57.0, 62.68], [64.0, 64.93], [72.0, 72.59], [76.0, 78.41], [88.0, 88.28], [92.0, 92.03], [96.0, 97.92], [99.0, 99.6], [101.0, 101.8], [106.0, 108.18], [110.0, 110.0], [113.0, 123.65], [126.0, 127.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.94, 30.8, 29.91, 0.0, 29.55, 31.99, 0.0, 0.0, 37.96, 0.0, 0.0, 0.0, 0.0, 0.0, 33.81, 0.0, 32.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 40.17], ["sidetone", 35.46], ["music", 9.36]], [["music", 65.27], ["speech", 9.47], ["musical instrument", 7.27]], [["speech", 47.21], ["music", 23.82], ["synthesizer", 8.73]], null, [["speech", 52.12], ["music", 11.04], ["mains hum", 5.04]], [["music", 22.84], ["hum", 6.23], ["vehicle", 5.83]], null, null, [["noise", 23.29], ["hum", 7.86], ["fart", 5.5]], null, null, null, null, null, [["boat, water vehicle", 11.64], ["motorboat, speedboat", 9.69], ["vehicle", 9.25]], null, [["music", 42.94], ["synthesizer", 11.85], ["musical instrument", 7.87]], null], "duration": [0.23, 0.91, 0.24, 0.21, 1.39, 1.39, 14.43, 2.39, 6.01, 1.27, 6.04, 5.68, 0.93, 0.59, 2.41, 0.28, 0.03, 1.92, 0.6, 0.8, 2.18, 0.0, 10.65, 1.16]} \ No newline at end of file diff --git a/annotations_filtered/vkj3RBOD3cA_filtered.json b/annotations_filtered/vkj3RBOD3cA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..845f67d79676edeb64f73b02c1933aa08a77d946 --- /dev/null +++ b/annotations_filtered/vkj3RBOD3cA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 26.42], [31.0, 34.55], [43.0, 43.38], [48.0, 48.49], [52.0, 52.05], [58.0, 58.45], [62.0, 62.83], [65.0, 66.24], [67.0, 68.96], [71.0, 71.73], [74.0, 76.23], [79.0, 80.0], [82.0, 82.12], [84.0, 84.45], [89.0, 89.01], [91.0, 91.3], [100.0, 101.06], [105.0, 106.76], [108.0, 109.56], [111.0, 111.99], [116.0, 116.51], [120.0, 121.04], [122.0, 122.55], [125.0, 125.98], [130.0, 130.49], [131.0, 132.41], [133.0, 134.06], [138.0, 138.52], [141.0, 141.22], [142.0, 142.55], [145.0, 146.52], [149.0, 150.06], [152.0, 152.44], [153.0, 153.86], [155.0, 157.05], [159.0, 160.44], [163.0, 164.08], [165.0, 166.77], [169.0, 169.53], [176.0, 178.11], [179.0, 183.05], [186.0, 196.5], [197.0, 199.1], [200.0, 200.77], [204.0, 205.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [71.0, 55.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.29, 0.0, 0.0, 0.0, 0.0, 86.82, 99.76, 98.27, 99.76, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.42, 3.55, 0.38, 0.49, 0.05, 0.45, 0.83, 1.24, 1.96, 0.73, 2.23, 1.0, 0.12, 0.45, 0.01, 0.3, 1.06, 1.76, 1.56, 0.99, 0.51, 1.04, 0.55, 0.98, 0.49, 1.41, 1.06, 0.52, 0.22, 0.55, 1.52, 1.06, 0.44, 0.86, 2.05, 1.44, 1.08, 1.77, 0.53, 2.11, 4.05, 10.5, 2.1, 0.77, 1.43]} \ No newline at end of file diff --git a/annotations_filtered/vkkM9YAJ-Ts_filtered.json b/annotations_filtered/vkkM9YAJ-Ts_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bfe2bd2919fb0931b3b21e0dc97d39c64dea761a --- /dev/null +++ b/annotations_filtered/vkkM9YAJ-Ts_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.76], [14.0, 15.87], [18.0, 18.64], [21.0, 22.42], [27.0, 29.25], [34.0, 43.5]], "keep_status": [true, false, false, false, true, true], "silence_prob": [31.2, 0.0, 0.0, 0.0, 43.3, 34.93], "audiomae_on_audioset": [[["speech", 40.67], ["tuning fork", 11.4], ["chink, clink", 7.12]], null, null, null, [["telephone", 27.86], ["baby laughter", 14.05], ["goose", 5.9]], [["speech", 36.91], ["snicker", 16.2], ["laughter", 5.07]]], "duration": [3.76, 1.87, 0.64, 1.42, 2.25, 9.5]} \ No newline at end of file diff --git a/annotations_filtered/vkmf3Hbnh_4_filtered.json b/annotations_filtered/vkmf3Hbnh_4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fddd50d52028a40b8589f310f93c6fdb8037bb3 --- /dev/null +++ b/annotations_filtered/vkmf3Hbnh_4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.99], [13.0, 22.01], [24.0, 25.19], [29.0, 38.3], [40.0, 52.25], [59.0, 59.24], [60.0, 83.78], [85.0, 84.94], [85.0, 85.45], [85.0, 115.6], [117.0, 121.0], [141.0, 141.25]], "keep_status": [true, true, false, true, true, false, false, false, false, false, false, false], "silence_prob": [38.58, 34.99, 0.0, 32.63, 31.56, 0.0, 31.2, 0.0, 0.0, 0.0, 32.14, 0.0], "audiomae_on_audioset": [[["music", 48.44], ["synthesizer", 9.4], ["theremin", 4.15]], [["music", 47.99], ["musical instrument", 8.5], ["speech", 7.96]], null, [["music", 34.17], ["boing", 22.9], ["speech", 8.35]], [["music", 17.78], ["speech", 8.64], ["foghorn", 7.6]], null, [["music", 67.85], ["cacophony", 6.42], ["musical instrument", 2.2]], null, null, null, [["music", 51.47], ["theremin", 20.63], ["musical instrument", 4.11]], null], "duration": [3.99, 9.01, 1.19, 9.3, 12.25, 0.24, 23.78, -0.06, 0.45, 30.6, 4.0, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/vkoJH4fum58_filtered.json b/annotations_filtered/vkoJH4fum58_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a9725eb12ef36f1e1e55dc0a78eef963f3fc590 --- /dev/null +++ b/annotations_filtered/vkoJH4fum58_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 31.73], [33.0, 32.7], [34.0, 35.41], [38.0, 38.62], [39.0, 40.15], [52.0, 53.91], [55.0, 55.24], [61.0, 61.65], [62.0, 62.8], [64.0, 64.56], [83.0, 83.22], [83.0, 83.44], [88.0, 89.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, -0.3, 1.41, 0.62, 1.15, 1.91, 0.24, 0.65, 0.8, 0.56, 0.22, 0.44, 1.31]} \ No newline at end of file diff --git a/annotations_filtered/vl5LaKMkhYw_filtered.json b/annotations_filtered/vl5LaKMkhYw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e57e4ef455a00bab97856cbfc2f9611937f68e1 --- /dev/null +++ b/annotations_filtered/vl5LaKMkhYw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.02], [6.0, 6.74], [9.0, 9.75], [11.0, 12.07], [13.0, 14.76], [17.0, 17.78], [19.0, 20.14], [21.0, 21.68], [22.0, 23.19], [24.0, 24.73], [26.0, 27.87], [29.0, 31.95], [33.0, 44.37], [50.0, 49.77], [51.0, 51.68], [52.0, 53.92], [54.0, 56.79], [59.0, 59.54], [60.0, 61.65], [65.0, 67.05], [67.0, 73.47], [74.0, 74.16], [76.0, 77.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 98.86, 0.0, 0.0, 100.0, 99.99, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.02, 0.74, 0.75, 1.07, 1.76, 0.78, 1.14, 0.68, 1.19, 0.73, 1.87, 2.95, 11.37, -0.23, 0.68, 1.92, 2.79, 0.54, 1.65, 2.05, 6.47, 0.16, 1.8]} \ No newline at end of file diff --git a/annotations_filtered/vlK8CMKzWUY_filtered.json b/annotations_filtered/vlK8CMKzWUY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e8e2037b940caa5e3ea08b7a69cd1911ce2dc29 --- /dev/null +++ b/annotations_filtered/vlK8CMKzWUY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.85], [13.0, 13.32], [14.0, 14.67], [18.0, 19.08], [21.0, 21.42], [23.0, 24.7], [26.0, 27.24], [34.0, 33.89], [37.0, 37.12], [43.0, 43.92], [51.0, 52.24], [61.0, 62.95], [64.0, 65.13], [66.0, 71.29], [81.0, 83.51], [85.0, 88.43], [90.0, 90.41], [92.0, 91.98], [95.0, 95.98], [100.0, 101.78], [103.0, 104.19], [106.0, 107.0], [108.0, 108.18], [109.0, 109.56], [114.0, 115.86], [117.0, 118.74], [120.0, 122.76], [127.0, 127.72], [129.0, 130.15], [132.0, 133.03], [138.0, 139.45], [143.0, 143.38], [144.0, 145.5], [146.0, 146.75], [155.0, 156.42], [166.0, 167.21], [169.0, 169.08], [169.0, 170.94], [172.0, 173.33], [175.0, 176.54], [178.0, 177.94], [178.0, 178.02], [178.0, 178.09], [180.0, 182.44], [184.0, 185.25], [187.0, 194.7], [196.0, 196.89]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.75, 32.3, 38.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.79, 0.0, 39.09, 0.0], "audiomae_on_audioset": [[["clapping", 30.81], ["hands", 11.65], ["tap", 11.64]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 20.51], ["hum", 18.69], ["mains hum", 10.64]], [["speech", 23.44], ["didgeridoo", 17.68], ["music", 16.56]], [["music", 46.31], ["synthesizer", 25.45], ["hum", 6.64]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 56.53], ["thunk", 13.11], ["flamenco", 4.28]], null, [["music", 74.5], ["synthesizer", 6.48], ["musical instrument", 3.14]], null], "duration": [2.85, 0.32, 0.67, 1.08, 0.42, 1.7, 1.24, -0.11, 0.12, 0.92, 1.24, 1.95, 1.13, 5.29, 2.51, 3.43, 0.41, -0.02, 0.98, 1.78, 1.19, 1.0, 0.18, 0.56, 1.86, 1.74, 2.76, 0.72, 1.15, 1.03, 1.45, 0.38, 1.5, 0.75, 1.42, 1.21, 0.08, 1.94, 1.33, 1.54, -0.06, 0.02, 0.09, 2.44, 1.25, 7.7, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/vlZQj4OrTUM_filtered.json b/annotations_filtered/vlZQj4OrTUM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..615b5dca9f9c1e193d9cf87e3589ba3ce360630a --- /dev/null +++ b/annotations_filtered/vlZQj4OrTUM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.31], [13.0, 19.75], [21.0, 22.25], [26.0, 26.96], [29.0, 34.18], [36.0, 37.57], [40.0, 41.4], [44.0, 46.14], [48.0, 50.8], [55.0, 54.85], [56.0, 56.78], [58.0, 58.94], [67.0, 67.44], [71.0, 71.22], [74.0, 75.46], [79.0, 79.89], [90.0, 89.94], [93.0, 95.42], [99.0, 103.94], [105.0, 106.91], [108.0, 109.44], [111.0, 112.78], [115.0, 117.39], [119.0, 123.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 99.87, 99.85], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.31, 6.75, 1.25, 0.96, 5.18, 1.57, 1.4, 2.14, 2.8, -0.15, 0.78, 0.94, 0.44, 0.22, 1.46, 0.89, -0.06, 2.42, 4.94, 1.91, 1.44, 1.78, 2.39, 4.72]} \ No newline at end of file diff --git a/annotations_filtered/vlg5VPKbGQg_filtered.json b/annotations_filtered/vlg5VPKbGQg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31f2bdacc87c5296609124434428801dcb7012ae --- /dev/null +++ b/annotations_filtered/vlg5VPKbGQg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.05], [6.0, 7.91], [9.0, 13.07], [14.0, 14.49], [15.0, 20.44], [22.0, 23.16], [24.0, 34.8], [36.0, 39.9], [42.0, 44.46], [46.0, 47.65], [49.0, 52.35], [54.0, 54.63], [57.0, 59.71], [61.0, 62.95], [66.0, 69.87], [71.0, 79.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 93.45, 0.0, 99.62, 0.0, 87.74, 98.51, 100.0, 0.0, 99.97, 0.0, 90.78, 0.0, 99.92, 70.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.05, 1.91, 4.07, 0.49, 5.44, 1.16, 10.8, 3.9, 2.46, 1.65, 3.35, 0.63, 2.71, 1.95, 3.87, 8.88]} \ No newline at end of file diff --git a/annotations_filtered/vlqQwxeYtr8_filtered.json b/annotations_filtered/vlqQwxeYtr8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..205e9d5eb655a4a8f96e6a2ae5ae535cc69432e4 --- /dev/null +++ b/annotations_filtered/vlqQwxeYtr8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 15.25], [17.0, 20.83], [22.0, 24.0], [26.0, 29.76], [30.0, 31.92], [34.0, 37.23], [38.0, 41.72], [43.0, 46.43], [47.0, 50.25], [52.0, 63.21], [65.0, 66.06], [67.0, 67.78], [78.0, 79.14], [79.0, 86.58], [87.0, 90.09], [91.0, 91.66], [93.0, 99.76], [101.0, 101.75], [103.0, 104.65], [108.0, 107.89], [114.0, 114.91], [119.0, 124.26]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.71, 100.0, 100.0, 100.0, 0.0, 75.07, 82.25, 100.0, 84.43, 44.49, 0.0, 0.0, 0.0, 94.22, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["insect", 33.88], ["fly, housefly", 11.96], ["cattle, bovinae", 8.13]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.25, 3.83, 2.0, 3.76, 1.92, 3.23, 3.72, 3.43, 3.25, 11.21, 1.06, 0.78, 1.14, 7.58, 3.09, 0.66, 6.76, 0.75, 1.65, -0.11, 0.91, 5.26]} \ No newline at end of file diff --git a/annotations_filtered/vm-rgqRKqz8_filtered.json b/annotations_filtered/vm-rgqRKqz8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84b87a35a70f4ac7550a7c2c4f00505d299ae470 --- /dev/null +++ b/annotations_filtered/vm-rgqRKqz8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.16], [8.0, 19.57], [25.0, 25.3], [31.0, 32.1], [33.0, 49.08], [51.0, 52.54], [60.0, 60.1], [65.0, 66.31], [68.0, 69.31], [70.0, 71.61], [72.0, 73.72], [75.0, 75.12], [78.0, 80.05], [85.0, 86.41], [87.0, 87.17], [88.0, 92.85], [94.0, 110.96], [113.0, 115.13], [121.0, 125.19]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [88.64, 57.09, 0.0, 0.0, 48.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 48.39, 50.11, 34.08, 40.28], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 23.3], ["hum", 20.23], ["music", 10.58]], null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 21.92], ["sidetone", 18.95], ["bee, wasp, etc.", 13.74]], null, [["cattle, bovinae", 18.52], ["wild animals", 17.1], ["animal", 16.74]], [["music", 59.37], ["theremin", 7.48], ["didgeridoo", 4.18]]], "duration": [2.16, 11.57, 0.3, 1.1, 16.08, 1.54, 0.1, 1.31, 1.31, 1.61, 1.72, 0.12, 2.05, 1.41, 0.17, 4.85, 16.96, 2.13, 4.19]} \ No newline at end of file diff --git a/annotations_filtered/vm8sOhr-0lA_filtered.json b/annotations_filtered/vm8sOhr-0lA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c4de89c1539831ffd4134b0eb0018838ea67d0b --- /dev/null +++ b/annotations_filtered/vm8sOhr-0lA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.57], [8.0, 9.61], [13.0, 16.87], [23.0, 24.95], [27.0, 27.51], [34.0, 35.9], [41.0, 42.55], [43.0, 48.37], [52.0, 54.31], [56.0, 58.41], [62.0, 62.29], [65.0, 71.22], [77.0, 97.11], [108.0, 111.45], [113.0, 114.25], [118.0, 121.24]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 31.51, 0.0, 0.0, 0.0, 0.0, 30.04, 36.33, 33.74, 0.0, 30.06, 31.69, 33.82, 0.0, 65.79], "audiomae_on_audioset": [null, null, [["speech", 39.41], ["music", 22.08], ["eruption", 7.82]], null, null, null, null, [["music", 69.28], ["synthesizer", 8.09], ["theremin", 4.08]], [["music", 77.0], ["throbbing", 3.63], ["hum", 3.55]], [["music", 79.45], ["synthesizer", 2.69], ["throbbing", 2.2]], null, [["music", 41.55], ["hum", 18.24], ["throbbing", 13.0]], [["music", 25.04], ["hum", 24.28], ["throbbing", 15.44]], [["music", 42.96], ["sonar", 9.65], ["synthesizer", 9.46]], null, null], "duration": [0.57, 1.61, 3.87, 1.95, 0.51, 1.9, 1.55, 5.37, 2.31, 2.41, 0.29, 6.22, 20.11, 3.45, 1.25, 3.24]} \ No newline at end of file diff --git a/annotations_filtered/vmOBZjVBCUo_filtered.json b/annotations_filtered/vmOBZjVBCUo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d69e83b3a82a800b77bc91d555ef3492656a804 --- /dev/null +++ b/annotations_filtered/vmOBZjVBCUo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 52.69], [54.0, 57.52], [58.0, 60.05], [62.0, 70.33], [75.0, 78.83], [81.0, 81.65], [82.0, 82.63], [87.0, 86.95], [87.0, 87.76], [89.0, 101.83]], "keep_status": [true, false, true, true, false, false, false, false, false, false], "silence_prob": [37.54, 38.78, 35.54, 37.23, 40.48, 0.0, 0.0, 0.0, 0.0, 29.46], "audiomae_on_audioset": [[["speech", 48.22], ["crushing", 5.25], ["music", 4.87]], [["music", 58.88], ["throbbing", 7.33], ["electronic music", 6.94]], [["throbbing", 27.5], ["music", 17.2], ["hum", 12.39]], [["glass", 16.65], ["hum", 11.6], ["throbbing", 9.84]], [["cattle, bovinae", 47.27], ["moo", 17.84], ["livestock, farm animals, working animals", 14.85]], null, null, null, null, [["music", 79.67], ["hum", 3.53], ["throbbing", 2.41]]], "duration": [3.69, 3.52, 2.05, 8.33, 3.83, 0.65, 0.63, -0.05, 0.76, 12.83]} \ No newline at end of file diff --git a/annotations_filtered/vmWm02fUJ-o_filtered.json b/annotations_filtered/vmWm02fUJ-o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..411fec309ed9b1034e1baa532269b73e77122698 --- /dev/null +++ b/annotations_filtered/vmWm02fUJ-o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 27.62], [33.0, 37.4], [38.0, 42.63], [44.0, 43.97], [45.0, 46.23], [48.0, 52.35], [55.0, 60.54], [64.0, 92.6], [94.0, 95.1], [97.0, 101.46], [102.0, 106.05], [106.0, 107.06], [110.0, 114.88], [116.0, 119.52], [122.0, 123.58], [124.0, 124.06], [125.0, 126.57], [127.0, 127.5], [129.0, 132.66], [133.0, 134.37], [135.0, 135.78], [143.0, 143.63], [148.0, 148.14], [150.0, 155.24], [156.0, 156.44], [160.0, 160.57], [162.0, 163.46], [165.0, 165.43], [168.0, 168.72], [172.0, 174.51], [176.0, 178.17], [180.0, 183.17], [185.0, 186.88], [188.0, 189.24], [192.0, 195.57], [199.0, 207.1], [207.0, 207.18]], "keep_status": [false, false, true, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, false, false], "silence_prob": [37.92, 33.02, 38.71, 0.0, 0.0, 34.59, 33.94, 31.44, 0.0, 34.72, 36.44, 0.0, 34.37, 43.93, 0.0, 0.0, 0.0, 0.0, 54.3, 0.0, 0.0, 0.0, 0.0, 40.75, 0.0, 0.0, 0.0, 0.0, 0.0, 67.51, 43.4, 41.09, 0.0, 0.0, 34.53, 31.5, 0.0], "audiomae_on_audioset": [[["fly, housefly", 58.83], ["insect", 32.73], ["bee, wasp, etc.", 6.91]], [["fly, housefly", 47.65], ["insect", 38.62], ["bee, wasp, etc.", 10.49]], [["speech", 46.93], ["telephone", 7.72], ["radio", 6.57]], null, null, [["noise", 15.41], ["speech", 10.43], ["music", 9.99]], [["fly, housefly", 58.24], ["insect", 19.67], ["bee, wasp, etc.", 17.42]], [["whale vocalization", 33.9], ["noise", 19.25], ["music", 5.63]], null, [["fly, housefly", 45.7], ["insect", 19.26], ["sidetone", 8.17]], [["fly, housefly", 49.76], ["insect", 26.43], ["bee, wasp, etc.", 14.56]], null, [["music", 30.05], ["didgeridoo", 10.28], ["speech", 6.47]], [["fly, housefly", 36.06], ["insect", 26.62], ["bee, wasp, etc.", 13.8]], null, null, null, null, null, null, null, null, null, [["speech", 52.97], ["radio", 20.76], ["frog", 8.18]], null, null, null, null, null, null, [["music", 17.64], ["hum", 10.3], ["mains hum", 8.73]], [["music", 12.47], ["effects unit", 10.97], ["synthesizer", 10.52]], null, null, [["speech", 42.25], ["music", 19.56], ["beatboxing", 4.86]], [["music", 46.08], ["didgeridoo", 14.85], ["frog", 10.92]], null], "duration": [3.62, 4.4, 4.63, -0.03, 1.23, 4.35, 5.54, 28.6, 1.1, 4.46, 4.05, 1.06, 4.88, 3.52, 1.58, 0.06, 1.57, 0.5, 3.66, 1.37, 0.78, 0.63, 0.14, 5.24, 0.44, 0.57, 1.46, 0.43, 0.72, 2.51, 2.17, 3.17, 1.88, 1.24, 3.57, 8.1, 0.18]} \ No newline at end of file diff --git a/annotations_filtered/vmm8P0V1W4g_filtered.json b/annotations_filtered/vmm8P0V1W4g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d96fafed457561c2b012c7bd4632ff5d16496244 --- /dev/null +++ b/annotations_filtered/vmm8P0V1W4g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.06], [4.0, 5.02], [6.0, 6.56], [8.0, 32.39], [32.0, 32.53], [33.0, 38.62], [41.0, 73.13], [76.0, 94.24], [94.0, 94.27], [96.0, 120.38], [122.0, 124.07], [125.0, 133.95], [135.0, 155.33], [159.0, 165.48], [168.0, 171.68], [175.0, 176.94]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 32.08, 0.0, 31.53, 0.0, 31.63, 0.0, 34.09, 65.67, 31.42, 31.2, 32.56, 30.88, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 52.29], ["music", 38.24], ["fireworks", 1.35]], null, [["music", 61.5], ["throbbing", 15.0], ["hum", 5.03]], null, [["music", 28.34], ["throbbing", 18.83], ["whack, thwack", 9.45]], null, [["music", 44.66], ["throbbing", 15.76], ["hum", 10.76]], null, [["speech", 80.95], ["music", 8.02], ["sidetone", 1.34]], [["speech", 58.25], ["music", 27.27], ["cacophony", 2.05]], [["music", 28.91], ["throbbing", 7.44], ["cacophony", 6.75]], [["music", 21.92], ["theremin", 12.57], ["noise", 11.42]], null], "duration": [0.06, 1.02, 0.56, 24.39, 0.53, 5.62, 32.13, 18.24, 0.27, 24.38, 2.07, 8.95, 20.33, 6.48, 3.68, 1.94]} \ No newline at end of file diff --git a/annotations_filtered/vmynulColPI_filtered.json b/annotations_filtered/vmynulColPI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e0f0e53cb47905ce32c473e67097a1802ff3b7a --- /dev/null +++ b/annotations_filtered/vmynulColPI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.9], [11.0, 12.93], [13.0, 14.39], [15.0, 16.06], [26.0, 26.28], [28.0, 32.19], [35.0, 35.72], [45.0, 45.28], [45.0, 51.21], [52.0, 63.8], [69.0, 68.69], [71.0, 71.39], [77.0, 77.5], [79.0, 79.83], [83.0, 83.51], [86.0, 86.43], [107.0, 107.18], [117.0, 120.51], [121.0, 121.66]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [63.42, 0.0, 0.0, 0.0, 0.0, 29.48, 0.0, 0.0, 29.41, 29.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.42, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 82.4], ["music", 4.37], ["outside, rural or natural", 1.88]], null, null, [["music", 41.99], ["speech", 23.43], ["explosion", 5.71]], [["whack, thwack", 30.53], ["breaking", 7.57], ["livestock, farm animals, working animals", 7.44]], null, null, null, null, null, null, null, [["mains hum", 38.87], ["hum", 32.14], ["music", 15.75]], null], "duration": [3.9, 1.93, 1.39, 1.06, 0.28, 4.19, 0.72, 0.28, 6.21, 11.8, -0.31, 0.39, 0.5, 0.83, 0.51, 0.43, 0.18, 3.51, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/vn-PJRh_nFQ_filtered.json b/annotations_filtered/vn-PJRh_nFQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9641036da505392d0609160eb5df7fc3550fa13 --- /dev/null +++ b/annotations_filtered/vn-PJRh_nFQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.64], [11.0, 11.55], [20.0, 25.12], [30.0, 30.48], [34.0, 35.77], [39.0, 43.56], [47.0, 53.7], [64.0, 99.1], [100.0, 106.34], [110.0, 111.21], [114.0, 115.33], [117.0, 118.64], [120.0, 122.69], [125.0, 125.74], [127.0, 129.19], [130.0, 132.0], [133.0, 133.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.22, 0.0, 34.04, 0.0, 0.0, 94.66, 37.98, 0.0, 83.7, 0.0, 0.0, 0.0, 99.92, 0.0, 100.0, 96.89, 0.0], "audiomae_on_audioset": [null, null, [["music", 57.73], ["boing", 8.66], ["pizzicato", 4.6]], null, null, null, [["music", 74.6], ["musical instrument", 3.38], ["keyboard (musical)", 2.46]], null, null, null, null, null, null, null, null, null, null], "duration": [5.64, 0.55, 5.12, 0.48, 1.77, 4.56, 6.7, 35.1, 6.34, 1.21, 1.33, 1.64, 2.69, 0.74, 2.19, 2.0, 0.86]} \ No newline at end of file diff --git a/annotations_filtered/vn6qlQGDOIo_filtered.json b/annotations_filtered/vn6qlQGDOIo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80d8dad5c71801fa46f9aa8673cf1cd5b28e8f70 --- /dev/null +++ b/annotations_filtered/vn6qlQGDOIo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.97], [8.0, 8.61], [10.0, 12.93], [13.0, 14.5], [16.0, 20.53], [21.0, 27.33], [29.0, 30.82], [31.0, 31.4], [42.0, 44.46], [46.0, 47.38], [49.0, 49.92], [50.0, 51.51], [53.0, 54.23], [55.0, 59.91], [61.0, 64.69], [67.0, 67.12], [69.0, 68.82], [69.0, 71.41], [72.0, 74.82], [76.0, 81.01], [82.0, 83.39], [85.0, 88.32], [89.0, 90.56], [93.0, 93.46], [94.0, 97.04], [98.0, 101.14], [101.0, 104.31], [106.0, 108.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 51.82, 0.0, 83.16, 58.72, 0.0, 0.0, 73.82, 0.0, 0.0, 0.0, 0.0, 86.64, 75.07, 0.0, 0.0, 32.22, 61.87, 68.15, 0.0, 73.67, 0.0, 0.0, 74.44, 78.21, 60.42, 48.48], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 67.05], ["hum", 13.61], ["buzz", 2.58]], null, null, null, null, null, null, null, null, null, [["hum", 29.49], ["mains hum", 27.6], ["music", 5.34]]], "duration": [-0.03, 0.61, 2.93, 1.5, 4.53, 6.33, 1.82, 0.4, 2.46, 1.38, 0.92, 1.51, 1.23, 4.91, 3.69, 0.12, -0.18, 2.41, 2.82, 5.01, 1.39, 3.32, 1.56, 0.46, 3.04, 3.14, 3.31, 2.38]} \ No newline at end of file diff --git a/annotations_filtered/vn8YIDxEGrw_filtered.json b/annotations_filtered/vn8YIDxEGrw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d7867edaf1ff151f1e1f0e4f4b5c3889f34963b --- /dev/null +++ b/annotations_filtered/vn8YIDxEGrw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.52], [15.0, 16.34], [18.0, 19.03], [19.0, 21.47], [23.0, 23.33], [24.0, 43.65], [47.0, 54.65], [56.0, 56.66], [57.0, 58.41], [59.0, 59.88], [60.0, 60.61], [61.0, 62.26], [63.0, 84.21], [85.0, 85.33], [87.0, 87.05], [87.0, 98.79], [99.0, 100.31], [101.0, 101.71], [102.0, 101.95], [102.0, 105.97], [108.0, 128.29], [129.0, 129.81], [130.0, 136.07], [137.0, 141.96], [143.0, 146.67], [148.0, 163.61], [164.0, 165.0], [166.0, 177.47], [178.0, 180.77], [184.0, 195.34]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, true, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 36.72, 0.0, 32.77, 41.58, 0.0, 0.0, 0.0, 0.0, 0.0, 36.72, 0.0, 0.0, 33.05, 0.0, 0.0, 0.0, 36.63, 41.72, 0.0, 40.73, 63.21, 58.22, 48.23, 0.0, 33.63, 42.51, 35.42], "audiomae_on_audioset": [null, null, null, [["moo", 15.19], ["cattle, bovinae", 14.27], ["speech", 10.06]], null, [["explosion", 16.94], ["speech", 13.74], ["boom", 10.96]], [["hum", 34.78], ["rumble", 34.09], ["mains hum", 7.51]], null, null, null, null, null, [["music", 27.62], ["whale vocalization", 7.05], ["buzz", 6.36]], null, null, [["whack, thwack", 20.4], ["music", 16.11], ["hum", 11.14]], null, null, null, [["speech", 41.28], ["whale vocalization", 21.81], ["music", 11.16]], [["singing bowl", 29.16], ["speech", 26.53], ["rumble", 12.67]], null, [["hum", 36.16], ["mains hum", 30.72], ["speech", 14.24]], null, null, [["music", 62.6], ["electronic music", 4.78], ["hum", 4.36]], null, [["speech", 49.93], ["mains hum", 11.85], ["hum", 9.77]], [["hiccup", 21.18], ["rumble", 19.71], ["heart sounds, heartbeat", 5.76]], [["didgeridoo", 50.22], ["music", 20.86], ["speech", 11.08]]], "duration": [1.52, 1.34, 1.03, 2.47, 0.33, 19.65, 7.65, 0.66, 1.41, 0.88, 0.61, 1.26, 21.21, 0.33, 0.05, 11.79, 1.31, 0.71, -0.05, 3.97, 20.29, 0.81, 6.07, 4.96, 3.67, 15.61, 1.0, 11.47, 2.77, 11.34]} \ No newline at end of file diff --git a/annotations_filtered/vn9awsg8BjA_filtered.json b/annotations_filtered/vn9awsg8BjA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9afd8aac5461ff8fcb118a21d93be111f60a28e --- /dev/null +++ b/annotations_filtered/vn9awsg8BjA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 14.84], [16.0, 20.24], [21.0, 32.0], [35.0, 37.29], [41.0, 50.26], [52.0, 54.19], [59.0, 59.24], [60.0, 73.79], [77.0, 139.8], [141.0, 147.46], [148.0, 153.33], [157.0, 157.18], [158.0, 158.94], [159.0, 159.87], [162.0, 163.71], [165.0, 172.39], [173.0, 177.35]], "keep_status": [false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 48.44, 40.86, 38.42, 35.49, 38.8, 0.0, 33.37, 0.0, 63.53, 46.86, 0.0, 0.0, 0.0, 0.0, 79.41, 61.67], "audiomae_on_audioset": [null, [["music", 54.46], ["musical instrument", 4.85], ["synthesizer", 3.28]], [["music", 79.59], ["didgeridoo", 5.33], ["synthesizer", 3.91]], [["music", 68.05], ["synthesizer", 8.84], ["throbbing", 3.08]], [["music", 24.58], ["synthesizer", 23.61], ["throbbing", 14.08]], [["music", 41.25], ["throbbing", 17.78], ["speech", 6.13]], null, [["music", 48.86], ["synthesizer", 29.72], ["sampler", 4.28]], null, null, [["speech", 41.54], ["music", 23.81], ["hum", 8.69]], null, null, null, null, null, null], "duration": [-0.16, 4.24, 11.0, 2.29, 9.26, 2.19, 0.24, 13.79, 62.8, 6.46, 5.33, 0.18, 0.94, 0.87, 1.71, 7.39, 4.35]} \ No newline at end of file diff --git a/annotations_filtered/vnL8uiqp6_k_filtered.json b/annotations_filtered/vnL8uiqp6_k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a86830ef2105ebe0d143296307e94209cc08b797 --- /dev/null +++ b/annotations_filtered/vnL8uiqp6_k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.0], [1.0, 1.12], [5.0, 6.12], [8.0, 8.09], [10.0, 10.91], [14.0, 20.36], [22.0, 23.23], [27.0, 28.54], [30.0, 31.78], [34.0, 43.21], [45.0, 48.91], [50.0, 51.0], [51.0, 52.0], [54.0, 57.72], [61.0, 66.77], [69.0, 72.37], [75.0, 79.73], [81.0, 80.86], [83.0, 91.05], [94.0, 112.45], [119.0, 125.78], [133.0, 134.69], [137.0, 139.31], [144.0, 144.91], [146.0, 148.66], [150.0, 157.86], [161.0, 162.11], [163.0, 165.84]], "keep_status": [false, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false, true, false, true, true, false, false, true, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 34.02, 0.0, 0.0, 0.0, 42.79, 45.72, 0.0, 0.0, 53.53, 52.05, 72.31, 49.36, 0.0, 48.14, 34.42, 31.18, 0.0, 43.87, 0.0, 41.89, 37.72, 0.0, 33.35], "audiomae_on_audioset": [null, null, null, null, null, [["music", 9.58], ["baby cry, infant cry", 8.55], ["speech", 7.37]], null, null, null, [["whimper", 19.95], ["baby cry, infant cry", 16.23], ["grunt", 9.75]], [["music", 32.48], ["baby cry, infant cry", 9.56], ["groan", 3.88]], null, null, null, null, null, [["cattle, bovinae", 12.48], ["moo", 11.88], ["livestock, farm animals, working animals", 11.47]], null, [["speech", 48.83], ["music", 16.66], ["crying, sobbing", 3.33]], [["music", 17.14], ["explosion", 12.76], ["artillery fire", 10.62]], [["music", 68.03], ["scary music", 5.89], ["soundtrack music", 4.48]], null, [["music", 58.14], ["singing bowl", 4.17], ["didgeridoo", 4.07]], null, [["music", 18.77], ["hum", 18.75], ["mains hum", 15.88]], [["music", 58.92], ["grunt", 17.26], ["groan", 2.98]], null, [["music", 30.43], ["fly, housefly", 6.81], ["whale vocalization", 6.26]]], "duration": [1.0, 0.12, 1.12, 0.09, 0.91, 6.36, 1.23, 1.54, 1.78, 9.21, 3.91, 1.0, 1.0, 3.72, 5.77, 3.37, 4.73, -0.14, 8.05, 18.45, 6.78, 1.69, 2.31, 0.91, 2.66, 7.86, 1.11, 2.84]} \ No newline at end of file diff --git a/annotations_filtered/vnQ9yD_IIwo_filtered.json b/annotations_filtered/vnQ9yD_IIwo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36fddf0a780f818f861d38bf18737eb1a866abbb --- /dev/null +++ b/annotations_filtered/vnQ9yD_IIwo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.72], [9.0, 13.85], [18.0, 19.2], [21.0, 22.91], [25.0, 31.33], [34.0, 41.99], [49.0, 76.25], [77.0, 77.85], [78.0, 80.25], [81.0, 82.8], [84.0, 86.26], [88.0, 89.94], [94.0, 104.82], [106.0, 108.01]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 94.52, 0.0, 0.0, 99.96, 39.33, 37.33, 0.0, 59.15, 0.0, 76.53, 0.0, 61.37, 70.16], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 61.55], ["sidetone", 6.94], ["hum", 3.08]], [["rain on surface", 14.16], ["eruption", 13.98], ["static", 13.58]], null, null, null, null, null, null, null], "duration": [0.72, 4.85, 1.2, 1.91, 6.33, 7.99, 27.25, 0.85, 2.25, 1.8, 2.26, 1.94, 10.82, 2.01]} \ No newline at end of file diff --git a/annotations_filtered/vndiMloYcYU_filtered.json b/annotations_filtered/vndiMloYcYU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02ccfc29f4f1f285356491126394446b89bb15de --- /dev/null +++ b/annotations_filtered/vndiMloYcYU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.38], [5.0, 6.05], [8.0, 9.05], [9.0, 10.05], [11.0, 15.74], [20.0, 21.14], [25.0, 25.59], [27.0, 28.59], [30.0, 30.81], [32.0, 34.35], [35.0, 40.31], [42.0, 42.55], [44.0, 45.13], [46.0, 46.08], [46.0, 47.71], [48.0, 50.28], [51.0, 55.68], [56.0, 57.03], [58.0, 59.46], [63.0, 84.13], [85.0, 86.44], [91.0, 96.7], [97.0, 99.22], [102.0, 101.85], [110.0, 110.37], [113.0, 118.45], [121.0, 122.52], [128.0, 128.61], [132.0, 132.41], [148.0, 150.13], [152.0, 156.2], [157.0, 157.76], [160.0, 160.69], [166.0, 168.54]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.01, 0.0, 0.0, 0.0, 0.0, 40.68, 44.72, 0.0, 0.0, 0.0, 0.0, 44.26, 71.0, 0.0, 0.0, 44.46, 0.0, 48.31, 48.1, 0.0, 0.0, 39.7, 0.0, 0.0, 0.0, 77.7, 51.44, 0.0, 0.0, 50.36], "audiomae_on_audioset": [null, null, null, null, [["whale vocalization", 80.33], ["animal", 2.81], ["roaring cats (lions, tigers)", 2.59]], null, null, null, null, [["speech", 42.55], ["music", 10.28], ["inside, small room", 2.88]], [["livestock, farm animals, working animals", 36.45], ["cattle, bovinae", 32.25], ["moo", 21.83]], null, null, null, null, [["speech", 75.14], ["inside, small room", 2.07], ["hum", 1.88]], null, null, null, [["coin (dropping)", 44.28], ["speech", 31.64], ["glass", 2.11]], null, [["speech", 72.68], ["music", 4.29], ["radio", 3.25]], [["fart", 18.25], ["speech", 13.31], ["music", 4.99]], null, null, [["fly, housefly", 31.85], ["mosquito", 24.97], ["speech", 11.07]], null, null, null, null, null, null, null, null], "duration": [1.38, 1.05, 1.05, 1.05, 4.74, 1.14, 0.59, 1.59, 0.81, 2.35, 5.31, 0.55, 1.13, 0.08, 1.71, 2.28, 4.68, 1.03, 1.46, 21.13, 1.44, 5.7, 2.22, -0.15, 0.37, 5.45, 1.52, 0.61, 0.41, 2.13, 4.2, 0.76, 0.69, 2.54]} \ No newline at end of file diff --git a/annotations_filtered/vnh7gxa0z4Q_filtered.json b/annotations_filtered/vnh7gxa0z4Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..836402df4bc0c5c39184851167e57f2df8344b92 --- /dev/null +++ b/annotations_filtered/vnh7gxa0z4Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.98], [11.0, 11.8], [33.0, 34.74], [35.0, 36.9], [39.0, 39.7], [41.0, 41.42], [66.0, 68.86], [75.0, 74.95], [77.0, 78.71], [79.0, 80.33], [84.0, 84.52], [85.0, 90.37], [96.0, 96.5], [98.0, 98.98], [102.0, 103.69], [104.0, 110.69], [112.0, 122.5], [126.0, 126.3], [128.0, 128.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.54, 0.0, 0.0, 0.0, 0.0, 29.97, 0.0, 0.0, 0.0, 29.74, 29.25, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 39.41], ["music", 20.06], ["vehicle", 12.18]], null, null, null, [["speech", 26.49], ["sidetone", 11.26], ["hum", 10.31]], [["speech", 69.58], ["music", 6.07], ["explosion", 1.71]], null, null], "duration": [-0.02, 0.8, 1.74, 1.9, 0.7, 0.42, 2.86, -0.05, 1.71, 1.33, 0.52, 5.37, 0.5, 0.98, 1.69, 6.69, 10.5, 0.3, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/vo0cUbT4Lh4_filtered.json b/annotations_filtered/vo0cUbT4Lh4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..304af0c9cdf064d5f73ea3be6da43a0528e1f727 --- /dev/null +++ b/annotations_filtered/vo0cUbT4Lh4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.82], [14.0, 14.18], [16.0, 16.9], [20.0, 20.17], [24.0, 24.88], [41.0, 41.4], [43.0, 44.9], [47.0, 48.96], [51.0, 51.29]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.82, 0.18, 0.9, 0.17, 0.88, 0.4, 1.9, 1.96, 0.29]} \ No newline at end of file diff --git a/annotations_filtered/voNs3aHZmQM_filtered.json b/annotations_filtered/voNs3aHZmQM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a29166513a4c51205373a1104901ca98424e219 --- /dev/null +++ b/annotations_filtered/voNs3aHZmQM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.48], [8.0, 9.44], [10.0, 12.06], [18.0, 19.82], [22.0, 22.59], [23.0, 24.19], [25.0, 26.1], [28.0, 28.86], [30.0, 31.38], [36.0, 39.83], [41.0, 43.07], [46.0, 46.45], [48.0, 48.95], [53.0, 55.14], [58.0, 58.13], [59.0, 60.49], [62.0, 62.83], [63.0, 64.99], [70.0, 69.87], [73.0, 73.45], [75.0, 76.27], [77.0, 79.05], [81.0, 83.27], [87.0, 89.19], [94.0, 94.9], [96.0, 96.72], [98.0, 99.76], [101.0, 101.41], [102.0, 104.03], [104.0, 105.33], [106.0, 108.24], [109.0, 114.71], [116.0, 115.94]], "keep_status": [true, false, true, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, true, false, true, false, false], "silence_prob": [45.49, 0.0, 48.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.29, 38.35, 0.0, 0.0, 50.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.33, 40.57, 38.88, 0.0, 0.0, 0.0, 0.0, 38.38, 0.0, 35.4, 34.93, 0.0], "audiomae_on_audioset": [[["music", 19.06], ["speech", 16.08], ["animal", 6.32]], null, [["music", 42.84], ["musical instrument", 6.13], ["speech", 4.92]], null, null, null, null, null, null, [["speech", 48.11], ["music", 6.28], ["cattle, bovinae", 5.74]], [["speech", 29.27], ["vehicle", 7.32], ["music", 6.62]], null, null, null, null, null, null, null, null, null, null, [["music", 56.7], ["speech", 4.48], ["theremin", 3.38]], [["speech", 20.81], ["whale vocalization", 20.35], ["music", 7.66]], [["music", 36.94], ["theremin", 12.95], ["speech", 6.36]], null, null, null, null, [["music", 31.48], ["whale vocalization", 15.35], ["theremin", 14.87]], null, [["music", 46.44], ["speech", 4.63], ["theremin", 3.51]], [["theremin", 48.0], ["music", 30.2], ["musical instrument", 2.52]], null], "duration": [3.48, 1.44, 2.06, 1.82, 0.59, 1.19, 1.1, 0.86, 1.38, 3.83, 2.07, 0.45, 0.95, 2.14, 0.13, 1.49, 0.83, 1.99, -0.13, 0.45, 1.27, 2.05, 2.27, 2.19, 0.9, 0.72, 1.76, 0.41, 2.03, 1.33, 2.24, 5.71, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/voYRf2GVXbc_filtered.json b/annotations_filtered/voYRf2GVXbc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e65ffa1c35ba061b2aabb57b0f6dcb75dee02c88 --- /dev/null +++ b/annotations_filtered/voYRf2GVXbc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.32], [9.0, 9.15], [15.0, 17.14], [20.0, 21.15], [27.0, 28.11], [33.0, 36.37], [37.0, 64.83], [67.0, 69.31], [70.0, 70.83]], "keep_status": [false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 98.01, 0.0, 0.0, 46.19, 44.99, 75.55, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 59.38], ["foghorn", 6.71], ["didgeridoo", 6.43]], [["music", 51.4], ["musical instrument", 6.81], ["cello", 6.11]], null, null], "duration": [0.32, 0.15, 2.14, 1.15, 1.11, 3.37, 27.83, 2.31, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/vozS5ppNzAM_filtered.json b/annotations_filtered/vozS5ppNzAM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c800b1e4e6621874dfd2c41599e92fb0adce194 --- /dev/null +++ b/annotations_filtered/vozS5ppNzAM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.42], [28.0, 52.89], [55.0, 55.86], [57.0, 59.02], [60.0, 61.8], [65.0, 66.99], [70.0, 77.06], [78.0, 80.84], [81.0, 81.5], [86.0, 87.12], [90.0, 100.25], [102.0, 103.05], [104.0, 109.21], [110.0, 112.14]], "keep_status": [false, false, false, true, false, false, true, false, false, false, true, false, true, false], "silence_prob": [0.0, 33.77, 0.0, 38.78, 0.0, 0.0, 31.93, 54.36, 0.0, 0.0, 33.9, 0.0, 33.2, 35.38], "audiomae_on_audioset": [null, [["speech", 56.59], ["sidetone", 9.14], ["hum", 4.53]], null, [["speech", 45.32], ["noise", 10.27], ["hum", 5.79]], null, null, [["hum", 20.08], ["mains hum", 11.49], ["fly, housefly", 9.0]], null, null, null, [["mains hum", 21.25], ["hum", 17.84], ["vibration", 7.47]], null, [["electric shaver, electric razor", 30.51], ["hum", 10.65], ["livestock, farm animals, working animals", 4.16]], [["hum", 35.73], ["mains hum", 34.08], ["throbbing", 9.3]]], "duration": [0.42, 24.89, 0.86, 2.02, 1.8, 1.99, 7.06, 2.84, 0.5, 1.12, 10.25, 1.05, 5.21, 2.14]} \ No newline at end of file diff --git a/annotations_filtered/vozjOGBUz2I_filtered.json b/annotations_filtered/vozjOGBUz2I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f06e6684fd38b72c8768246100b194d7ab9ba3cb --- /dev/null +++ b/annotations_filtered/vozjOGBUz2I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.29], [9.0, 10.74], [12.0, 14.84], [16.0, 17.9], [19.0, 19.72], [21.0, 21.24], [22.0, 22.2], [24.0, 31.06], [42.0, 45.25], [46.0, 46.28], [49.0, 50.19], [51.0, 53.0], [58.0, 58.02], [60.0, 61.15], [63.0, 63.07], [65.0, 65.92], [71.0, 73.35], [76.0, 76.67], [85.0, 88.91], [94.0, 97.93], [101.0, 101.49], [103.0, 103.55], [104.0, 104.87], [106.0, 106.59], [109.0, 112.18], [114.0, 114.79], [119.0, 119.6], [120.0, 120.29], [121.0, 121.64], [123.0, 123.09], [130.0, 129.95], [135.0, 135.28], [138.0, 141.13], [141.0, 141.69], [143.0, 143.18], [143.0, 143.99], [145.0, 149.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 74.76, 78.38, 0.0, 0.0, 55.67, 0.0, 0.0, 0.0, 0.0, 66.03, 0.0, 96.54, 99.68, 0.0, 0.0, 0.0, 0.0, 84.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.29, 0.0, 0.0, 0.0, 50.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.29, 1.74, 2.84, 1.9, 0.72, 0.24, 0.2, 7.06, 3.25, 0.28, 1.19, 2.0, 0.02, 1.15, 0.07, 0.92, 2.35, 0.67, 3.91, 3.93, 0.49, 0.55, 0.87, 0.59, 3.18, 0.79, 0.6, 0.29, 0.64, 0.09, -0.05, 0.28, 3.13, 0.69, 0.18, 0.99, 4.47]} \ No newline at end of file diff --git a/annotations_filtered/vp7r-h8OLm0_filtered.json b/annotations_filtered/vp7r-h8OLm0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..474d055e622acd92f64fb44c4c27255d393acefe --- /dev/null +++ b/annotations_filtered/vp7r-h8OLm0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.8], [6.0, 6.94], [14.0, 14.79], [26.0, 32.73], [34.0, 35.33], [37.0, 37.94], [39.0, 40.9], [43.0, 44.0], [47.0, 49.57], [53.0, 52.76], [56.0, 58.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.52, 0.0, 0.0, 96.77, 0.0, 0.0, 0.0, 0.0, 92.48, 0.0, 98.01], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [2.8, 0.94, 0.79, 6.73, 1.33, 0.94, 1.9, 1.0, 2.57, -0.24, 2.48]} \ No newline at end of file diff --git a/annotations_filtered/vpEAO0gIAxE_filtered.json b/annotations_filtered/vpEAO0gIAxE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48c740b66dd905fb6f85de300297c91f2d1c0d41 --- /dev/null +++ b/annotations_filtered/vpEAO0gIAxE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.59], [5.0, 6.39], [8.0, 12.77], [19.0, 21.83], [24.0, 26.76], [27.0, 29.13], [32.0, 34.77], [36.0, 39.29], [41.0, 44.91], [46.0, 48.12], [52.0, 55.29], [57.0, 59.49], [60.0, 62.99], [65.0, 66.7], [69.0, 69.53], [71.0, 72.79], [74.0, 78.8], [80.0, 84.45], [85.0, 90.51], [91.0, 95.22], [98.0, 100.82], [102.0, 105.87], [107.0, 110.37], [113.0, 116.5], [120.0, 123.21], [125.0, 126.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 92.31, 99.36, 99.78, 90.25, 99.97, 99.95, 86.82, 99.96, 99.99, 99.36, 75.55, 0.0, 0.0, 0.0, 97.43, 99.85, 99.76, 90.95, 99.93, 99.84, 99.94, 97.64, 82.61, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.59, 1.39, 4.77, 2.83, 2.76, 2.13, 2.77, 3.29, 3.91, 2.12, 3.29, 2.49, 2.99, 1.7, 0.53, 1.79, 4.8, 4.45, 5.51, 4.22, 2.82, 3.87, 3.37, 3.5, 3.21, 1.87]} \ No newline at end of file diff --git a/annotations_filtered/vpHEQqApoAY_filtered.json b/annotations_filtered/vpHEQqApoAY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0ab71425b440a136bc53ffa0d57fa0ae5e466d7 --- /dev/null +++ b/annotations_filtered/vpHEQqApoAY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.0], [3.0, 3.52], [6.0, 6.59], [7.0, 8.21], [10.0, 10.79], [13.0, 13.64], [16.0, 16.7], [21.0, 21.52], [27.0, 27.55], [44.0, 47.39], [49.0, 49.23], [51.0, 51.66], [53.0, 54.89], [59.0, 59.34], [60.0, 61.32], [63.0, 63.17], [66.0, 66.99], [69.0, 69.15], [70.0, 71.9], [73.0, 74.46], [82.0, 83.12], [87.0, 86.81], [88.0, 88.75], [91.0, 92.47], [96.0, 96.01], [99.0, 99.28]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["didgeridoo", 35.94], ["dog", 10.44], ["animal", 8.45]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 0.52, 0.59, 1.21, 0.79, 0.64, 0.7, 0.52, 0.55, 3.39, 0.23, 0.66, 1.89, 0.34, 1.32, 0.17, 0.99, 0.15, 1.9, 1.46, 1.12, -0.19, 0.75, 1.47, 0.01, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/vpir9eGi8Mk_filtered.json b/annotations_filtered/vpir9eGi8Mk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e18db05a2bc43bcfbb65d13fd6391a6c040d5c99 --- /dev/null +++ b/annotations_filtered/vpir9eGi8Mk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 39.8], [42.0, 45.3], [49.0, 56.69], [58.0, 62.58], [65.0, 73.11], [74.0, 80.94], [82.0, 104.58], [109.0, 122.88], [126.0, 134.47], [143.0, 163.95], [165.0, 166.29]], "keep_status": [true, true, false, true, false, false, true, false, false, true, false], "silence_prob": [31.49, 31.04, 43.08, 47.39, 51.39, 47.5, 48.31, 43.64, 54.17, 32.58, 0.0], "audiomae_on_audioset": [[["music", 11.78], ["mains hum", 9.95], ["cacophony", 8.15]], [["music", 53.34], ["eruption", 5.26], ["musical instrument", 3.15]], [["music", 37.77], ["mains hum", 19.99], ["hum", 16.59]], [["music", 31.86], ["hum", 23.3], ["mains hum", 14.65]], null, [["music", 43.0], ["speech", 25.64], ["hum", 6.18]], [["music", 50.72], ["hum", 12.06], ["mains hum", 4.97]], [["music", 50.91], ["didgeridoo", 18.2], ["theremin", 6.29]], null, [["music", 52.85], ["throbbing", 6.16], ["percussion", 4.26]], null], "duration": [5.8, 3.3, 7.69, 4.58, 8.11, 6.94, 22.58, 13.88, 8.47, 20.95, 1.29]} \ No newline at end of file diff --git a/annotations_filtered/vpqzFo0aD0c_filtered.json b/annotations_filtered/vpqzFo0aD0c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77d25f4bfe0d7c4c5b28859d41900657d6c5b567 --- /dev/null +++ b/annotations_filtered/vpqzFo0aD0c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.52], [13.0, 13.42], [14.0, 14.55], [36.0, 36.44], [42.0, 42.67], [47.0, 47.61], [50.0, 49.86], [59.0, 59.54], [62.0, 62.14], [66.0, 66.23], [69.0, 69.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.52, 0.42, 0.55, 0.44, 0.67, 0.61, -0.14, 0.54, 0.14, 0.23, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/vq0OqfmArnY_filtered.json b/annotations_filtered/vq0OqfmArnY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22508c67198f566d0cc0060e871f8cef87ff98b8 --- /dev/null +++ b/annotations_filtered/vq0OqfmArnY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 32.02], [34.0, 95.37], [99.0, 99.27], [100.0, 100.95], [101.0, 102.91], [103.0, 104.45], [105.0, 108.13], [109.0, 111.57], [113.0, 114.05], [115.0, 121.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.01, 78.21, 0.0, 75.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [31.02, 61.37, 0.27, 0.95, 1.91, 1.45, 3.13, 2.57, 1.05, 6.98]} \ No newline at end of file diff --git a/annotations_filtered/vq6ofw0hqkU_filtered.json b/annotations_filtered/vq6ofw0hqkU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48e25f24deb1d84d482c721fe0fa1b2a97fe30ce --- /dev/null +++ b/annotations_filtered/vq6ofw0hqkU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.31], [13.0, 13.78], [18.0, 18.87], [21.0, 22.72], [24.0, 30.4], [34.0, 43.8], [45.0, 50.41], [54.0, 54.4], [56.0, 56.02], [63.0, 63.09], [68.0, 69.03], [70.0, 72.37], [74.0, 75.63], [81.0, 81.43], [84.0, 85.04], [86.0, 88.15], [89.0, 89.87], [96.0, 98.05], [100.0, 101.19], [103.0, 104.21], [106.0, 111.15], [112.0, 115.89], [116.0, 119.85], [122.0, 122.59], [124.0, 125.56], [127.0, 128.43], [129.0, 131.09]], "keep_status": [false, false, false, false, true, true, true, false, false, false, false, true, false, false, false, true, false, true, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.38, 35.01, 33.96, 0.0, 0.0, 0.0, 0.0, 32.87, 0.0, 0.0, 0.0, 42.28, 0.0, 44.6, 0.0, 0.0, 41.6, 53.28, 46.61, 0.0, 0.0, 0.0, 42.0], "audiomae_on_audioset": [null, null, null, null, [["noise", 18.17], ["fly, housefly", 11.17], ["breaking", 6.52]], [["breaking", 27.35], ["music", 25.36], ["speech", 14.37]], [["hum", 40.33], ["throbbing", 15.12], ["mains hum", 9.36]], null, null, null, null, [["whale vocalization", 47.07], ["hum", 13.39], ["throbbing", 5.63]], null, null, null, [["hum", 27.7], ["mains hum", 19.4], ["speech", 12.64]], null, [["speech", 32.78], ["mains hum", 19.91], ["hum", 8.64]], null, null, [["hum", 32.46], ["mains hum", 20.27], ["speech", 15.64]], null, [["mains hum", 32.67], ["hum", 29.7], ["music", 9.22]], null, null, null, [["mains hum", 18.58], ["music", 17.6], ["hum", 13.72]]], "duration": [1.31, 0.78, 0.87, 1.72, 6.4, 9.8, 5.41, 0.4, 0.02, 0.09, 1.03, 2.37, 1.63, 0.43, 1.04, 2.15, 0.87, 2.05, 1.19, 1.21, 5.15, 3.89, 3.85, 0.59, 1.56, 1.43, 2.09]} \ No newline at end of file diff --git a/annotations_filtered/vq8OmtyOsR8_filtered.json b/annotations_filtered/vq8OmtyOsR8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1a73a750dfcab4ae95d0358e686b56ab2103373 --- /dev/null +++ b/annotations_filtered/vq8OmtyOsR8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.51], [6.0, 7.01], [9.0, 10.34], [18.0, 21.42], [22.0, 24.44], [33.0, 36.26], [47.0, 46.8], [55.0, 56.4], [58.0, 60.67], [65.0, 65.2], [76.0, 75.78], [94.0, 97.48], [111.0, 116.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.9, 0.0, 0.0, 93.91, 61.87, 59.96, 0.0, 0.0, 80.46, 0.0, 0.0, 90.95, 56.03], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.51, 1.01, 1.34, 3.42, 2.44, 3.26, -0.2, 1.4, 2.67, 0.2, -0.22, 3.48, 5.95]} \ No newline at end of file diff --git a/annotations_filtered/vqOByzMoS_A_filtered.json b/annotations_filtered/vqOByzMoS_A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e06dd684f21d62eccc9f17efd67b0ae6ac09fe58 --- /dev/null +++ b/annotations_filtered/vqOByzMoS_A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.54], [6.0, 6.45], [7.0, 12.26], [13.0, 13.46], [24.0, 24.27], [35.0, 36.48], [38.0, 38.23], [39.0, 40.22], [41.0, 42.36], [43.0, 43.9], [47.0, 47.46], [51.0, 51.9], [53.0, 54.58], [55.0, 57.59], [58.0, 58.92], [62.0, 63.05], [66.0, 66.43], [67.0, 67.51], [73.0, 73.31], [75.0, 75.61], [78.0, 78.68], [80.0, 81.03], [89.0, 96.96], [99.0, 100.43], [105.0, 105.87], [111.0, 111.84], [114.0, 114.94], [115.0, 116.67], [117.0, 118.62], [119.0, 119.21], [120.0, 127.18], [128.0, 128.49], [129.0, 129.51], [130.0, 130.62], [132.0, 133.69], [134.0, 139.62], [141.0, 143.61], [148.0, 148.15], [151.0, 151.38], [152.0, 152.69], [154.0, 154.3], [155.0, 159.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.86, 0.0, 0.0, 0.0, 0.0, 45.46, 58.55, 0.0, 0.0, 0.0, 0.0, 97.73], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.92], ["effects unit", 13.21], ["echo", 7.1]], null, null, null, null, [["music", 40.16], ["theremin", 9.44], ["musical instrument", 7.53]], null, null, null, null, null, null], "duration": [0.54, 0.45, 5.26, 0.46, 0.27, 1.48, 0.23, 1.22, 1.36, 0.9, 0.46, 0.9, 1.58, 2.59, 0.92, 1.05, 0.43, 0.51, 0.31, 0.61, 0.68, 1.03, 7.96, 1.43, 0.87, 0.84, 0.94, 1.67, 1.62, 0.21, 7.18, 0.49, 0.51, 0.62, 1.69, 5.62, 2.61, 0.15, 0.38, 0.69, 0.3, 4.75]} \ No newline at end of file diff --git a/annotations_filtered/vqPT1IbJrX8_filtered.json b/annotations_filtered/vqPT1IbJrX8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..baca081c213eed6b1546859a54209b68216fa80d --- /dev/null +++ b/annotations_filtered/vqPT1IbJrX8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.1], [15.0, 17.83], [19.0, 21.71], [22.0, 23.75], [27.0, 30.03], [31.0, 31.83], [39.0, 39.9], [43.0, 44.78], [47.0, 47.17], [52.0, 60.39], [63.0, 63.56], [67.0, 67.02], [72.0, 72.06], [73.0, 74.01], [74.0, 76.0], [80.0, 80.27], [82.0, 82.8], [85.0, 86.95], [88.0, 105.53], [107.0, 107.67], [108.0, 112.01], [114.0, 114.76], [117.0, 120.02], [123.0, 128.04], [130.0, 132.33], [133.0, 140.88], [145.0, 145.42], [146.0, 152.49], [158.0, 159.83], [162.0, 165.5], [168.0, 169.59], [176.0, 175.91], [180.0, 191.69], [192.0, 194.07], [195.0, 201.5], [202.0, 203.1], [204.0, 206.83], [209.0, 211.3], [214.0, 215.97], [219.0, 221.91], [229.0, 230.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, true, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 36.06, 56.4, 0.0, 72.16, 0.0, 0.0, 0.0, 0.0, 71.57, 0.0, 0.0, 0.0, 0.0, 48.78, 0.0, 0.0, 0.0, 34.62, 0.0, 33.48, 0.0, 30.79, 30.11, 37.34, 36.53, 0.0, 32.97, 0.0, 37.27, 0.0, 0.0, 34.68, 56.25, 52.39, 0.0, 85.17, 82.25, 0.0, 43.58, 0.0], "audiomae_on_audioset": [null, [["music", 35.6], ["speech", 30.6], ["hum", 4.08]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.03], ["speech", 13.41], ["synthesizer", 8.85]], null, null, null, [["music", 29.45], ["speech", 23.85], ["buzz", 7.79]], null, [["music", 23.23], ["hum", 21.63], ["throbbing", 21.41]], null, [["speech", 20.89], ["music", 12.33], ["electric shaver, electric razor", 3.81]], [["speech", 31.74], ["mains hum", 18.74], ["electric shaver, electric razor", 9.93]], [["music", 45.47], ["speech", 17.74], ["carnatic music", 7.37]], [["speech", 71.38], ["music", 5.92], ["explosion", 1.21]], null, [["music", 49.4], ["musical instrument", 6.04], ["didgeridoo", 5.54]], null, [["music", 46.41], ["speech", 9.11], ["electronic music", 7.54]], null, null, [["throbbing", 40.42], ["hum", 37.31], ["music", 10.18]], null, null, null, null, null, null, [["hum", 36.71], ["speech", 11.79], ["mains hum", 11.38]], null], "duration": [1.1, 2.83, 2.71, 1.75, 3.03, 0.83, 0.9, 1.78, 0.17, 8.39, 0.56, 0.02, 0.06, 1.01, 2.0, 0.27, 0.8, 1.95, 17.53, 0.67, 4.01, 0.76, 3.02, 5.04, 2.33, 7.88, 0.42, 6.49, 1.83, 3.5, 1.59, -0.09, 11.69, 2.07, 6.5, 1.1, 2.83, 2.3, 1.97, 2.91, 1.66]} \ No newline at end of file diff --git a/annotations_filtered/vqlURGjq4AM_filtered.json b/annotations_filtered/vqlURGjq4AM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5eb3fb05b5bf88191e09d487661ffc73e24498b8 --- /dev/null +++ b/annotations_filtered/vqlURGjq4AM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.13], [5.0, 6.29], [6.0, 8.02], [9.0, 11.82], [13.0, 13.54], [18.0, 19.13], [20.0, 21.29], [23.0, 24.04], [28.0, 28.31], [29.0, 31.11], [38.0, 41.4], [44.0, 45.66], [47.0, 47.58], [51.0, 52.05], [54.0, 53.92], [56.0, 58.28], [60.0, 60.66], [61.0, 62.14], [63.0, 68.34], [70.0, 71.52], [76.0, 77.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 82.07, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.98, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.13, 1.29, 2.02, 2.82, 0.54, 1.13, 1.29, 1.04, 0.31, 2.11, 3.4, 1.66, 0.58, 1.05, -0.08, 2.28, 0.66, 1.14, 5.34, 1.52, 1.97]} \ No newline at end of file diff --git a/annotations_filtered/vqqGZBRBLcM_filtered.json b/annotations_filtered/vqqGZBRBLcM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d48d71e90078261fe2ae9594f0c8e06e4b237aa --- /dev/null +++ b/annotations_filtered/vqqGZBRBLcM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.78], [11.0, 15.23], [16.0, 16.95], [21.0, 21.37], [22.0, 22.98], [28.0, 27.77], [29.0, 30.06], [36.0, 38.77], [43.0, 43.93], [48.0, 48.49], [55.0, 56.94], [60.0, 60.94], [71.0, 70.93], [72.0, 72.82], [76.0, 76.69], [77.0, 78.68], [82.0, 82.97], [83.0, 84.3], [86.0, 86.17], [89.0, 89.92], [91.0, 91.32], [92.0, 93.7], [95.0, 96.85], [101.0, 101.6], [103.0, 103.59], [104.0, 104.57], [106.0, 107.11], [108.0, 107.89], [113.0, 113.86], [115.0, 116.6], [119.0, 120.02], [120.0, 121.95], [124.0, 126.08], [126.0, 126.49], [127.0, 127.33]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 29.85, 0.0, 0.0, 0.0, 0.0, 0.0, 32.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.57, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 67.36], ["throbbing", 10.97], ["hum", 4.19]], null, null, null, null, null, [["explosion", 26.22], ["speech", 19.75], ["music", 9.43]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.22, 4.23, 0.95, 0.37, 0.98, -0.23, 1.06, 2.77, 0.93, 0.49, 1.94, 0.94, -0.07, 0.82, 0.69, 1.68, 0.97, 1.3, 0.17, 0.92, 0.32, 1.7, 1.85, 0.6, 0.59, 0.57, 1.11, -0.11, 0.86, 1.6, 1.02, 1.95, 2.08, 0.49, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/vqxbLAcIgiw_filtered.json b/annotations_filtered/vqxbLAcIgiw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b53e993f0c92c241ffc683b1032a63d93d2517f3 --- /dev/null +++ b/annotations_filtered/vqxbLAcIgiw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 13.37], [24.0, 24.7], [39.0, 39.51], [41.0, 59.1]], "keep_status": [false, false, false, true], "silence_prob": [30.89, 0.0, 0.0, 28.78], "audiomae_on_audioset": [[["hum", 44.15], ["mains hum", 32.87], ["throbbing", 10.07]], null, null, [["music", 22.7], ["speech", 16.57], ["ding", 10.64]]], "duration": [8.37, 0.7, 0.51, 18.1]} \ No newline at end of file diff --git a/annotations_filtered/vr2jJkcTcxk_filtered.json b/annotations_filtered/vr2jJkcTcxk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fdff62e0c6961f4f97a27ff797329f9dbd97a63 --- /dev/null +++ b/annotations_filtered/vr2jJkcTcxk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 18.22], [19.0, 20.01], [21.0, 23.19], [24.0, 24.95], [26.0, 26.35], [29.0, 29.12], [30.0, 31.68], [32.0, 34.64], [37.0, 37.84], [38.0, 39.75], [41.0, 42.72], [44.0, 44.66], [45.0, 46.9], [49.0, 51.22], [53.0, 55.58], [57.0, 58.4], [60.0, 63.1], [65.0, 66.12], [67.0, 68.12], [74.0, 75.59], [79.0, 79.15], [79.0, 83.27], [86.0, 86.91], [87.0, 87.66], [89.0, 89.43], [91.0, 95.42], [96.0, 96.4], [97.0, 98.09], [100.0, 100.62], [102.0, 106.08], [107.0, 108.18], [112.0, 115.72], [117.0, 122.98], [124.0, 125.1]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.64, 0.0, 76.53, 0.0, 0.0, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 0.0, 62.27, 60.79, 0.0, 77.87, 0.0, 0.0, 0.0, 0.0, 39.35, 0.0, 0.0, 0.0, 77.7, 0.0, 0.0, 0.0, 85.35, 0.0, 57.56, 33.11, 0.0], "audiomae_on_audioset": [[["hum", 25.65], ["thunk", 21.15], ["throbbing", 7.76]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 70.42], ["speech synthesizer", 13.82], ["radio", 3.28]], null, null, null, null, null, null, null, null, null, null, [["music", 65.45], ["throbbing", 5.13], ["synthesizer", 4.29]], null], "duration": [7.22, 1.01, 2.19, 0.95, 0.35, 0.12, 1.68, 2.64, 0.84, 1.75, 1.72, 0.66, 1.9, 2.22, 2.58, 1.4, 3.1, 1.12, 1.12, 1.59, 0.15, 4.27, 0.91, 0.66, 0.43, 4.42, 0.4, 1.09, 0.62, 4.08, 1.18, 3.72, 5.98, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/vrCmp9js4YI_filtered.json b/annotations_filtered/vrCmp9js4YI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a9a46cb2810b0fdfa01c3462090626aa7917296 --- /dev/null +++ b/annotations_filtered/vrCmp9js4YI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.69], [6.0, 6.57], [22.0, 22.35], [30.0, 31.26], [32.0, 33.42], [40.0, 39.77], [44.0, 44.71], [49.0, 50.43], [55.0, 56.35], [57.0, 57.43], [81.0, 82.21], [82.0, 82.85], [84.0, 86.24], [87.0, 88.96], [93.0, 95.61], [96.0, 96.57], [99.0, 100.41], [104.0, 104.41], [106.0, 108.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0, 99.31, 0.0, 0.0, 0.0, 99.68], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.69, 0.57, 0.35, 1.26, 1.42, -0.23, 0.71, 1.43, 1.35, 0.43, 1.21, 0.85, 2.24, 1.96, 2.61, 0.57, 1.41, 0.41, 2.46]} \ No newline at end of file diff --git a/annotations_filtered/vrEjev5DoXc_filtered.json b/annotations_filtered/vrEjev5DoXc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cedc7d461fbf25bbfb92c03e97c4bcca02a6be93 --- /dev/null +++ b/annotations_filtered/vrEjev5DoXc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.67], [6.0, 7.84], [10.0, 11.38], [13.0, 13.47], [15.0, 16.06], [17.0, 18.15], [22.0, 23.03], [24.0, 25.84], [26.0, 27.31], [30.0, 30.75], [33.0, 74.88], [76.0, 76.84], [78.0, 81.43], [85.0, 85.72], [89.0, 92.5], [95.0, 96.43], [99.0, 100.31], [102.0, 105.29], [108.0, 113.59], [116.0, 121.8], [124.0, 130.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.42, 0.0, 34.46, 0.0, 0.0, 33.77, 34.57, 30.02, 28.96], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 41.49], ["hum", 24.06], ["music", 9.5]], null, [["sidetone", 36.63], ["speech", 16.21], ["mains hum", 12.51]], null, null, [["music", 34.44], ["hum", 14.07], ["breaking", 12.88]], [["music", 49.77], ["throbbing", 15.23], ["hum", 11.69]], [["music", 43.96], ["hum", 17.66], ["throbbing", 13.21]], [["music", 50.7], ["hum", 8.85], ["mains hum", 7.9]]], "duration": [0.67, 1.84, 1.38, 0.47, 1.06, 1.15, 1.03, 1.84, 1.31, 0.75, 41.88, 0.84, 3.43, 0.72, 3.5, 1.43, 1.31, 3.29, 5.59, 5.8, 6.27]} \ No newline at end of file diff --git a/annotations_filtered/vrVDJcw40BU_filtered.json b/annotations_filtered/vrVDJcw40BU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7c755f338251f199417640c8adf900905780748 --- /dev/null +++ b/annotations_filtered/vrVDJcw40BU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.33], [11.0, 11.26], [14.0, 14.27], [16.0, 16.65], [17.0, 18.13], [25.0, 26.27], [32.0, 31.85], [35.0, 35.88], [42.0, 41.96], [42.0, 42.85], [46.0, 46.77], [47.0, 47.46], [51.0, 51.49], [52.0, 53.18], [54.0, 54.48], [59.0, 59.22], [72.0, 73.36], [89.0, 89.18], [90.0, 91.3], [92.0, 92.84], [98.0, 98.64], [105.0, 105.43], [114.0, 114.74], [123.0, 123.01], [124.0, 124.36], [155.0, 155.04], [156.0, 156.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.33, 0.26, 0.27, 0.65, 1.13, 1.27, -0.15, 0.88, -0.04, 0.85, 0.77, 0.46, 0.49, 1.18, 0.48, 0.22, 1.36, 0.18, 1.3, 0.84, 0.64, 0.43, 0.74, 0.01, 0.36, 0.04, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/vrhgkmAzWvo_filtered.json b/annotations_filtered/vrhgkmAzWvo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc3201a3b5835ffe57a15678687a6f51e2ab3f14 --- /dev/null +++ b/annotations_filtered/vrhgkmAzWvo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.36], [18.0, 18.62], [33.0, 33.45], [49.0, 53.13], [55.0, 61.37], [62.0, 63.85], [66.0, 67.54], [82.0, 83.19], [87.0, 90.37], [92.0, 93.72], [95.0, 95.67], [97.0, 97.73], [100.0, 101.83], [107.0, 107.91], [108.0, 109.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 65.2, 72.46, 0.0, 0.0, 0.0, 94.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.36, 0.62, 0.45, 4.13, 6.37, 1.85, 1.54, 1.19, 3.37, 1.72, 0.67, 0.73, 1.83, 0.91, 1.88]} \ No newline at end of file diff --git a/annotations_filtered/vrujU3pc7-U_filtered.json b/annotations_filtered/vrujU3pc7-U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dcf5fe218ba4800e3ea2a922649837129b6b54bc --- /dev/null +++ b/annotations_filtered/vrujU3pc7-U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 29.24], [33.0, 34.75], [36.0, 39.53], [41.0, 41.64], [53.0, 53.92], [60.0, 68.74], [71.0, 73.08], [78.0, 80.38], [83.0, 85.19]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 62.37, 0.0, 0.0, 48.95, 54.36, 53.78, 61.77], "audiomae_on_audioset": [null, null, null, null, null, [["music", 83.0], ["ambient music", 3.7], ["theremin", 3.1]], null, null, null], "duration": [1.24, 1.75, 3.53, 0.64, 0.92, 8.74, 2.08, 2.38, 2.19]} \ No newline at end of file diff --git a/annotations_filtered/vsBwRV2b3LY_filtered.json b/annotations_filtered/vsBwRV2b3LY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3c9258d190bc93af129c282548ac49f12f4703b --- /dev/null +++ b/annotations_filtered/vsBwRV2b3LY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 23.3], [26.0, 26.3], [30.0, 31.09], [32.0, 32.56], [53.0, 53.42], [56.0, 56.44], [61.0, 61.33], [68.0, 68.69], [71.0, 70.73], [72.0, 73.21], [80.0, 81.53], [88.0, 88.97], [90.0, 90.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 83.62], ["musical instrument", 3.96], ["sampler", 1.2]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [20.3, 0.3, 1.09, 0.56, 0.42, 0.44, 0.33, 0.69, -0.27, 1.21, 1.53, 0.97, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/vsQak7aKH30_filtered.json b/annotations_filtered/vsQak7aKH30_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1725cfaac4c3ff862f095e798aff17a3dee42b8 --- /dev/null +++ b/annotations_filtered/vsQak7aKH30_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.64], [6.0, 6.45], [8.0, 9.17], [15.0, 15.2], [20.0, 21.25], [23.0, 23.89], [25.0, 26.45], [29.0, 29.17], [38.0, 38.64], [55.0, 55.31], [77.0, 78.0], [87.0, 87.45], [103.0, 104.26], [117.0, 118.02], [124.0, 124.65], [125.0, 133.78], [134.0, 134.59], [135.0, 138.18], [140.0, 140.76], [142.0, 142.2], [144.0, 145.08], [150.0, 150.3], [156.0, 156.02], [157.0, 157.86], [159.0, 163.76], [165.0, 165.35], [166.0, 166.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.15, 0.0, 99.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.64, 0.45, 1.17, 0.2, 1.25, 0.89, 1.45, 0.17, 0.64, 0.31, 1.0, 0.45, 1.26, 1.02, 0.65, 8.78, 0.59, 3.18, 0.76, 0.2, 1.08, 0.3, 0.02, 0.86, 4.76, 0.35, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/vsU27J8K3Tw_filtered.json b/annotations_filtered/vsU27J8K3Tw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48e8bb97c11485c63738e6403515dc3837aba84c --- /dev/null +++ b/annotations_filtered/vsU27J8K3Tw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[58.0, 66.33], [67.0, 75.68], [77.0, 78.73], [79.0, 81.63], [83.0, 85.41], [87.0, 89.01]], "keep_status": [false, true, false, false, true, false], "silence_prob": [50.06, 48.61, 0.0, 51.34, 38.02, 54.36], "audiomae_on_audioset": [null, [["speech", 38.79], ["sidetone", 15.27], ["hum", 7.92]], null, null, [["whale vocalization", 29.55], ["hum", 15.38], ["music", 8.86]], null], "duration": [8.33, 8.68, 1.73, 2.63, 2.41, 2.01]} \ No newline at end of file diff --git a/annotations_filtered/vsevdTMBfC8_filtered.json b/annotations_filtered/vsevdTMBfC8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7688575bcb6bbc76e2f75532ac89f392ca31f5fe --- /dev/null +++ b/annotations_filtered/vsevdTMBfC8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 16.09], [18.0, 18.69], [19.0, 21.52], [23.0, 24.04], [25.0, 26.01], [38.0, 40.42], [41.0, 42.87], [44.0, 44.19], [46.0, 48.34]], "keep_status": [false, false, true, false, false, false, false, false, true], "silence_prob": [31.54, 0.0, 37.01, 0.0, 0.0, 92.8, 0.0, 0.0, 45.3], "audiomae_on_audioset": [[["speech", 71.34], ["thunk", 5.62], ["knock", 4.22]], null, [["coin (dropping)", 32.44], ["speech", 23.7], ["creak", 10.65]], null, null, null, null, null, [["speech", 44.69], ["sidetone", 12.8], ["sine wave", 11.0]]], "duration": [3.09, 0.69, 2.52, 1.04, 1.01, 2.42, 1.87, 0.19, 2.34]} \ No newline at end of file diff --git a/annotations_filtered/vsfjzfGZVyQ_filtered.json b/annotations_filtered/vsfjzfGZVyQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31031e4730892f7615fb94f741f8f1f757402c4d --- /dev/null +++ b/annotations_filtered/vsfjzfGZVyQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.74], [6.0, 10.56], [12.0, 12.87], [15.0, 15.55], [21.0, 22.86], [24.0, 25.25], [28.0, 29.2], [36.0, 40.63], [45.0, 45.81], [51.0, 51.88], [54.0, 54.95], [59.0, 63.19], [64.0, 67.19], [74.0, 75.57], [76.0, 78.9], [80.0, 80.72], [82.0, 82.97], [84.0, 84.55], [89.0, 89.56], [91.0, 92.13], [93.0, 95.22], [99.0, 100.57], [102.0, 106.61], [108.0, 108.78], [110.0, 111.38], [113.0, 114.4], [117.0, 120.21], [123.0, 129.68]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 45.33, 0.0, 0.0, 0.0, 0.0, 0.0, 54.36, 0.0, 0.0, 0.0, 81.71, 79.24, 0.0, 45.27, 0.0, 0.0, 0.0, 0.0, 0.0, 85.72, 0.0, 56.48, 0.0, 0.0, 0.0, 62.27, 65.79], "audiomae_on_audioset": [null, [["sidetone", 20.63], ["speech", 20.54], ["hum", 7.16]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 71.49], ["didgeridoo", 13.14], ["theremin", 4.33]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.74, 4.56, 0.87, 0.55, 1.86, 1.25, 1.2, 4.63, 0.81, 0.88, 0.95, 4.19, 3.19, 1.57, 2.9, 0.72, 0.97, 0.55, 0.56, 1.13, 2.22, 1.57, 4.61, 0.78, 1.38, 1.4, 3.21, 6.68]} \ No newline at end of file diff --git a/annotations_filtered/vt0hblIsHiY_filtered.json b/annotations_filtered/vt0hblIsHiY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5db427c778e75eb78bedca1e8c5bcf7916a05fb9 --- /dev/null +++ b/annotations_filtered/vt0hblIsHiY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 44.79], [46.0, 49.27], [50.0, 50.53], [57.0, 58.24], [59.0, 59.48], [65.0, 67.61], [69.0, 69.3], [70.0, 82.71], [116.0, 117.44], [122.0, 122.39], [126.0, 126.54], [129.0, 128.98], [143.0, 143.56], [144.0, 145.07]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.82, 33.97, 0.0, 0.0, 0.0, 32.31, 0.0, 33.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 51.55], ["music", 9.59], ["fart", 8.47]], [["music", 25.18], ["fly, housefly", 12.82], ["throbbing", 9.04]], null, null, null, [["music", 46.68], ["boing", 24.22], ["speech", 8.27]], null, [["music", 51.84], ["speech", 31.4], ["drum machine", 2.06]], null, null, null, null, null, null], "duration": [18.79, 3.27, 0.53, 1.24, 0.48, 2.61, 0.3, 12.71, 1.44, 0.39, 0.54, -0.02, 0.56, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/vtjCVRm2DAM_filtered.json b/annotations_filtered/vtjCVRm2DAM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4eba654833123737843d92e00625f623637625eb --- /dev/null +++ b/annotations_filtered/vtjCVRm2DAM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.87], [5.0, 7.06], [13.0, 12.82], [14.0, 14.74], [19.0, 20.17], [23.0, 24.38], [25.0, 27.35], [28.0, 27.82], [28.0, 30.54], [33.0, 58.58], [59.0, 65.82], [68.0, 70.61], [72.0, 74.76], [76.0, 77.35], [80.0, 88.84]], "keep_status": [false, false, false, false, false, false, true, false, false, true, true, false, false, false, true], "silence_prob": [0.0, 58.47, 0.0, 0.0, 0.0, 0.0, 43.0, 0.0, 67.38, 31.6, 35.63, 88.28, 82.79, 0.0, 37.61], "audiomae_on_audioset": [null, null, null, null, null, null, [["sidetone", 16.4], ["hum", 9.71], ["mains hum", 8.19]], null, null, [["music", 56.71], ["sound effect", 4.78], ["breaking", 4.29]], [["music", 43.29], ["throbbing", 11.77], ["hum", 9.37]], null, null, null, [["music", 44.56], ["throbbing", 7.23], ["hum", 6.81]]], "duration": [1.87, 2.06, -0.18, 0.74, 1.17, 1.38, 2.35, -0.18, 2.54, 25.58, 6.82, 2.61, 2.76, 1.35, 8.84]} \ No newline at end of file diff --git a/annotations_filtered/vtxPupFohQA_filtered.json b/annotations_filtered/vtxPupFohQA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..672b93830c6fcd11c9c27ae6b3e7e89663a11ff2 --- /dev/null +++ b/annotations_filtered/vtxPupFohQA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.1], [3.0, 3.72], [5.0, 6.59], [8.0, 13.76], [15.0, 15.16], [17.0, 17.78], [21.0, 23.3], [24.0, 25.08], [28.0, 27.82], [28.0, 27.85], [28.0, 28.12], [28.0, 30.91], [34.0, 34.59], [36.0, 35.94], [37.0, 77.03], [78.0, 104.13], [110.0, 123.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 68.67, 0.0, 0.0, 61.57, 0.0, 0.0, 0.0, 0.0, 30.61, 0.0, 0.0, 0.0, 32.28, 32.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["noise", 13.14], ["hum", 11.83], ["cacophony", 10.76]], null, null, null, [["music", 73.35], ["musical instrument", 3.41], ["throbbing", 2.96]], [["music", 72.17], ["musical instrument", 5.76], ["brass instrument", 2.04]]], "duration": [0.1, 0.72, 1.59, 5.76, 0.16, 0.78, 2.3, 1.08, -0.18, -0.15, 0.12, 2.91, 0.59, -0.06, 40.03, 26.13, 13.58]} \ No newline at end of file diff --git a/annotations_filtered/vtxo451I_Qk_filtered.json b/annotations_filtered/vtxo451I_Qk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ab53b42223544232eb0326a54066d3abbbc0e24 --- /dev/null +++ b/annotations_filtered/vtxo451I_Qk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 72.57], [73.0, 85.29], [85.0, 85.55]], "keep_status": [false, false, false], "silence_prob": [0.0, 30.35, 0.0], "audiomae_on_audioset": [null, [["music", 76.84], ["electronic music", 9.66], ["dubstep", 4.47]], null], "duration": [67.57, 12.29, 0.55]} \ No newline at end of file diff --git a/annotations_filtered/vtyIGp8uv8w_filtered.json b/annotations_filtered/vtyIGp8uv8w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f292770807bceaafb2c64f1ab55fbe1d63eb37f --- /dev/null +++ b/annotations_filtered/vtyIGp8uv8w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.59], [15.0, 16.04], [17.0, 17.63], [18.0, 26.97], [28.0, 28.32], [32.0, 49.55], [52.0, 52.86], [55.0, 55.22], [62.0, 61.77], [71.0, 74.66], [79.0, 87.69], [91.0, 95.25], [100.0, 105.46], [107.0, 109.38], [111.0, 116.88], [118.0, 129.05], [131.0, 131.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 59.51, 0.0, 52.45, 0.0, 0.0, 0.0, 52.56, 57.48, 58.98, 58.55, 45.98, 47.9, 47.74, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 29.6], ["music", 25.02], ["mains hum", 12.03]], [["music", 74.16], ["ambient music", 5.04], ["synthesizer", 2.92]], [["music", 82.01], ["ambient music", 6.46], ["hum", 0.99]], null], "duration": [1.59, 1.04, 0.63, 8.97, 0.32, 17.55, 0.86, 0.22, -0.23, 3.66, 8.69, 4.25, 5.46, 2.38, 5.88, 11.05, 0.4]} \ No newline at end of file diff --git a/annotations_filtered/vubylfvbMhk_filtered.json b/annotations_filtered/vubylfvbMhk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c949821bd2fec50aac22dd28bbf71c547178b297 --- /dev/null +++ b/annotations_filtered/vubylfvbMhk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.65], [24.0, 25.15], [30.0, 30.48], [40.0, 42.25], [53.0, 52.86], [53.0, 53.7], [74.0, 74.46], [77.0, 80.59], [82.0, 94.66], [110.0, 110.67], [112.0, 112.48], [113.0, 113.81]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [92.8, 0.0, 0.0, 87.55, 0.0, 0.0, 0.0, 44.6, 31.33, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 43.99], ["fly, housefly", 6.36], ["theremin", 4.57]], [["speech", 38.34], ["music", 15.49], ["boing", 10.49]], null, null, null], "duration": [2.65, 1.15, 0.48, 2.25, -0.14, 0.7, 0.46, 3.59, 12.66, 0.67, 0.48, 0.81]} \ No newline at end of file diff --git a/annotations_filtered/vuuTS_WNw5w_filtered.json b/annotations_filtered/vuuTS_WNw5w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..14e083293e33b33a24d2fb9c3ede0775f8cbd7a9 --- /dev/null +++ b/annotations_filtered/vuuTS_WNw5w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.84], [13.0, 13.95], [15.0, 15.87], [19.0, 19.7], [20.0, 20.9], [22.0, 22.86], [25.0, 25.79], [28.0, 27.9], [30.0, 37.69], [39.0, 40.69], [42.0, 46.94], [47.0, 48.44], [53.0, 53.54], [54.0, 54.3], [56.0, 59.19], [61.0, 60.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 0.0, 41.38, 0.0, 0.0, 0.0, 89.9, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["hum", 14.5], ["fly, housefly", 11.93], ["insect", 10.92]], null, null, null, null, null], "duration": [1.84, 0.95, 0.87, 0.7, 0.9, 0.86, 0.79, -0.1, 7.69, 1.69, 4.94, 1.44, 0.54, 0.3, 3.19, -0.19]} \ No newline at end of file diff --git a/annotations_filtered/vvBW4Szes1U_filtered.json b/annotations_filtered/vvBW4Szes1U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6511a13cf43d85684ca419ada207e1d21a73128c --- /dev/null +++ b/annotations_filtered/vvBW4Szes1U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.44], [3.0, 4.35], [6.0, 10.54], [11.0, 15.62], [18.0, 18.32], [19.0, 20.33], [21.0, 22.47], [23.0, 24.85], [26.0, 28.61], [29.0, 31.24], [32.0, 37.29], [38.0, 40.86], [42.0, 43.85], [45.0, 45.17], [46.0, 47.78], [49.0, 50.97], [52.0, 53.97], [55.0, 64.13], [66.0, 72.03], [73.0, 74.33], [75.0, 77.62], [78.0, 105.16], [106.0, 108.38], [109.0, 113.31], [115.0, 119.75], [120.0, 119.87], [122.0, 129.24], [131.0, 130.98]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, true, false, true, false], "silence_prob": [0.0, 0.0, 37.09, 42.69, 0.0, 0.0, 0.0, 0.0, 43.93, 69.61, 65.09, 66.63, 0.0, 0.0, 0.0, 0.0, 0.0, 50.91, 53.34, 0.0, 41.81, 34.74, 42.6, 44.69, 37.64, 0.0, 32.06, 0.0], "audiomae_on_audioset": [null, null, [["cough", 18.66], ["throat clearing", 16.77], ["music", 15.26]], [["speech", 48.93], ["music", 27.22], ["inside, small room", 2.96]], null, null, null, null, [["music", 36.7], ["hum", 13.84], ["speech", 12.62]], null, null, null, null, null, null, null, null, null, null, null, [["music", 39.87], ["crushing", 23.11], ["musical instrument", 2.54]], [["music", 59.2], ["hum", 8.43], ["keyboard (musical)", 3.74]], [["music", 50.15], ["musical instrument", 7.08], ["synthesizer", 3.67]], [["music", 65.65], ["didgeridoo", 7.98], ["musical instrument", 4.87]], [["music", 46.8], ["synthesizer", 11.1], ["theremin", 6.18]], null, [["music", 52.09], ["synthesizer", 6.68], ["musical instrument", 5.6]], null], "duration": [0.44, 1.35, 4.54, 4.62, 0.32, 1.33, 1.47, 1.85, 2.61, 2.24, 5.29, 2.86, 1.85, 0.17, 1.78, 1.97, 1.97, 9.13, 6.03, 1.33, 2.62, 27.16, 2.38, 4.31, 4.75, -0.13, 7.24, -0.02]} \ No newline at end of file diff --git a/annotations_filtered/vvDkLhvUa2o_filtered.json b/annotations_filtered/vvDkLhvUa2o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..faccffa260647fd48cccd9a1951a8c01b733f176 --- /dev/null +++ b/annotations_filtered/vvDkLhvUa2o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 33.3], [34.0, 45.62], [49.0, 50.46]], "keep_status": [false, true, false], "silence_prob": [0.0, 30.16, 0.0], "audiomae_on_audioset": [null, [["buzz", 38.12], ["speech", 9.46], ["hum", 5.88]], null], "duration": [1.3, 11.62, 1.46]} \ No newline at end of file diff --git a/annotations_filtered/vw1dPsf0JgE_filtered.json b/annotations_filtered/vw1dPsf0JgE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60f3b7ba132ea22b1ab59c5b3f9ef04e8c2cab9f --- /dev/null +++ b/annotations_filtered/vw1dPsf0JgE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.4], [4.0, 5.43], [6.0, 8.5], [13.0, 17.98], [19.0, 18.89], [20.0, 21.64], [26.0, 28.36], [45.0, 46.68], [48.0, 53.35], [56.0, 60.18], [60.0, 63.39], [64.0, 70.95], [74.0, 82.59], [84.0, 85.18], [87.0, 98.34], [99.0, 101.07], [106.0, 107.7], [108.0, 112.75]], "keep_status": [false, false, false, false, false, false, true, false, true, true, true, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 64.41, 57.97, 0.0, 0.0, 30.0, 0.0, 43.13, 46.68, 38.93, 44.66, 55.67, 0.0, 37.51, 39.96, 0.0, 52.39], "audiomae_on_audioset": [null, null, null, null, null, null, [["whack, thwack", 20.6], ["music", 14.33], ["speech", 9.42]], null, [["hum", 34.94], ["speech", 15.26], ["mains hum", 13.17]], [["whale vocalization", 29.22], ["sidetone", 28.87], ["stomach rumble", 8.89]], [["frog", 20.91], ["croak", 13.74], ["hum", 10.51]], [["speech", 31.27], ["radio", 14.17], ["rumble", 9.67]], null, null, [["speech", 62.12], ["hum", 5.81], ["knock", 3.68]], [["fly, housefly", 39.15], ["mosquito", 17.85], ["insect", 10.62]], null, null], "duration": [0.4, 1.43, 2.5, 4.98, -0.11, 1.64, 2.36, 1.68, 5.35, 4.18, 3.39, 6.95, 8.59, 1.18, 11.34, 2.07, 1.7, 4.75]} \ No newline at end of file diff --git a/annotations_filtered/vw44oj_STSw_filtered.json b/annotations_filtered/vw44oj_STSw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8b7748abea6094981f477224b274c66b6441d6d --- /dev/null +++ b/annotations_filtered/vw44oj_STSw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.34], [29.0, 29.67], [35.0, 35.02], [35.0, 35.24], [36.0, 36.56], [43.0, 43.61], [50.0, 51.19], [69.0, 69.9], [70.0, 70.28], [70.0, 71.0], [72.0, 72.76], [78.0, 78.9], [80.0, 80.72], [85.0, 85.23], [96.0, 97.06], [98.0, 98.54], [100.0, 100.8], [112.0, 112.85], [114.0, 114.54], [118.0, 118.23], [130.0, 131.08], [135.0, 137.34], [138.0, 138.43], [140.0, 141.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.73, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.34, 0.67, 0.02, 0.24, 0.56, 0.61, 1.19, 0.9, 0.28, 1.0, 0.76, 0.9, 0.72, 0.23, 1.06, 0.54, 0.8, 0.85, 0.54, 0.23, 1.08, 2.34, 0.43, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/vwbryjr2BKg_filtered.json b/annotations_filtered/vwbryjr2BKg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ba5ced131f433748e7bc8930877d68bf5283bf7 --- /dev/null +++ b/annotations_filtered/vwbryjr2BKg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.65], [7.0, 7.2], [10.0, 11.33], [16.0, 16.75], [18.0, 19.5], [23.0, 24.09], [43.0, 44.56], [52.0, 52.88], [53.0, 53.43], [54.0, 54.87], [58.0, 59.19], [60.0, 61.37], [62.0, 67.31], [68.0, 71.36], [74.0, 74.11], [76.0, 77.41], [78.0, 78.95], [80.0, 97.65], [99.0, 99.5], [101.0, 102.83], [105.0, 106.71], [109.0, 109.97], [112.0, 112.78], [115.0, 116.6], [120.0, 119.75], [126.0, 128.51], [129.0, 135.31], [136.0, 137.79], [138.0, 144.42], [145.0, 149.08], [151.0, 150.8], [152.0, 153.37], [154.0, 154.53], [155.0, 158.8], [161.0, 163.04], [164.0, 164.4], [166.0, 167.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.44, 99.71, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 98.73, 0.0, 95.09, 98.36, 0.0, 0.0, 0.0, 91.13, 73.67, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.65, 0.2, 1.33, 0.75, 1.5, 1.09, 1.56, 0.88, 0.43, 0.87, 1.19, 1.37, 5.31, 3.36, 0.11, 1.41, 0.95, 17.65, 0.5, 1.83, 1.71, 0.97, 0.78, 1.6, -0.25, 2.51, 6.31, 1.79, 6.42, 4.08, -0.2, 1.37, 0.53, 3.8, 2.04, 0.4, 1.39]} \ No newline at end of file diff --git a/annotations_filtered/vxFr0xNspFU_filtered.json b/annotations_filtered/vxFr0xNspFU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a2e18c5324c14ea52e75efc134fe49c89efe7896 --- /dev/null +++ b/annotations_filtered/vxFr0xNspFU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.13], [13.0, 22.23], [24.0, 30.64], [31.0, 32.88], [38.0, 39.04], [41.0, 42.69], [43.0, 44.88], [45.0, 50.84]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [45.4, 33.6, 46.19, 0.0, 0.0, 0.0, 0.0, 38.58], "audiomae_on_audioset": [[["music", 47.65], ["squish", 13.02], ["whale vocalization", 9.64]], [["music", 79.41], ["breaking", 5.05], ["buzz", 2.41]], [["music", 56.03], ["whale vocalization", 17.5], ["pour", 3.35]], null, null, null, null, [["music", 50.6], ["whale vocalization", 15.19], ["speech", 7.6]]], "duration": [2.13, 9.23, 6.64, 1.88, 1.04, 1.69, 1.88, 5.84]} \ No newline at end of file diff --git a/annotations_filtered/vyMggFe9WRQ_filtered.json b/annotations_filtered/vyMggFe9WRQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7cd3dda7601c7b740d7fad7f7305996b3e45c49 --- /dev/null +++ b/annotations_filtered/vyMggFe9WRQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.38], [5.0, 5.98], [10.0, 10.99], [13.0, 15.9], [20.0, 20.31], [22.0, 22.3], [23.0, 23.75], [27.0, 28.8], [29.0, 30.74], [34.0, 35.43], [38.0, 40.64], [42.0, 45.17], [46.0, 46.67], [48.0, 49.65], [54.0, 54.51], [56.0, 56.4], [65.0, 68.28], [70.0, 74.41], [75.0, 75.63], [78.0, 79.91], [80.0, 83.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 63.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.67, 52.51, 0.0, 0.0, 0.0, 0.0, 66.03, 66.03, 0.0, 0.0, 42.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 32.11], ["sine wave", 18.09], ["chirp tone", 17.14]]], "duration": [1.38, 0.98, 0.99, 2.9, 0.31, 0.3, 0.75, 1.8, 1.74, 1.43, 2.64, 3.17, 0.67, 1.65, 0.51, 0.4, 3.28, 4.41, 0.63, 1.91, 3.98]} \ No newline at end of file diff --git a/annotations_filtered/vyN2oD5tI80_filtered.json b/annotations_filtered/vyN2oD5tI80_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0547b9c6a716ea39d907bc5628109e91a77d296 --- /dev/null +++ b/annotations_filtered/vyN2oD5tI80_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.38], [13.0, 14.15], [14.0, 19.55], [26.0, 26.55], [31.0, 31.83], [33.0, 33.84], [41.0, 41.64], [65.0, 65.92], [68.0, 68.86], [73.0, 74.19], [84.0, 89.53], [90.0, 89.78], [90.0, 89.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 31.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.64, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 78.76], ["hum", 4.07], ["mains hum", 3.59]], null, null, null, null, null, null, null, [["music", 31.8], ["speech", 30.88], ["cowbell", 6.35]], null, null], "duration": [0.38, 1.15, 5.55, 0.55, 0.83, 0.84, 0.64, 0.92, 0.86, 1.19, 5.53, -0.22, -0.1]} \ No newline at end of file diff --git a/annotations_filtered/vyb2Imfghkg_filtered.json b/annotations_filtered/vyb2Imfghkg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..517cd324e6771a759e1fe189a8541ac1f40e5e90 --- /dev/null +++ b/annotations_filtered/vyb2Imfghkg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.52], [11.0, 15.28], [16.0, 17.15], [17.0, 24.73], [27.0, 29.44], [37.0, 42.48], [43.0, 48.96], [54.0, 54.51], [57.0, 57.57], [60.0, 60.34], [62.0, 62.73], [71.0, 71.85], [75.0, 82.36], [87.0, 87.74], [91.0, 91.27], [92.0, 93.34], [94.0, 94.71], [97.0, 98.74], [101.0, 100.97], [102.0, 103.06], [104.0, 104.33], [106.0, 106.91], [109.0, 109.43], [119.0, 119.18], [126.0, 130.18], [131.0, 132.22], [134.0, 133.62], [136.0, 138.47], [140.0, 142.92], [145.0, 146.16], [151.0, 154.4], [155.0, 156.49], [157.0, 157.0], [159.0, 160.98], [169.0, 173.01]], "keep_status": [true, true, false, false, true, true, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, true], "silence_prob": [46.75, 43.2, 0.0, 32.05, 37.09, 42.81, 31.82, 0.0, 0.0, 0.0, 0.0, 0.0, 37.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.65, 0.0, 0.0, 74.92, 49.68, 0.0, 46.79, 0.0, 0.0, 0.0, 42.67], "audiomae_on_audioset": [[["music", 42.79], ["speech", 4.9], ["animal", 4.44]], [["music", 55.19], ["glockenspiel", 4.22], ["speech", 4.02]], null, [["music", 69.27], ["speech", 7.18], ["theremin", 4.52]], [["music", 35.64], ["speech", 12.22], ["foghorn", 9.16]], [["music", 27.16], ["speech", 6.64], ["brass instrument", 6.14]], [["music", 30.44], ["speech", 25.71], ["foghorn", 8.69]], null, null, null, null, null, [["music", 53.23], ["synthesizer", 10.58], ["musical instrument", 3.88]], null, null, null, null, null, null, null, null, null, null, null, [["music", 57.76], ["theremin", 5.93], ["synthesizer", 4.04]], null, null, null, [["mosquito", 32.52], ["fly, housefly", 12.23], ["music", 7.9]], null, [["music", 35.95], ["speech", 7.54], ["didgeridoo", 5.64]], null, null, null, [["music", 34.08], ["mains hum", 13.89], ["hum", 10.44]]], "duration": [2.52, 4.28, 1.15, 7.73, 2.44, 5.48, 5.96, 0.51, 0.57, 0.34, 0.73, 0.85, 7.36, 0.74, 0.27, 1.34, 0.71, 1.74, -0.03, 1.06, 0.33, 0.91, 0.43, 0.18, 4.18, 1.22, -0.38, 2.47, 2.92, 1.16, 3.4, 1.49, 0.0, 1.98, 4.01]} \ No newline at end of file diff --git a/annotations_filtered/vykvU-52g6w_filtered.json b/annotations_filtered/vykvU-52g6w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19e2147540c665fd81351241ba10979ef9bfd3aa --- /dev/null +++ b/annotations_filtered/vykvU-52g6w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.05], [3.0, 6.67], [9.0, 11.13], [23.0, 22.96], [25.0, 25.14], [28.0, 27.89], [38.0, 39.45], [45.0, 48.24], [51.0, 51.14], [54.0, 56.1], [57.0, 57.35], [60.0, 60.3], [62.0, 63.14], [70.0, 70.44], [73.0, 73.33], [77.0, 80.08], [83.0, 83.46], [86.0, 128.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 84.07, 99.95, 0.0, 0.0, 0.0, 0.0, 56.1, 0.0, 64.41, 0.0, 0.0, 0.0, 0.0, 0.0, 39.31, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["effects unit", 15.33], ["noise", 13.98], ["music", 9.44]], null, null], "duration": [0.05, 3.67, 2.13, -0.04, 0.14, -0.11, 1.45, 3.24, 0.14, 2.1, 0.35, 0.3, 1.14, 0.44, 0.33, 3.08, 0.46, 42.65]} \ No newline at end of file diff --git a/annotations_filtered/vz2RAznAy9Q_filtered.json b/annotations_filtered/vz2RAznAy9Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c92f7ea259b2f99f8efbfc7f7b8c16428f05e567 --- /dev/null +++ b/annotations_filtered/vz2RAznAy9Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 15.01], [21.0, 22.15], [23.0, 23.77], [27.0, 30.42], [32.0, 35.68], [38.0, 39.21], [44.0, 44.47], [49.0, 49.74], [53.0, 54.03], [56.0, 56.84], [59.0, 61.08], [63.0, 64.64], [69.0, 69.99], [73.0, 74.87], [75.0, 78.93], [80.0, 80.76], [81.0, 82.49], [83.0, 83.24], [84.0, 87.49], [89.0, 90.24], [91.0, 94.31], [95.0, 99.52], [101.0, 101.16], [102.0, 103.99], [112.0, 113.56], [120.0, 121.44], [122.0, 124.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.71, 0.0, 0.0, 99.84, 95.91, 0.0, 0.0, 0.0, 0.0, 0.0, 73.21, 0.0, 0.0, 0.0, 98.73, 0.0, 0.0, 0.0, 98.73, 0.0, 55.18, 80.46, 0.0, 0.0, 0.0, 0.0, 52.16], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.01, 1.15, 0.77, 3.42, 3.68, 1.21, 0.47, 0.74, 1.03, 0.84, 2.08, 1.64, 0.99, 1.87, 3.93, 0.76, 1.49, 0.24, 3.49, 1.24, 3.31, 4.52, 0.16, 1.99, 1.56, 1.44, 2.06]} \ No newline at end of file diff --git a/annotations_filtered/vzt7Yb_-yiY_filtered.json b/annotations_filtered/vzt7Yb_-yiY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b6601d0427286ac00aafd612fb499bcdd323017 --- /dev/null +++ b/annotations_filtered/vzt7Yb_-yiY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.04], [20.0, 19.85], [20.0, 20.31], [22.0, 24.33], [25.0, 25.52], [27.0, 27.63], [28.0, 29.54], [32.0, 33.59], [35.0, 41.35], [43.0, 42.87], [44.0, 44.32], [47.0, 48.24], [49.0, 49.4], [54.0, 56.84], [58.0, 59.31], [66.0, 74.82], [78.0, 80.94], [82.0, 99.87], [101.0, 107.3], [107.0, 124.02], [125.0, 125.47], [126.0, 126.77], [127.0, 129.1]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.24, 0.0, 0.0, 0.0, 0.0, 75.88, 0.0, 0.0, 0.0, 0.0, 41.72, 0.0, 45.88, 37.91, 36.24, 38.8, 39.6, 0.0, 0.0, 54.9], "audiomae_on_audioset": [null, null, null, [["speech", 43.88], ["fart", 9.91], ["hum", 4.39]], null, null, null, null, null, null, null, null, null, [["speech", 11.48], ["mains hum", 5.96], ["buzz", 5.3]], null, [["fly, housefly", 27.14], ["hum", 19.81], ["insect", 10.68]], [["hum", 16.55], ["throbbing", 9.51], ["music", 7.38]], [["music", 49.73], ["hum", 14.02], ["ambient music", 6.59]], [["hum", 37.49], ["throbbing", 31.86], ["mains hum", 19.89]], [["hum", 28.41], ["music", 25.44], ["speech", 11.24]], null, null, null], "duration": [1.04, -0.15, 0.31, 2.33, 0.52, 0.63, 1.54, 1.59, 6.35, -0.13, 0.32, 1.24, 0.4, 2.84, 1.31, 8.82, 2.94, 17.87, 6.3, 17.02, 0.47, 0.77, 2.1]} \ No newline at end of file diff --git a/annotations_filtered/vzzuOkCkHlQ_filtered.json b/annotations_filtered/vzzuOkCkHlQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65c6a6406a0bbfac54e5a89b899f197bfb717f59 --- /dev/null +++ b/annotations_filtered/vzzuOkCkHlQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.92], [9.0, 10.0], [11.0, 11.72], [13.0, 13.9], [15.0, 16.78], [18.0, 18.72], [21.0, 22.37], [23.0, 38.08], [40.0, 40.14], [49.0, 49.94], [61.0, 74.26], [81.0, 82.14], [83.0, 83.54], [86.0, 86.27]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.28, 0.0, 0.0, 36.53, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["insect", 12.22], ["fly, housefly", 11.09], ["wild animals", 10.65]], null, null, [["music", 37.08], ["speech", 25.07], ["ice cream truck, ice cream van", 12.24]], null, null, null], "duration": [-0.08, 1.0, 0.72, 0.9, 1.78, 0.72, 1.37, 15.08, 0.14, 0.94, 13.26, 1.14, 0.54, 0.27]} \ No newline at end of file diff --git a/annotations_filtered/w-6lVMklaKY_filtered.json b/annotations_filtered/w-6lVMklaKY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7d437dc150cc64a07e68ce943fe6c90892a8cc5 --- /dev/null +++ b/annotations_filtered/w-6lVMklaKY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 61.23], [61.0, 63.81], [64.0, 65.08], [69.0, 69.3], [72.0, 73.14], [79.0, 89.94], [91.0, 91.57], [94.0, 95.05], [96.0, 100.72], [102.0, 107.89], [109.0, 109.49], [111.0, 114.57], [118.0, 117.95], [119.0, 123.18], [127.0, 130.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.94, 41.93, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 99.99, 0.0, 100.0, 0.0, 100.0, 100.0], "audiomae_on_audioset": [[["hum", 54.71], ["mains hum", 18.63], ["throbbing", 17.3]], [["speech", 71.15], ["sidetone", 8.02], ["music", 3.84]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [20.23, 2.81, 1.08, 0.3, 1.14, 10.94, 0.57, 1.05, 4.72, 5.89, 0.49, 3.57, -0.05, 4.18, 3.06]} \ No newline at end of file diff --git a/annotations_filtered/w-A750XbFAo_filtered.json b/annotations_filtered/w-A750XbFAo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8cf02872c7dca1a4073d77dfab1b99311e7c6fca --- /dev/null +++ b/annotations_filtered/w-A750XbFAo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[63.0, 68.69], [69.0, 71.27], [71.0, 74.9], [75.0, 100.36], [102.0, 141.96], [142.0, 149.08]], "keep_status": [false, false, false, false, false, false], "silence_prob": [73.82, 88.64, 68.15, 45.18, 0.0, 91.98], "audiomae_on_audioset": [null, null, null, [["music", 64.27], ["fly, housefly", 6.82], ["mosquito", 3.33]], null, null], "duration": [5.69, 2.27, 3.9, 25.36, 39.96, 7.08]} \ No newline at end of file diff --git a/annotations_filtered/w-DFg1aS_2E_filtered.json b/annotations_filtered/w-DFg1aS_2E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7573fac88b96752a5a7b8316cb2068c474f95c5 --- /dev/null +++ b/annotations_filtered/w-DFg1aS_2E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.31], [2.0, 2.47], [5.0, 5.44], [19.0, 18.77], [19.0, 19.53], [25.0, 25.2], [33.0, 33.29], [34.0, 34.48], [35.0, 34.96], [44.0, 44.36], [44.0, 44.79], [47.0, 48.64], [58.0, 59.8], [61.0, 61.72], [62.0, 64.56], [65.0, 66.6], [77.0, 78.22], [84.0, 84.57], [85.0, 85.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.97, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.73], ["speech", 17.7], ["musical instrument", 5.89]], null, null, null, null], "duration": [1.31, 0.47, 0.44, -0.23, 0.53, 0.2, 0.29, 0.48, -0.04, 0.36, 0.79, 1.64, 1.8, 0.72, 2.56, 1.6, 1.22, 0.57, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/w0AliJi4npk_filtered.json b/annotations_filtered/w0AliJi4npk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b4e5a8ae750d353ec03ccd4b695933138aa96a1 --- /dev/null +++ b/annotations_filtered/w0AliJi4npk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 44.14], [49.0, 58.19]], "keep_status": [false, false], "silence_prob": [31.36, 28.98], "audiomae_on_audioset": [[["music", 77.77], ["musical instrument", 2.13], ["hum", 1.61]], [["music", 74.1], ["drum machine", 4.91], ["singing", 2.0]]], "duration": [21.14, 9.19]} \ No newline at end of file diff --git a/annotations_filtered/w0BK_hLT-Wo_filtered.json b/annotations_filtered/w0BK_hLT-Wo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6791dc1e5ad5962e4bcff3e9c408667f15b6076 --- /dev/null +++ b/annotations_filtered/w0BK_hLT-Wo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.85], [20.0, 20.41], [20.0, 20.44], [20.0, 20.48], [20.0, 29.0], [29.0, 34.42], [35.0, 38.7], [41.0, 44.42], [45.0, 50.08], [52.0, 58.06], [59.0, 71.12], [73.0, 89.24], [95.0, 109.98], [111.0, 127.31]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.59, 30.21, 29.85, 30.24, 29.35, 29.18, 29.55, 29.15, 30.18, 29.6], "audiomae_on_audioset": [null, null, null, null, [["music", 33.85], ["throbbing", 21.86], ["speech", 17.8]], [["music", 45.27], ["speech", 29.21], ["cacophony", 9.11]], [["speech", 50.22], ["vehicle", 8.93], ["music", 4.2]], [["music", 66.11], ["cacophony", 3.61], ["electronic music", 3.53]], [["music", 68.76], ["throbbing", 4.57], ["hum", 2.86]], [["hum", 26.16], ["music", 20.24], ["mains hum", 13.83]], [["hum", 34.13], ["mains hum", 27.94], ["throbbing", 23.33]], [["music", 31.52], ["speech", 12.03], ["cacophony", 6.65]], [["music", 74.71], ["throbbing", 4.14], ["cacophony", 3.92]], [["music", 31.74], ["electric shaver, electric razor", 14.22], ["hum", 8.39]]], "duration": [0.85, 0.41, 0.44, 0.48, 9.0, 5.42, 3.7, 3.42, 5.08, 6.06, 12.12, 16.24, 14.98, 16.31]} \ No newline at end of file diff --git a/annotations_filtered/w0NWPKGGFiY_filtered.json b/annotations_filtered/w0NWPKGGFiY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aaf6749812e83bfb36bce2b73bc73d1060f50bf5 --- /dev/null +++ b/annotations_filtered/w0NWPKGGFiY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.99], [9.0, 9.44], [12.0, 14.84], [19.0, 20.6], [27.0, 27.62], [29.0, 30.37], [31.0, 32.51], [38.0, 39.04], [40.0, 40.12], [43.0, 45.4], [47.0, 47.21], [48.0, 49.08], [52.0, 53.33], [54.0, 55.44], [60.0, 63.73], [66.0, 66.6], [70.0, 72.45], [76.0, 76.84], [78.0, 79.68], [82.0, 82.32], [84.0, 84.84], [92.0, 92.04], [95.0, 96.38], [98.0, 98.39], [99.0, 99.47], [102.0, 103.91], [106.0, 107.05], [109.0, 113.97], [115.0, 116.14], [118.0, 118.32], [121.0, 121.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.68, 0.0, 0.0, 0.0, 0.0, 87.74, 0.0, 99.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.54, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.99, 0.44, 2.84, 1.6, 0.62, 1.37, 1.51, 1.04, 0.12, 2.4, 0.21, 1.08, 1.33, 1.44, 3.73, 0.6, 2.45, 0.84, 1.68, 0.32, 0.84, 0.04, 1.38, 0.39, 0.47, 1.91, 1.05, 4.97, 1.14, 0.32, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/w0X84fml-Bc_filtered.json b/annotations_filtered/w0X84fml-Bc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26026a66946e99977a1c1022d57736a6fbda6daa --- /dev/null +++ b/annotations_filtered/w0X84fml-Bc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 36.31], [37.0, 69.06], [70.0, 69.96], [72.0, 107.37], [108.0, 111.57], [113.0, 114.34]], "keep_status": [false, false, false, false, false, false], "silence_prob": [98.73, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [5.31, 32.06, -0.04, 35.37, 3.57, 1.34]} \ No newline at end of file diff --git a/annotations_filtered/w0Z44BIDPPc_filtered.json b/annotations_filtered/w0Z44BIDPPc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da716763a62e9df10579b56d3f1579f16fe816e8 --- /dev/null +++ b/annotations_filtered/w0Z44BIDPPc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 29.69], [31.0, 32.95], [35.0, 41.91], [43.0, 53.64], [57.0, 81.73], [83.0, 112.82], [115.0, 117.17], [123.0, 124.11]], "keep_status": [true, false, false, false, false, true, false, false], "silence_prob": [34.65, 0.0, 50.31, 43.15, 36.87, 30.82, 51.66, 0.0], "audiomae_on_audioset": [[["music", 19.33], ["hum", 18.01], ["synthesizer", 12.54]], null, null, [["hum", 52.86], ["throbbing", 20.75], ["mains hum", 8.88]], [["hum", 34.7], ["music", 22.54], ["throbbing", 13.09]], [["music", 47.17], ["hum", 7.97], ["harmonic", 6.67]], null, null], "duration": [26.69, 1.95, 6.91, 10.64, 24.73, 29.82, 2.17, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/w0cXyGVsUjs_filtered.json b/annotations_filtered/w0cXyGVsUjs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84890bbe52b34e260f68d1898cde158f91ed8b13 --- /dev/null +++ b/annotations_filtered/w0cXyGVsUjs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.01], [13.0, 13.74], [14.0, 17.64], [20.0, 24.41], [31.0, 31.51], [37.0, 38.18], [39.0, 40.26], [41.0, 42.87], [47.0, 52.42], [54.0, 56.03], [58.0, 58.7], [61.0, 60.93], [66.0, 70.38], [72.0, 73.43], [74.0, 76.4], [79.0, 83.25], [84.0, 85.21], [86.0, 87.79], [90.0, 92.45], [94.0, 95.44], [97.0, 98.68], [101.0, 100.75], [102.0, 104.95], [114.0, 118.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [34.94, 0.0, 32.98, 35.86, 0.0, 0.0, 0.0, 0.0, 37.25, 50.66, 0.0, 0.0, 34.02, 0.0, 38.04, 34.57, 0.0, 0.0, 42.0, 0.0, 0.0, 0.0, 32.83, 30.29], "audiomae_on_audioset": [[["music", 59.81], ["theremin", 23.16], ["musical instrument", 3.51]], null, [["theremin", 92.33], ["music", 4.57], ["musical instrument", 0.53]], [["theremin", 70.03], ["music", 18.08], ["musical instrument", 2.79]], null, null, null, null, [["theremin", 54.98], ["music", 22.49], ["synthesizer", 2.96]], null, null, null, [["theremin", 72.73], ["music", 13.37], ["speech", 3.49]], null, [["foghorn", 56.93], ["music", 14.38], ["speech", 8.34]], [["foghorn", 53.04], ["music", 13.88], ["speech", 11.94]], null, null, [["theremin", 94.45], ["music", 4.17], ["musical instrument", 0.36]], null, null, null, [["music", 37.82], ["speech", 11.75], ["didgeridoo", 4.54]], [["music", 44.18], ["mains hum", 14.42], ["hum", 10.66]]], "duration": [5.01, 0.74, 3.64, 4.41, 0.51, 1.18, 1.26, 1.87, 5.42, 2.03, 0.7, -0.07, 4.38, 1.43, 2.4, 4.25, 1.21, 1.79, 2.45, 1.44, 1.68, -0.25, 2.95, 4.91]} \ No newline at end of file diff --git a/annotations_filtered/w0l1ukaxeBg_filtered.json b/annotations_filtered/w0l1ukaxeBg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65ccab117fae9d4d7f12bdfde285e280e28bd9c8 --- /dev/null +++ b/annotations_filtered/w0l1ukaxeBg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.05], [5.0, 5.97], [10.0, 10.4], [12.0, 12.53], [15.0, 16.98], [24.0, 25.05], [27.0, 28.59], [35.0, 35.23], [37.0, 37.23], [38.0, 39.43], [42.0, 42.92], [44.0, 44.81], [46.0, 47.43], [48.0, 65.75], [85.0, 85.87], [98.0, 108.21], [109.0, 109.53], [113.0, 130.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.47, 0.0, 34.15, 0.0, 34.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["radio", 8.29], ["hum", 5.05], ["noise", 4.86]], null, [["speech", 73.96], ["radio", 6.7], ["horse", 4.47]], null, [["speech", 62.1], ["vehicle", 9.48], ["car", 6.46]]], "duration": [1.05, 0.97, 0.4, 0.53, 1.98, 1.05, 1.59, 0.23, 0.23, 1.43, 0.92, 0.81, 1.43, 17.75, 0.87, 10.21, 0.53, 17.06]} \ No newline at end of file diff --git a/annotations_filtered/w0qfQaJtF2E_filtered.json b/annotations_filtered/w0qfQaJtF2E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1e77e59f2898dff492399ea760fa11f0d7e1aa9 --- /dev/null +++ b/annotations_filtered/w0qfQaJtF2E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 55.21], [58.0, 69.79], [72.0, 97.61], [99.0, 113.66], [117.0, 130.57], [134.0, 140.9]], "keep_status": [false, true, false, true, false, false], "silence_prob": [31.55, 30.09, 37.24, 35.24, 34.3, 34.27], "audiomae_on_audioset": [[["music", 71.07], ["scary music", 6.23], ["hum", 3.79]], [["music", 37.03], ["speech", 14.29], ["thump, thud", 13.52]], [["music", 53.39], ["hum", 18.8], ["mains hum", 4.92]], [["music", 30.61], ["hum", 26.84], ["mains hum", 11.86]], [["music", 66.17], ["speech", 12.47], ["electronic music", 3.98]], [["music", 48.52], ["hum", 15.07], ["mains hum", 9.42]]], "duration": [21.21, 11.79, 25.61, 14.66, 13.57, 6.9]} \ No newline at end of file diff --git a/annotations_filtered/w13ky72PcKI_filtered.json b/annotations_filtered/w13ky72PcKI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9447b0ce4b0317cbbb2ae4812784fc8948332206 --- /dev/null +++ b/annotations_filtered/w13ky72PcKI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.78], [10.0, 11.11], [12.0, 13.58], [14.0, 18.59], [25.0, 26.0], [30.0, 31.48], [38.0, 50.63], [53.0, 56.25], [58.0, 82.17], [83.0, 91.08], [93.0, 98.44], [101.0, 104.04]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.64, 0.0, 0.0, 36.22, 47.31, 36.75, 59.42, 46.47, 44.43], "audiomae_on_audioset": [null, null, null, [["mains hum", 23.36], ["hum", 18.76], ["music", 16.12]], null, null, [["music", 67.04], ["speech", 15.4], ["hum", 2.83]], [["hum", 30.49], ["music", 26.61], ["mains hum", 6.26]], [["music", 36.75], ["speech", 26.98], ["hum", 6.72]], null, [["hum", 43.0], ["mains hum", 14.93], ["throbbing", 12.71]], [["whale vocalization", 34.32], ["hum", 23.25], ["mains hum", 14.65]]], "duration": [1.78, 1.11, 1.58, 4.59, 1.0, 1.48, 12.63, 3.25, 24.17, 8.08, 5.44, 3.04]} \ No newline at end of file diff --git a/annotations_filtered/w1pIFZb7480_filtered.json b/annotations_filtered/w1pIFZb7480_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b237bf7296fdbb3e692be12f788daad5723e0566 --- /dev/null +++ b/annotations_filtered/w1pIFZb7480_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.75], [5.0, 5.71], [7.0, 8.24], [9.0, 9.75], [11.0, 11.57], [16.0, 61.1]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.75, 0.71, 1.24, 0.75, 0.57, 45.1]} \ No newline at end of file diff --git a/annotations_filtered/w29PG-8Tywo_filtered.json b/annotations_filtered/w29PG-8Tywo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd102296686b277c5269217feec8c096a31abdf8 --- /dev/null +++ b/annotations_filtered/w29PG-8Tywo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.29], [5.0, 5.81], [7.0, 10.4], [11.0, 12.31], [15.0, 17.15], [24.0, 24.68], [25.0, 24.76], [25.0, 25.69], [31.0, 31.68], [34.0, 34.74], [45.0, 47.24], [50.0, 54.13], [70.0, 71.31], [78.0, 80.37], [80.0, 80.5], [81.0, 81.6], [88.0, 90.1], [91.0, 93.09], [99.0, 103.32], [107.0, 135.65], [137.0, 137.56], [138.0, 139.11], [140.0, 141.49], [142.0, 142.28], [143.0, 143.07], [147.0, 147.19], [176.0, 176.03]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 44.6, 0.0, 66.51, 0.0, 0.0, 0.0, 0.0, 0.0, 99.62, 40.59, 0.0, 45.11, 0.0, 0.0, 38.41, 38.09, 32.33, 30.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 29.22], ["stomach rumble", 15.48], ["music", 6.95]], null, null, null, null, null, null, null, null, [["thunk", 71.42], ["music", 2.22], ["effects unit", 1.7]], null, [["speech", 19.04], ["fly, housefly", 9.01], ["music", 7.87]], null, null, [["hum", 4.89], ["civil defense siren", 4.05], ["music", 3.2]], [["music", 59.96], ["synthesizer", 12.36], ["cacophony", 6.73]], [["music", 39.37], ["speech", 13.85], ["sidetone", 7.44]], [["speech", 35.37], ["music", 23.3], ["skidding", 6.46]], null, null, null, null, null, null, null], "duration": [0.29, 0.81, 3.4, 1.31, 2.15, 0.68, -0.24, 0.69, 0.68, 0.74, 2.24, 4.13, 1.31, 2.37, 0.5, 0.6, 2.1, 2.09, 4.32, 28.65, 0.56, 1.11, 1.49, 0.28, 0.07, 0.19, 0.03]} \ No newline at end of file diff --git a/annotations_filtered/w2XWa1XuKSI_filtered.json b/annotations_filtered/w2XWa1XuKSI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9177fa8a7fd0ac412ad0eacd28ce09b495b57bf7 --- /dev/null +++ b/annotations_filtered/w2XWa1XuKSI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.42], [12.0, 13.12], [17.0, 19.2], [22.0, 23.36], [24.0, 25.22], [28.0, 28.71], [34.0, 34.65], [46.0, 46.5], [55.0, 55.93], [62.0, 61.99], [69.0, 76.77], [78.0, 86.21], [87.0, 110.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [99.1, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.04, 63.31, 41.72], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["hum", 21.03], ["mains hum", 15.79], ["buzz", 14.97]], null, [["music", 44.62], ["throbbing", 9.43], ["heart sounds, heartbeat", 6.78]]], "duration": [6.42, 1.12, 2.2, 1.36, 1.22, 0.71, 0.65, 0.5, 0.93, -0.01, 7.77, 8.21, 23.2]} \ No newline at end of file diff --git a/annotations_filtered/w3-V_82VwQQ_filtered.json b/annotations_filtered/w3-V_82VwQQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9704eef2b331b4198b7850e47dcc802447f627f6 --- /dev/null +++ b/annotations_filtered/w3-V_82VwQQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.9], [3.0, 2.94], [5.0, 5.7], [7.0, 7.82], [10.0, 13.53], [17.0, 19.01], [24.0, 24.12], [44.0, 44.78], [49.0, 49.38], [58.0, 58.51], [60.0, 61.01], [63.0, 63.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 58.89, 81.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.9, -0.06, 0.7, 0.82, 3.53, 2.01, 0.12, 0.78, 0.38, 0.51, 1.01, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/w3-djlpw4iw_filtered.json b/annotations_filtered/w3-djlpw4iw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/w3-djlpw4iw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/w3HklXic1eY_filtered.json b/annotations_filtered/w3HklXic1eY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f04154fdc065af26196cc732704c8dbf7a79df9 --- /dev/null +++ b/annotations_filtered/w3HklXic1eY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.36], [7.0, 7.47], [8.0, 8.56], [10.0, 12.06], [16.0, 16.46], [20.0, 21.56], [30.0, 30.43], [31.0, 32.07], [34.0, 34.5], [35.0, 35.68], [39.0, 100.82], [104.0, 106.2], [108.0, 112.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 69.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.19, 62.27], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.36, 0.47, 0.56, 2.06, 0.46, 1.56, 0.43, 1.07, 0.5, 0.68, 61.82, 2.2, 4.56]} \ No newline at end of file diff --git a/annotations_filtered/w3hwZ-7CWeg_filtered.json b/annotations_filtered/w3hwZ-7CWeg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ccdd586fd5d403978351b95f4aa2bdbf50babae --- /dev/null +++ b/annotations_filtered/w3hwZ-7CWeg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 24.49], [25.0, 28.59], [29.0, 50.8], [51.0, 108.28], [111.0, 116.99], [118.0, 120.01], [121.0, 126.23], [128.0, 132.54]], "keep_status": [true, false, true, false, false, false, true, false], "silence_prob": [43.03, 41.93, 44.72, 0.0, 63.64, 97.64, 30.25, 30.48], "audiomae_on_audioset": [[["hum", 34.0], ["mains hum", 17.93], ["music", 9.69]], [["hum", 43.9], ["mains hum", 19.96], ["sidetone", 10.82]], [["hum", 38.27], ["speech", 20.81], ["whale vocalization", 7.59]], null, null, null, [["animal", 24.61], ["speech", 20.09], ["dog", 19.03]], [["dog", 29.15], ["animal", 25.67], ["domestic animals, pets", 19.44]]], "duration": [15.49, 3.59, 21.8, 57.28, 5.99, 2.01, 5.23, 4.54]} \ No newline at end of file diff --git a/annotations_filtered/w3sv1-F1JeI_filtered.json b/annotations_filtered/w3sv1-F1JeI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eda02d67a7baf73b1d3f906388bed093361c55c0 --- /dev/null +++ b/annotations_filtered/w3sv1-F1JeI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.27], [14.0, 14.98], [17.0, 16.6], [18.0, 18.5], [21.0, 21.63], [23.0, 34.05], [36.0, 40.0], [41.0, 41.91], [43.0, 43.58], [46.0, 46.35], [47.0, 48.52], [53.0, 61.67], [65.0, 72.54], [74.0, 74.21], [75.0, 76.2], [77.0, 77.7], [95.0, 96.8], [102.0, 107.13], [126.0, 126.89], [129.0, 129.27], [131.0, 131.35], [135.0, 135.16], [136.0, 139.41], [146.0, 147.14], [151.0, 178.65], [183.0, 183.51]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 28.57, 58.38, 0.0, 0.0, 0.0, 0.0, 59.68, 34.67, 0.0, 0.0, 0.0, 0.0, 64.75, 0.0, 0.0, 0.0, 0.0, 31.21, 0.0, 31.24, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 27.53], ["music", 14.77], ["mains hum", 13.47]], null, null, null, null, null, null, [["speech", 53.39], ["sidetone", 10.51], ["dial tone", 7.62]], null, null, null, null, null, null, null, null, null, [["speech", 40.35], ["music", 11.99], ["rumble", 5.58]], null, [["explosion", 52.47], ["speech", 15.38], ["burst, pop", 6.95]], null], "duration": [0.27, 0.98, -0.4, 0.5, 0.63, 11.05, 4.0, 0.91, 0.58, 0.35, 1.52, 8.67, 7.54, 0.21, 1.2, 0.7, 1.8, 5.13, 0.89, 0.27, 0.35, 0.16, 3.41, 1.14, 27.65, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/w4-b-D0iByQ_filtered.json b/annotations_filtered/w4-b-D0iByQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae535ec151104992897f26109b7dd948784fcdae --- /dev/null +++ b/annotations_filtered/w4-b-D0iByQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.18], [4.0, 4.99], [8.0, 8.34], [11.0, 10.84], [11.0, 11.43], [13.0, 14.39], [20.0, 20.43], [21.0, 21.73], [22.0, 22.72], [26.0, 25.98], [32.0, 32.61], [41.0, 41.61], [43.0, 43.97], [48.0, 49.22], [51.0, 51.36], [52.0, 59.9], [62.0, 62.88], [69.0, 69.25], [70.0, 70.34], [72.0, 72.72], [74.0, 90.76], [96.0, 100.18], [104.0, 106.39], [107.0, 108.01], [109.0, 109.9], [113.0, 113.61], [115.0, 117.66], [119.0, 120.21], [128.0, 129.49], [132.0, 132.71], [134.0, 134.81], [138.0, 138.57], [141.0, 145.47], [148.0, 147.92], [148.0, 148.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.66, 0.0, 0.0, 0.0, 0.0, 77.87, 100.0, 94.66, 0.0, 0.0, 0.0, 88.64, 0.0, 0.0, 0.0, 0.0, 0.0, 99.85, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.18, 0.99, 0.34, -0.16, 0.43, 1.39, 0.43, 0.73, 0.72, -0.02, 0.61, 0.61, 0.97, 1.22, 0.36, 7.9, 0.88, 0.25, 0.34, 0.72, 16.76, 4.18, 2.39, 1.01, 0.9, 0.61, 2.66, 1.21, 1.49, 0.71, 0.81, 0.57, 4.47, -0.08, 0.93]} \ No newline at end of file diff --git a/annotations_filtered/w424xCe0eGQ_filtered.json b/annotations_filtered/w424xCe0eGQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa9afa5f95c6441817fe64ee5e53cf8366429b8d --- /dev/null +++ b/annotations_filtered/w424xCe0eGQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.79], [4.0, 5.26], [7.0, 9.26], [14.0, 16.31], [19.0, 19.58], [23.0, 25.69], [26.0, 27.77], [30.0, 32.46], [33.0, 33.61], [36.0, 36.05], [39.0, 40.71], [41.0, 50.92], [54.0, 56.84], [59.0, 61.55], [64.0, 65.72], [67.0, 68.79], [71.0, 74.95], [77.0, 76.77], [79.0, 83.96], [89.0, 91.03], [95.0, 95.22], [97.0, 102.74], [105.0, 107.16], [111.0, 135.97], [138.0, 140.19], [141.0, 145.61]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, true, false, false, false, true, false, true, true, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 40.17, 39.11, 0.0, 40.52, 0.0, 42.0, 0.0, 0.0, 0.0, 33.58, 34.37, 35.15, 0.0, 0.0, 37.43, 0.0, 32.36, 30.64, 0.0, 31.89, 33.86, 31.99, 35.59, 38.59], "audiomae_on_audioset": [null, null, [["music", 37.83], ["speech", 28.92], ["hum", 8.84]], [["hum", 32.74], ["throbbing", 18.48], ["music", 16.93]], null, [["speech", 40.59], ["music", 35.71], ["hum", 7.84]], null, [["music", 35.37], ["didgeridoo", 14.97], ["theremin", 7.62]], null, null, null, [["music", 40.22], ["synthesizer", 21.26], ["speech", 8.89]], [["music", 45.27], ["marimba, xylophone", 6.59], ["musical instrument", 5.59]], [["music", 59.47], ["speech", 9.31], ["musical instrument", 4.82]], null, null, [["music", 44.85], ["speech", 15.82], ["hum", 5.17]], null, [["music", 34.43], ["speech", 6.69], ["quack", 5.86]], [["music", 51.5], ["vibraphone", 10.14], ["musical instrument", 7.89]], null, [["music", 54.26], ["musical instrument", 11.18], ["harmonic", 3.97]], [["music", 37.49], ["percussion", 10.88], ["musical instrument", 9.78]], [["music", 68.82], ["musical instrument", 7.71], ["marimba, xylophone", 1.68]], [["music", 48.22], ["throbbing", 19.11], ["hum", 11.09]], [["music", 23.91], ["vibraphone", 19.93], ["marimba, xylophone", 14.16]]], "duration": [0.79, 1.26, 2.26, 2.31, 0.58, 2.69, 1.77, 2.46, 0.61, 0.05, 1.71, 9.92, 2.84, 2.55, 1.72, 1.79, 3.95, -0.23, 4.96, 2.03, 0.22, 5.74, 2.16, 24.97, 2.19, 4.61]} \ No newline at end of file diff --git a/annotations_filtered/w4TCxFKaqIw_filtered.json b/annotations_filtered/w4TCxFKaqIw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac71cfe1770390f8d6b553ce31058a3d71af2c42 --- /dev/null +++ b/annotations_filtered/w4TCxFKaqIw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 27.4], [29.0, 29.86], [31.0, 32.54], [33.0, 34.13], [36.0, 45.18], [46.0, 47.24], [52.0, 53.42], [58.0, 61.38], [63.0, 63.46], [67.0, 69.43], [70.0, 73.79], [74.0, 76.4], [77.0, 79.69], [83.0, 83.83], [92.0, 92.43], [97.0, 97.44], [98.0, 98.46], [99.0, 99.89], [101.0, 102.32], [104.0, 104.8], [106.0, 106.51]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [36.31, 0.0, 0.0, 0.0, 70.02, 0.0, 0.0, 33.71, 0.0, 36.78, 42.91, 39.22, 36.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 61.32], ["knock", 11.39], ["brass instrument", 3.79]], null, null, null, null, null, null, [["throbbing", 19.78], ["speech", 8.37], ["heart sounds, heartbeat", 6.49]], null, [["speech", 47.44], ["radio", 26.04], ["vehicle", 4.5]], [["speech", 41.07], ["music", 27.18], ["hum", 8.78]], [["hum", 20.39], ["mains hum", 17.61], ["didgeridoo", 13.11]], [["speech", 36.13], ["music", 23.45], ["didgeridoo", 9.68]], null, null, null, null, null, null, null, null], "duration": [5.4, 0.86, 1.54, 1.13, 9.18, 1.24, 1.42, 3.38, 0.46, 2.43, 3.79, 2.4, 2.69, 0.83, 0.43, 0.44, 0.46, 0.89, 1.32, 0.8, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/w4i_ZwMT3H0_filtered.json b/annotations_filtered/w4i_ZwMT3H0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9557478bb788bc795e49b4d99a9507610d9df385 --- /dev/null +++ b/annotations_filtered/w4i_ZwMT3H0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.18], [5.0, 4.94], [6.0, 6.72], [10.0, 11.42], [12.0, 14.18], [15.0, 16.23], [17.0, 17.9], [18.0, 19.8], [21.0, 22.28], [23.0, 24.12], [25.0, 26.03], [26.0, 26.74], [28.0, 28.58], [29.0, 29.67], [31.0, 31.7], [32.0, 35.31], [39.0, 45.49], [46.0, 48.29], [52.0, 61.2], [63.0, 64.5], [67.0, 68.27], [71.0, 72.42], [75.0, 75.25], [78.0, 91.98], [93.0, 100.65], [101.0, 106.71], [111.0, 110.76], [111.0, 111.23], [112.0, 112.51], [113.0, 115.64], [116.0, 116.9], [123.0, 123.85], [124.0, 125.36], [128.0, 130.72], [135.0, 135.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 73.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.71, 96.42, 88.1, 86.64, 0.0, 0.0, 0.0, 0.0, 44.49, 37.16, 39.12, 0.0, 0.0, 0.0, 31.85, 0.0, 0.0, 0.0, 37.85, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.74], ["hum", 5.43], ["electronic music", 4.63]], [["music", 36.7], ["theremin", 29.22], ["musical instrument", 5.15]], [["hum", 16.02], ["thunk", 12.9], ["music", 10.26]], null, null, null, [["music", 40.78], ["speech", 35.34], ["radio", 3.32]], null, null, null, [["music", 39.73], ["theremin", 12.43], ["musical instrument", 8.82]], null], "duration": [1.18, -0.06, 0.72, 1.42, 2.18, 1.23, 0.9, 1.8, 1.28, 1.12, 1.03, 0.74, 0.58, 0.67, 0.7, 3.31, 6.49, 2.29, 9.2, 1.5, 1.27, 1.42, 0.25, 13.98, 7.65, 5.71, -0.24, 0.23, 0.51, 2.64, 0.9, 0.85, 1.36, 2.72, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/w4liPmQEPEU_filtered.json b/annotations_filtered/w4liPmQEPEU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f2303e42902695c6822661defc17a169d41bab7 --- /dev/null +++ b/annotations_filtered/w4liPmQEPEU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.79], [9.0, 10.61], [13.0, 14.28], [16.0, 16.87], [20.0, 20.58], [22.0, 23.21], [26.0, 26.35], [30.0, 31.19], [35.0, 44.66], [45.0, 45.67], [46.0, 47.76], [49.0, 49.86], [51.0, 54.84], [56.0, 56.39], [57.0, 116.51], [119.0, 119.13], [119.0, 153.28]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.03, 0.0, 0.0, 0.0, 42.86, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 37.35], ["hum", 17.27], ["breaking", 13.43]], null, null, null, [["music", 56.47], ["hum", 9.19], ["mains hum", 4.33]], null, null, null, null], "duration": [-0.21, 1.61, 1.28, 0.87, 0.58, 1.21, 0.35, 1.19, 9.66, 0.67, 1.76, 0.86, 3.84, 0.39, 59.51, 0.13, 34.28]} \ No newline at end of file diff --git a/annotations_filtered/w57ga2Yiic4_filtered.json b/annotations_filtered/w57ga2Yiic4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96624820084200c8258cb3b4ff4c99f3d08e5e94 --- /dev/null +++ b/annotations_filtered/w57ga2Yiic4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.2], [9.0, 15.21], [16.0, 18.15], [19.0, 20.85], [22.0, 22.94], [24.0, 26.77], [30.0, 30.72], [32.0, 32.46], [33.0, 37.66], [38.0, 66.16], [69.0, 76.91], [80.0, 83.3], [84.0, 86.66], [90.0, 103.5], [105.0, 112.87], [115.0, 116.72], [117.0, 130.74], [132.0, 134.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.73, 99.73, 0.0, 0.0, 99.96, 0.0, 0.0, 98.36, 94.22, 98.36, 98.99, 97.43, 93.13, 99.96, 0.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.2, 6.21, 2.15, 1.85, 0.94, 2.77, 0.72, 0.46, 4.66, 28.16, 7.91, 3.3, 2.66, 13.5, 7.87, 1.72, 13.74, 2.22]} \ No newline at end of file diff --git a/annotations_filtered/w5EQRIoHjQg_filtered.json b/annotations_filtered/w5EQRIoHjQg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/w5EQRIoHjQg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/w5PGP9-_x5E_filtered.json b/annotations_filtered/w5PGP9-_x5E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ae7cc86a712b0e0f595992c37ac24bdc5b70151 --- /dev/null +++ b/annotations_filtered/w5PGP9-_x5E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.07], [29.0, 29.67], [31.0, 32.21], [68.0, 72.06], [73.0, 73.77], [76.0, 76.33], [77.0, 77.85], [82.0, 81.97], [98.0, 97.66], [98.0, 98.66], [121.0, 121.86], [125.0, 125.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 38.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 77.33], ["noise", 3.67], ["beatboxing", 3.12]], null, null, null, null, null, null, null, null], "duration": [0.07, 0.67, 1.21, 4.06, 0.77, 0.33, 0.85, -0.03, -0.34, 0.66, 0.86, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/w5mtX7FnO3M_filtered.json b/annotations_filtered/w5mtX7FnO3M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7d19a7c8d3684f230d69bb1a174b8740f307588 --- /dev/null +++ b/annotations_filtered/w5mtX7FnO3M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.33], [5.0, 5.39], [6.0, 7.25], [8.0, 8.4], [10.0, 22.28], [23.0, 24.92], [28.0, 44.41], [48.0, 48.88], [50.0, 50.99], [52.0, 53.38], [55.0, 55.39], [57.0, 56.96], [59.0, 61.52], [63.0, 79.07], [80.0, 106.93], [110.0, 113.66], [115.0, 117.66], [120.0, 121.51], [122.0, 122.1], [122.0, 125.44], [133.0, 133.68], [136.0, 136.22], [140.0, 140.53], [142.0, 147.92], [150.0, 151.85], [152.0, 160.73], [162.0, 162.36], [163.0, 171.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.98, 0.0, 0.0, 0.0, 87.55, 0.0, 92.31, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 93.6, 98.27, 90.78, 98.51, 0.0, 0.0, 94.95, 0.0, 0.0, 0.0, 71.87, 0.0, 73.36, 0.0, 60.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.33, 0.39, 1.25, 0.4, 12.28, 1.92, 16.41, 0.88, 0.99, 1.38, 0.39, -0.04, 2.52, 16.07, 26.93, 3.66, 2.66, 1.51, 0.1, 3.44, 0.68, 0.22, 0.53, 5.92, 1.85, 8.73, 0.36, 8.05]} \ No newline at end of file diff --git a/annotations_filtered/w5oWgKtku3Q_filtered.json b/annotations_filtered/w5oWgKtku3Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f900a93fea05cb3652e0d851362bd923d4f275aa --- /dev/null +++ b/annotations_filtered/w5oWgKtku3Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.45], [8.0, 7.52], [8.0, 9.44], [19.0, 21.34], [22.0, 24.75], [26.0, 29.54], [30.0, 41.82], [42.0, 42.55], [48.0, 49.17], [50.0, 54.53], [57.0, 57.35], [63.0, 68.79], [78.0, 79.15], [82.0, 83.83], [87.0, 89.58], [90.0, 94.73], [96.0, 108.46], [109.0, 113.54], [115.0, 118.18], [122.0, 122.49], [124.0, 124.31]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 54.17, 97.54, 70.16, 31.26, 0.0, 0.0, 47.94, 0.0, 76.86, 0.0, 0.0, 83.52, 43.71, 30.25, 28.99, 29.14, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["fart", 28.45], ["whack, thwack", 17.1], ["speech", 6.04]], null, null, [["speech", 39.31], ["sine wave", 23.58], ["chirp tone", 10.52]], null, null, null, null, null, [["music", 33.22], ["speech", 29.15], ["musical instrument", 5.9]], [["heart sounds, heartbeat", 59.04], ["throbbing", 16.01], ["hum", 8.7]], [["hum", 50.34], ["throbbing", 33.94], ["speech", 6.91]], [["hum", 40.08], ["throbbing", 27.44], ["music", 11.86]], null, null], "duration": [0.45, -0.48, 1.44, 2.34, 2.75, 3.54, 11.82, 0.55, 1.17, 4.53, 0.35, 5.79, 1.15, 1.83, 2.58, 4.73, 12.46, 4.54, 3.18, 0.49, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/w5pn48wzBuw_filtered.json b/annotations_filtered/w5pn48wzBuw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6afeaa4195f14db27775fd5beb30055aadd71e5d --- /dev/null +++ b/annotations_filtered/w5pn48wzBuw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.01], [21.0, 26.05], [28.0, 35.83], [42.0, 42.75], [44.0, 72.15]], "keep_status": [true, false, true, false, true], "silence_prob": [34.71, 30.61, 30.64, 0.0, 33.06], "audiomae_on_audioset": [[["speech", 43.19], ["mains hum", 11.06], ["hum", 7.42]], [["music", 54.96], ["speech", 11.69], ["didgeridoo", 9.09]], [["theremin", 20.8], ["hum", 18.23], ["music", 16.26]], null, [["gong", 21.49], ["speech", 15.0], ["mains hum", 13.97]]], "duration": [2.01, 5.05, 7.83, 0.75, 28.15]} \ No newline at end of file diff --git a/annotations_filtered/w5yJV_TKOWg_filtered.json b/annotations_filtered/w5yJV_TKOWg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..185fa79e73dc75766f0531f8c871cf9ad04f2961 --- /dev/null +++ b/annotations_filtered/w5yJV_TKOWg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.71], [2.0, 4.4], [5.0, 6.32], [26.0, 43.41], [45.0, 45.52], [47.0, 48.36], [51.0, 51.29], [53.0, 56.74], [67.0, 68.66], [70.0, 95.88], [97.0, 97.58], [99.0, 107.01], [110.0, 111.27], [114.0, 121.09]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, true], "silence_prob": [0.0, 58.64, 0.0, 29.63, 0.0, 0.0, 0.0, 28.74, 0.0, 28.8, 0.0, 28.59, 0.0, 28.73], "audiomae_on_audioset": [null, null, null, [["speech", 64.33], ["music", 11.25], ["hum", 5.16]], null, null, null, [["throbbing", 33.48], ["hum", 26.93], ["music", 17.35]], null, [["speech", 24.77], ["music", 21.28], ["outside, rural or natural", 7.04]], null, [["music", 30.67], ["speech", 20.92], ["groan", 5.44]], null, [["speech", 42.58], ["music", 6.83], ["explosion", 5.19]]], "duration": [0.71, 2.4, 1.32, 17.41, 0.52, 1.36, 0.29, 3.74, 1.66, 25.88, 0.58, 8.01, 1.27, 7.09]} \ No newline at end of file diff --git a/annotations_filtered/w610fTL5O-A_filtered.json b/annotations_filtered/w610fTL5O-A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4348fc00d75f1b5ceae60f29b8ab18a957e2d860 --- /dev/null +++ b/annotations_filtered/w610fTL5O-A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.2], [4.0, 5.09], [7.0, 6.96], [8.0, 11.16], [13.0, 14.49], [15.0, 15.43], [18.0, 25.0], [28.0, 38.4], [40.0, 45.93], [47.0, 47.66], [52.0, 51.9], [52.0, 78.36]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 99.94, 42.55, 44.04, 0.0, 0.0, 32.03], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 28.28], ["gunshot, gunfire", 12.02], ["machine gun", 11.23]], [["thunk", 53.85], ["speech", 15.72], ["hum", 4.26]], null, null, [["speech", 36.39], ["mains hum", 21.82], ["hum", 13.89]]], "duration": [0.2, 1.09, -0.04, 3.16, 1.49, 0.43, 7.0, 10.4, 5.93, 0.66, -0.1, 26.36]} \ No newline at end of file diff --git a/annotations_filtered/w6RItV0ZDgI_filtered.json b/annotations_filtered/w6RItV0ZDgI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5631de4a5902e9bbe67d470dd874d0aa639cedf --- /dev/null +++ b/annotations_filtered/w6RItV0ZDgI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.04], [50.0, 50.36], [53.0, 53.86], [58.0, 60.84], [61.0, 61.8], [64.0, 64.45], [93.0, 93.33], [95.0, 95.77], [109.0, 109.22], [142.0, 142.53], [144.0, 143.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 38.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["chirp tone", 69.83], ["sine wave", 13.31], ["speech", 6.4]], null, null, null, null, null, null, null], "duration": [0.04, 0.36, 0.86, 2.84, 0.8, 0.45, 0.33, 0.77, 0.22, 0.53, -0.12]} \ No newline at end of file diff --git a/annotations_filtered/w6USFL0JYAU_filtered.json b/annotations_filtered/w6USFL0JYAU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3d4beb1099644efdd2d70d8aabb9ed3ced931dc --- /dev/null +++ b/annotations_filtered/w6USFL0JYAU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.28], [25.0, 33.66], [34.0, 35.36], [36.0, 39.51], [41.0, 43.28], [45.0, 44.63], [57.0, 60.56], [74.0, 93.5], [110.0, 110.62], [127.0, 130.23], [132.0, 135.36], [137.0, 137.29], [140.0, 141.89], [142.0, 143.45], [144.0, 145.69], [147.0, 149.05], [150.0, 150.38]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [87.92, 34.07, 0.0, 36.25, 49.54, 0.0, 50.66, 31.09, 0.0, 69.07, 36.13, 0.0, 0.0, 0.0, 0.0, 41.1, 0.0], "audiomae_on_audioset": [null, [["music", 71.62], ["theremin", 4.68], ["musical instrument", 4.47]], null, [["music", 58.23], ["theremin", 6.96], ["musical instrument", 4.89]], [["music", 44.44], ["ambient music", 4.54], ["theremin", 4.31]], null, null, [["music", 76.7], ["boing", 2.25], ["animal", 2.17]], null, null, [["music", 56.65], ["groan", 10.81], ["screaming", 6.34]], null, null, null, null, [["music", 44.23], ["thunk", 44.23], ["ice cream truck, ice cream van", 1.09]], null], "duration": [2.28, 8.66, 1.36, 3.51, 2.28, -0.37, 3.56, 19.5, 0.62, 3.23, 3.36, 0.29, 1.89, 1.45, 1.69, 2.05, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/w6YTq-3hmnA_filtered.json b/annotations_filtered/w6YTq-3hmnA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88d6fdb76fdeb5841fc91c40554eff10ad85be35 --- /dev/null +++ b/annotations_filtered/w6YTq-3hmnA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.51], [9.0, 9.27], [14.0, 15.57], [18.0, 18.82], [31.0, 31.29], [33.0, 34.65], [76.0, 76.76], [82.0, 85.18], [93.0, 94.49], [101.0, 101.39], [105.0, 105.56], [114.0, 115.16], [118.0, 120.07]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.08, 0.0, 0.0, 0.0, 0.0, 48.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["breaking", 33.67], ["speech", 14.91], ["tuning fork", 12.92]], null, null, null, null, [["music", 62.23], ["throbbing", 5.61], ["hum", 3.09]]], "duration": [0.51, 0.27, 1.57, 0.82, 0.29, 1.65, 0.76, 3.18, 1.49, 0.39, 0.56, 1.16, 2.07]} \ No newline at end of file diff --git a/annotations_filtered/w6ivjvOqBy0_filtered.json b/annotations_filtered/w6ivjvOqBy0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61b8baae16117694ea5b57ebe074f28b20b5ffa8 --- /dev/null +++ b/annotations_filtered/w6ivjvOqBy0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.29], [14.0, 15.58], [19.0, 18.72], [20.0, 20.95], [24.0, 24.63], [25.0, 25.86], [36.0, 36.66], [39.0, 43.31], [70.0, 71.29], [78.0, 78.83], [79.0, 80.38], [88.0, 91.66], [101.0, 101.04], [101.0, 101.73], [102.0, 102.68], [104.0, 103.89], [107.0, 115.33], [117.0, 121.56], [122.0, 122.66], [123.0, 134.35], [136.0, 138.89], [148.0, 164.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.8, 0.0, 0.0, 0.0, 32.1, 0.0, 0.0, 0.0, 0.0, 30.38, 31.12, 0.0, 28.97, 28.89, 29.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 51.8], ["thunk", 11.68], ["whack, thwack", 8.18]], null, null, null, [["music", 33.06], ["speech", 25.43], ["theremin", 10.59]], null, null, null, null, [["whale vocalization", 51.66], ["cattle, bovinae", 13.68], ["moo", 10.43]], [["speech", 47.45], ["music", 18.64], ["explosion", 7.85]], null, [["mosquito", 57.38], ["fly, housefly", 27.18], ["insect", 14.71]], [["speech", 58.46], ["vehicle", 10.17], ["car", 3.09]], [["livestock, farm animals, working animals", 41.32], ["cattle, bovinae", 17.85], ["moo", 13.53]]], "duration": [1.29, 1.58, -0.28, 0.95, 0.63, 0.86, 0.66, 4.31, 1.29, 0.83, 1.38, 3.66, 0.04, 0.73, 0.68, -0.11, 8.33, 4.56, 0.66, 11.35, 2.89, 16.73]} \ No newline at end of file diff --git a/annotations_filtered/w6kumXHaOeI_filtered.json b/annotations_filtered/w6kumXHaOeI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..681b3336f9cd339792b7241cd5f7e7b2a42b6c01 --- /dev/null +++ b/annotations_filtered/w6kumXHaOeI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 3.75], [5.0, 5.53], [7.0, 7.5], [9.0, 10.13], [11.0, 13.09], [15.0, 15.21], [20.0, 20.01], [23.0, 23.63], [25.0, 25.84], [27.0, 27.24], [29.0, 29.98], [31.0, 31.5], [33.0, 34.75], [36.0, 36.78], [38.0, 39.39], [40.0, 41.71], [46.0, 46.48], [47.0, 47.51], [50.0, 56.35], [59.0, 58.95], [60.0, 60.25], [63.0, 62.99], [63.0, 64.35], [65.0, 65.57], [67.0, 67.53], [68.0, 68.57], [73.0, 74.16], [75.0, 75.59], [78.0, 79.27], [80.0, 81.35], [83.0, 84.64], [85.0, 85.18], [87.0, 88.7], [90.0, 90.71], [93.0, 93.63], [96.0, 97.04], [98.0, 98.56], [100.0, 102.29], [105.0, 106.44], [107.0, 107.7], [108.0, 110.91], [114.0, 113.75], [114.0, 118.29], [122.0, 122.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [67.51, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 84.8, 0.0, 52.39, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.75, 0.53, 0.5, 1.13, 2.09, 0.21, 0.01, 0.63, 0.84, 0.24, 0.98, 0.5, 1.75, 0.78, 1.39, 1.71, 0.48, 0.51, 6.35, -0.05, 0.25, -0.01, 1.35, 0.57, 0.53, 0.57, 1.16, 0.59, 1.27, 1.35, 1.64, 0.18, 1.7, 0.71, 0.63, 1.04, 0.56, 2.29, 1.44, 0.7, 2.91, -0.25, 4.29, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/w6n3WpRNWTs_filtered.json b/annotations_filtered/w6n3WpRNWTs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebd796b05268e5a96ed3227b9a7bf808c914d398 --- /dev/null +++ b/annotations_filtered/w6n3WpRNWTs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.35], [13.0, 12.87], [13.0, 13.86], [15.0, 15.08], [17.0, 17.17], [29.0, 28.86], [31.0, 32.48], [34.0, 47.29], [51.0, 51.75], [52.0, 53.06], [60.0, 62.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [65.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.86, 0.0, 0.0, 96.42], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [2.35, -0.13, 0.86, 0.08, 0.17, -0.14, 1.48, 13.29, 0.75, 1.06, 2.46]} \ No newline at end of file diff --git a/annotations_filtered/w6zGX2qpxzU_filtered.json b/annotations_filtered/w6zGX2qpxzU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2fd1b3d0a0bba98627ee72a4623ba6d8c1949fcb --- /dev/null +++ b/annotations_filtered/w6zGX2qpxzU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.16], [27.0, 27.8], [41.0, 42.21], [45.0, 45.1], [48.0, 48.83], [50.0, 49.96], [52.0, 53.01], [67.0, 67.8], [77.0, 77.16], [81.0, 81.85], [83.0, 83.47], [86.0, 86.76], [90.0, 91.17], [97.0, 97.17], [99.0, 100.43], [105.0, 106.52], [107.0, 108.95], [119.0, 120.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.16, 0.8, 1.21, 0.1, 0.83, -0.04, 1.01, 0.8, 0.16, 0.85, 0.47, 0.76, 1.17, 0.17, 1.43, 1.52, 1.95, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/w71n9tHYuIw_filtered.json b/annotations_filtered/w71n9tHYuIw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f5c9435082a65628ebc2913b5229c2b84cf9835 --- /dev/null +++ b/annotations_filtered/w71n9tHYuIw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.8], [20.0, 20.55], [22.0, 22.18], [23.0, 23.6], [27.0, 28.41], [29.0, 31.09], [31.0, 37.93], [38.0, 38.35], [39.0, 42.55], [45.0, 44.98], [52.0, 52.64], [61.0, 61.8], [73.0, 73.68], [75.0, 74.98], [76.0, 95.54], [96.0, 98.51], [99.0, 102.0], [103.0, 107.08], [108.0, 110.96], [112.0, 114.88], [116.0, 120.23], [121.0, 128.31], [129.0, 128.8], [129.0, 128.83], [129.0, 128.9], [129.0, 128.97], [129.0, 129.0], [129.0, 129.07]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 43.18, 60.98, 0.0, 75.55, 0.0, 0.0, 0.0, 0.0, 0.0, 99.31, 99.71, 99.99, 100.0, 100.0, 100.0, 100.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 59.2], ["electric shaver, electric razor", 4.15], ["inside, small room", 3.85]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.2, 0.55, 0.18, 0.6, 1.41, 2.09, 6.93, 0.35, 3.55, -0.02, 0.64, 0.8, 0.68, -0.02, 19.54, 2.51, 3.0, 4.08, 2.96, 2.88, 4.23, 7.31, -0.2, -0.17, -0.1, -0.03, 0.0, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/w71pHLUz2i0_filtered.json b/annotations_filtered/w71pHLUz2i0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db33a535edc9f50ea7f500403ba8d725369b8be8 --- /dev/null +++ b/annotations_filtered/w71pHLUz2i0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.43], [6.0, 8.58], [10.0, 10.25], [14.0, 14.89], [16.0, 18.55], [20.0, 20.55], [21.0, 21.36], [23.0, 23.89], [31.0, 31.56], [32.0, 35.67], [44.0, 44.37], [46.0, 47.87], [53.0, 54.46], [62.0, 63.21], [65.0, 66.82], [69.0, 76.5], [84.0, 88.01], [89.0, 91.05], [92.0, 97.23], [102.0, 111.94], [115.0, 116.53], [121.0, 121.34], [122.0, 123.33], [125.0, 126.57], [129.0, 130.45], [132.0, 133.34], [134.0, 136.38], [137.0, 137.76], [138.0, 138.74]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.35, 0.0, 0.0, 29.99, 0.0, 0.0, 0.0, 0.0, 30.55, 0.0, 0.0, 0.0, 0.0, 0.0, 33.25, 50.91, 44.34, 41.5, 32.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.88, 0.0, 0.0], "audiomae_on_audioset": [null, [["throbbing", 34.63], ["hum", 14.15], ["music", 11.36]], null, null, [["speech", 37.42], ["boing", 19.26], ["music", 14.68]], null, null, null, null, [["music", 27.3], ["speech", 22.08], ["boing", 20.32]], null, null, null, null, null, [["boing", 43.5], ["speech", 25.43], ["music", 15.83]], null, [["music", 66.59], ["didgeridoo", 3.65], ["musical instrument", 2.62]], [["music", 45.92], ["speech", 16.95], ["hum", 9.86]], [["mosquito", 21.4], ["music", 15.77], ["fly, housefly", 8.58]], null, null, null, null, null, null, null, null, null], "duration": [0.43, 2.58, 0.25, 0.89, 2.55, 0.55, 0.36, 0.89, 0.56, 3.67, 0.37, 1.87, 1.46, 1.21, 1.82, 7.5, 4.01, 2.05, 5.23, 9.94, 1.53, 0.34, 1.33, 1.57, 1.45, 1.34, 2.38, 0.76, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/w7ZY9tqDsEc_filtered.json b/annotations_filtered/w7ZY9tqDsEc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0853b64d4f17916830680df2beba87f7ca6230f9 --- /dev/null +++ b/annotations_filtered/w7ZY9tqDsEc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.32], [8.0, 9.59], [14.0, 16.6], [20.0, 21.14], [23.0, 26.22], [27.0, 28.17], [29.0, 30.11], [31.0, 35.48], [36.0, 37.93], [41.0, 41.82], [43.0, 45.76], [47.0, 50.04], [51.0, 53.08], [54.0, 55.76], [58.0, 57.67], [58.0, 60.17], [62.0, 64.08], [65.0, 65.94], [67.0, 69.26], [70.0, 71.27], [72.0, 72.18], [73.0, 74.04], [75.0, 78.16], [81.0, 82.11], [83.0, 83.35], [84.0, 86.81], [87.0, 90.26], [92.0, 100.33], [102.0, 102.88], [104.0, 108.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 100.0, 0.0, 97.92, 0.0, 0.0, 100.0, 0.0, 0.0, 99.99, 76.7, 100.0, 0.0, 0.0, 98.99, 75.72, 0.0, 99.99, 0.0, 0.0, 0.0, 99.94, 0.0, 0.0, 96.54, 99.59, 100.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.32, 1.59, 2.6, 1.14, 3.22, 1.17, 1.11, 4.48, 1.93, 0.82, 2.76, 3.04, 2.08, 1.76, -0.33, 2.17, 2.08, 0.94, 2.26, 1.27, 0.18, 1.04, 3.16, 1.11, 0.35, 2.81, 3.26, 8.33, 0.88, 4.31]} \ No newline at end of file diff --git a/annotations_filtered/w7ngnhj4snE_filtered.json b/annotations_filtered/w7ngnhj4snE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c845da5f0d63b5aab3c5358d534cfd3807005d63 --- /dev/null +++ b/annotations_filtered/w7ngnhj4snE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.43], [4.0, 4.23], [4.0, 6.86], [7.0, 9.32], [16.0, 18.93], [24.0, 24.71], [32.0, 32.34], [33.0, 33.88], [37.0, 38.2], [41.0, 44.19], [56.0, 56.79], [63.0, 65.65], [66.0, 75.24], [79.0, 82.41], [83.0, 85.45], [86.0, 86.09], [86.0, 92.16], [94.0, 95.44], [98.0, 98.41], [99.0, 99.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.95, 99.73, 86.82, 0.0, 0.0, 0.0, 0.0, 41.62, 0.0, 64.86, 79.41, 64.97, 52.39, 0.0, 53.84, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 42.33], ["moo", 36.52], ["livestock, farm animals, working animals", 20.64]], null, null, null, null, null, null, null, null, null, null], "duration": [0.43, 0.23, 2.86, 2.32, 2.93, 0.71, 0.34, 0.88, 1.2, 3.19, 0.79, 2.65, 9.24, 3.41, 2.45, 0.09, 6.16, 1.44, 0.41, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/w7tqVEdyteg_filtered.json b/annotations_filtered/w7tqVEdyteg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2142b30378bd924f3e0f568aafafbbbe68d8927f --- /dev/null +++ b/annotations_filtered/w7tqVEdyteg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[85.0, 93.53], [98.0, 98.05]], "keep_status": [false, false], "silence_prob": [68.41, 0.0], "audiomae_on_audioset": [null, null], "duration": [8.53, 0.05]} \ No newline at end of file diff --git a/annotations_filtered/w80ZSg7kNbE_filtered.json b/annotations_filtered/w80ZSg7kNbE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3ed5cb3757aae95ea5319557abd9cb65bc95c21 --- /dev/null +++ b/annotations_filtered/w80ZSg7kNbE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.89], [11.0, 14.0], [16.0, 17.41], [18.0, 19.25], [20.0, 21.39], [25.0, 26.96], [45.0, 45.47], [49.0, 58.95], [59.0, 71.36], [73.0, 74.58], [76.0, 77.03], [78.0, 78.04], [80.0, 85.58], [87.0, 87.84], [90.0, 92.82], [93.0, 94.51], [98.0, 99.1], [104.0, 110.56], [111.0, 123.47]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 93.76, 0.0, 0.0, 0.0, 0.0, 0.0, 30.78, 33.69, 0.0, 0.0, 0.0, 99.93, 0.0, 88.28, 0.0, 0.0, 87.37, 52.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 47.06], ["brass instrument", 5.38], ["trombone", 4.37]], [["music", 63.56], ["musical instrument", 4.84], ["effects unit", 4.21]], null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 3.0, 1.41, 1.25, 1.39, 1.96, 0.47, 9.95, 12.36, 1.58, 1.03, 0.04, 5.58, 0.84, 2.82, 1.51, 1.1, 6.56, 12.47]} \ No newline at end of file diff --git a/annotations_filtered/w80bZTK88mc_filtered.json b/annotations_filtered/w80bZTK88mc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3fe8b9147fc7627ba8e8f25387601c16d0775c6e --- /dev/null +++ b/annotations_filtered/w80bZTK88mc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.67], [21.0, 24.92], [26.0, 43.92]], "keep_status": [false, false, true], "silence_prob": [0.0, 100.0, 48.35], "audiomae_on_audioset": [null, null, [["speech", 31.98], ["insect", 11.24], ["cricket", 10.61]]], "duration": [0.67, 3.92, 17.92]} \ No newline at end of file diff --git a/annotations_filtered/w86nTX6Iixo_filtered.json b/annotations_filtered/w86nTX6Iixo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60880ae2df0e1339ac4d6aa4b397cbd925cd31e1 --- /dev/null +++ b/annotations_filtered/w86nTX6Iixo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.93], [5.0, 8.61], [11.0, 30.99], [32.0, 32.97], [35.0, 34.67], [36.0, 36.63], [37.0, 37.76], [38.0, 40.26], [42.0, 42.48], [44.0, 48.47], [50.0, 49.86], [50.0, 51.38], [55.0, 56.1], [59.0, 61.94], [62.0, 63.54], [64.0, 65.2], [71.0, 81.73], [82.0, 82.56], [86.0, 86.46], [89.0, 92.08], [94.0, 98.79], [102.0, 102.76], [109.0, 110.52], [111.0, 112.19], [115.0, 116.13], [129.0, 131.62], [135.0, 135.3]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 33.14, 31.55, 0.0, 0.0, 0.0, 0.0, 82.25, 0.0, 50.71, 0.0, 0.0, 0.0, 96.89, 0.0, 0.0, 74.92, 0.0, 0.0, 31.43, 34.49, 0.0, 0.0, 0.0, 0.0, 50.66, 0.0], "audiomae_on_audioset": [null, [["speech", 43.71], ["music", 16.66], ["groan", 3.14]], [["music", 37.31], ["buzz", 14.9], ["didgeridoo", 5.3]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 49.89], ["theremin", 8.85], ["whale vocalization", 4.49]], [["music", 47.81], ["theremin", 6.43], ["crowd", 4.5]], null, null, null, null, null, null], "duration": [-0.07, 3.61, 19.99, 0.97, -0.33, 0.63, 0.76, 2.26, 0.48, 4.47, -0.14, 1.38, 1.1, 2.94, 1.54, 1.2, 10.73, 0.56, 0.46, 3.08, 4.79, 0.76, 1.52, 1.19, 1.13, 2.62, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/w8IS7igzQxw_filtered.json b/annotations_filtered/w8IS7igzQxw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3bf7958eeadab23591fc805a4c0e92de0eca9148 --- /dev/null +++ b/annotations_filtered/w8IS7igzQxw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.32], [16.0, 21.09], [23.0, 33.32], [36.0, 39.01], [50.0, 74.93], [76.0, 79.59], [85.0, 144.46], [148.0, 148.44], [150.0, 150.6], [152.0, 152.46]], "keep_status": [true, true, false, false, false, false, false, false, false, false], "silence_prob": [43.43, 39.3, 73.97, 70.44, 44.18, 37.46, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 53.85], ["throbbing", 10.13], ["hum", 5.97]], [["music", 27.74], ["hum", 22.18], ["throbbing", 14.08]], null, null, [["hum", 38.28], ["mains hum", 18.17], ["music", 15.78]], [["cattle, bovinae", 43.91], ["moo", 29.42], ["livestock, farm animals, working animals", 25.29]], null, null, null, null], "duration": [7.32, 5.09, 10.32, 3.01, 24.93, 3.59, 59.46, 0.44, 0.6, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/w8O0iiBrIzM_filtered.json b/annotations_filtered/w8O0iiBrIzM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bce0d0c727613e02b2c081af2900cca9c1a4034b --- /dev/null +++ b/annotations_filtered/w8O0iiBrIzM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.13], [13.0, 14.72]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.13, 1.72]} \ No newline at end of file diff --git a/annotations_filtered/w8mbmSijd4o_filtered.json b/annotations_filtered/w8mbmSijd4o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ba619410341bb870e6b8df835be4928a0476913 --- /dev/null +++ b/annotations_filtered/w8mbmSijd4o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.17], [24.0, 26.1], [28.0, 28.66], [29.0, 33.88], [35.0, 41.27], [44.0, 44.74], [46.0, 48.03], [49.0, 49.99], [51.0, 53.25], [57.0, 60.4], [61.0, 60.84], [63.0, 63.53], [69.0, 68.99], [72.0, 71.95], [85.0, 86.56], [89.0, 90.0], [94.0, 94.74], [101.0, 102.22], [105.0, 105.61], [107.0, 107.82], [110.0, 110.22], [111.0, 119.2], [120.0, 129.07], [131.0, 133.35], [133.0, 133.39], [136.0, 136.04], [140.0, 141.52], [145.0, 146.18], [149.0, 149.32], [151.0, 151.14], [153.0, 153.28], [154.0, 154.3], [156.0, 155.87], [157.0, 157.54], [158.0, 158.52], [162.0, 161.97], [163.0, 163.98], [165.0, 165.65], [169.0, 177.36], [179.0, 179.78], [182.0, 182.02], [183.0, 184.35]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 52.27, 0.0, 33.84, 63.31, 0.0, 65.79, 0.0, 97.83, 99.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.34, 100.0, 46.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 41.22], ["musical instrument", 15.65], ["didgeridoo", 11.8]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 51.31], ["sidetone", 22.02], ["radio", 20.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.17, 2.1, 0.66, 4.88, 6.27, 0.74, 2.03, 0.99, 2.25, 3.4, -0.16, 0.53, -0.01, -0.05, 1.56, 1.0, 0.74, 1.22, 0.61, 0.82, 0.22, 8.2, 9.07, 2.35, 0.39, 0.04, 1.52, 1.18, 0.32, 0.14, 0.28, 0.3, -0.13, 0.54, 0.52, -0.03, 0.98, 0.65, 8.36, 0.78, 0.02, 1.35]} \ No newline at end of file diff --git a/annotations_filtered/w8td2mMGYjo_filtered.json b/annotations_filtered/w8td2mMGYjo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3872b06a8961843eac7b679ea2b594c369db35c --- /dev/null +++ b/annotations_filtered/w8td2mMGYjo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 34.37], [35.0, 42.03], [44.0, 46.74], [48.0, 48.46], [52.0, 58.45], [63.0, 64.56], [65.0, 65.96], [67.0, 73.47]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [99.9, 100.0, 100.0, 0.0, 45.52, 0.0, 0.0, 64.97], "audiomae_on_audioset": [null, null, null, null, [["speech", 75.58], ["sidetone", 2.62], ["stomach rumble", 1.44]], null, null, null], "duration": [16.37, 7.03, 2.74, 0.46, 6.45, 1.56, 0.96, 6.47]} \ No newline at end of file diff --git a/annotations_filtered/w8txE148NNI_filtered.json b/annotations_filtered/w8txE148NNI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9b9ee2c39e1730acac913eee0f386c85fd5a6a8 --- /dev/null +++ b/annotations_filtered/w8txE148NNI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.92], [3.0, 3.33], [6.0, 6.44], [8.0, 9.44], [11.0, 12.97], [22.0, 22.94], [24.0, 29.57], [34.0, 36.64], [37.0, 37.32], [41.0, 40.66], [41.0, 41.71], [49.0, 50.33], [51.0, 51.97], [66.0, 66.93], [68.0, 69.77], [71.0, 71.58], [73.0, 74.34], [74.0, 74.49], [75.0, 76.1], [82.0, 84.25], [88.0, 89.38], [92.0, 93.99], [97.0, 105.0], [111.0, 111.48], [116.0, 116.83], [124.0, 125.19], [126.0, 127.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.43, 75.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.07, 0.0, 0.0, 47.74, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 72.64], ["music", 2.98], ["inside, small room", 2.86]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.78], ["speech", 19.91], ["sidetone", 7.43]], null, null, null, null], "duration": [0.92, 0.33, 0.44, 1.44, 1.97, 0.94, 5.57, 2.64, 0.32, -0.34, 0.71, 1.33, 0.97, 0.93, 1.77, 0.58, 1.34, 0.49, 1.1, 2.25, 1.38, 1.99, 8.0, 0.48, 0.83, 1.19, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/w9-IJEaGhRg_filtered.json b/annotations_filtered/w9-IJEaGhRg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e554a639bc9877fd829e810725ff84144bd5256c --- /dev/null +++ b/annotations_filtered/w9-IJEaGhRg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 27.84], [31.0, 33.0], [35.0, 34.57], [36.0, 39.58], [41.0, 42.53], [43.0, 45.05], [47.0, 47.17], [48.0, 49.4], [53.0, 54.18], [60.0, 61.06], [66.0, 67.8], [71.0, 70.97], [75.0, 77.26], [79.0, 79.71], [81.0, 81.36], [82.0, 82.95], [87.0, 87.56], [93.0, 92.79], [94.0, 95.12], [96.0, 97.09], [99.0, 105.53]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.84, 52.62, 0.0, 70.44, 0.0, 47.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.99], "audiomae_on_audioset": [[["hum", 38.49], ["mains hum", 18.31], ["speech", 18.26]], null, null, null, null, [["stomach rumble", 16.02], ["water", 11.26], ["liquid", 9.51]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [18.84, 2.0, -0.43, 3.58, 1.53, 2.05, 0.17, 1.4, 1.18, 1.06, 1.8, -0.03, 2.26, 0.71, 0.36, 0.95, 0.56, -0.21, 1.12, 1.09, 6.53]} \ No newline at end of file diff --git a/annotations_filtered/w9-ylaUijdc_filtered.json b/annotations_filtered/w9-ylaUijdc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..896ee89d3046fffcc048acd97e52058c540f1dfd --- /dev/null +++ b/annotations_filtered/w9-ylaUijdc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 27.99], [29.0, 29.91], [33.0, 36.85], [39.0, 41.45], [42.0, 44.42], [48.0, 49.94], [53.0, 56.05], [58.0, 58.13], [64.0, 64.83], [66.0, 68.69], [73.0, 73.3], [76.0, 77.75], [82.0, 82.56], [86.0, 87.57], [90.0, 90.88], [93.0, 93.82], [95.0, 95.76], [97.0, 97.75], [99.0, 98.95], [100.0, 101.11], [102.0, 102.34], [119.0, 119.03], [121.0, 121.64], [126.0, 126.79], [128.0, 128.49], [134.0, 134.77], [145.0, 146.42], [148.0, 148.56], [152.0, 152.29], [157.0, 158.97], [162.0, 162.6], [163.0, 170.43], [173.0, 173.31], [174.0, 175.07]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.94, 0.0, 59.59, 50.86, 41.76, 0.0, 90.25, 0.0, 0.0, 47.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.72, 0.0, 0.0], "audiomae_on_audioset": [[["music", 35.14], ["throbbing", 18.74], ["hum", 18.2]], null, null, null, [["speech", 15.02], ["reverberation", 8.0], ["effects unit", 5.3]], null, null, null, null, [["speech", 37.18], ["dial tone", 12.53], ["sidetone", 9.43]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 60.48], ["musical instrument", 12.0], ["didgeridoo", 5.57]], null, null], "duration": [24.99, 0.91, 3.85, 2.45, 2.42, 1.94, 3.05, 0.13, 0.83, 2.69, 0.3, 1.75, 0.56, 1.57, 0.88, 0.82, 0.76, 0.75, -0.05, 1.11, 0.34, 0.03, 0.64, 0.79, 0.49, 0.77, 1.42, 0.56, 0.29, 1.97, 0.6, 7.43, 0.31, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/w98xbfLGWro_filtered.json b/annotations_filtered/w98xbfLGWro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca8bd7c2d50591c94e56ce55cf5a87733451925b --- /dev/null +++ b/annotations_filtered/w98xbfLGWro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 21.27], [22.0, 29.19], [31.0, 31.02], [32.0, 33.4], [35.0, 35.87], [37.0, 37.71], [38.0, 38.74], [39.0, 40.29], [43.0, 43.56], [46.0, 47.49], [49.0, 51.75], [54.0, 54.75], [55.0, 56.1], [57.0, 59.29], [62.0, 65.77], [67.0, 67.8], [82.0, 83.62], [88.0, 90.64], [93.0, 93.8], [96.0, 96.38], [97.0, 98.85], [109.0, 109.49], [115.0, 117.71], [119.0, 119.67], [121.0, 124.02], [126.0, 126.45], [127.0, 127.85], [129.0, 133.54], [135.0, 136.29], [139.0, 142.77], [143.0, 144.51], [145.0, 147.18], [148.0, 150.52], [151.0, 152.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [56.48, 82.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.64, 0.0, 0.0, 99.44, 98.8, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 93.13, 0.0, 99.9, 0.0, 0.0, 100.0, 0.0, 99.05, 0.0, 99.94, 92.8, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.27, 7.19, 0.02, 1.4, 0.87, 0.71, 0.74, 1.29, 0.56, 1.49, 2.75, 0.75, 1.1, 2.29, 3.77, 0.8, 1.62, 2.64, 0.8, 0.38, 1.85, 0.49, 2.71, 0.67, 3.02, 0.45, 0.85, 4.54, 1.29, 3.77, 1.51, 2.18, 2.52, 1.59]} \ No newline at end of file diff --git a/annotations_filtered/w9I7PBSMBZw_filtered.json b/annotations_filtered/w9I7PBSMBZw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad8f98f94e73e22b6aea685827b300870b844e12 --- /dev/null +++ b/annotations_filtered/w9I7PBSMBZw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.28], [22.0, 32.41], [34.0, 34.2], [35.0, 35.38], [38.0, 38.18], [43.0, 43.29], [45.0, 45.82], [51.0, 52.39], [56.0, 61.94], [62.0, 63.59], [66.0, 100.45], [101.0, 111.15]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 42.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.44, 0.0, 0.0, 38.06], "audiomae_on_audioset": [null, [["music", 71.43], ["soundtrack music", 6.24], ["electronic music", 5.0]], null, null, null, null, null, null, [["speech", 34.19], ["music", 27.23], ["electronic music", 6.42]], null, null, [["music", 62.14], ["speech", 7.56], ["foghorn", 4.5]]], "duration": [0.28, 10.41, 0.2, 0.38, 0.18, 0.29, 0.82, 1.39, 5.94, 1.59, 34.45, 10.15]} \ No newline at end of file diff --git a/annotations_filtered/w9KBOhPXhds_filtered.json b/annotations_filtered/w9KBOhPXhds_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8346431dc4a99ba13f22b63217f9aad9336cf5e4 --- /dev/null +++ b/annotations_filtered/w9KBOhPXhds_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.66], [23.0, 24.29], [32.0, 32.29], [33.0, 35.63], [37.0, 39.29], [42.0, 43.38], [50.0, 51.76], [55.0, 57.11], [58.0, 75.44], [77.0, 79.73], [80.0, 82.04], [84.0, 86.49], [87.0, 87.84], [88.0, 89.97], [91.0, 92.4], [96.0, 96.2], [97.0, 97.63], [98.0, 109.34], [110.0, 110.61], [113.0, 113.44], [117.0, 118.1], [122.0, 126.4], [128.0, 129.36], [131.0, 132.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 89.19, 100.0, 0.0, 0.0, 99.16, 100.0, 94.66, 67.63, 46.61, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 0.0, 0.0, 0.0, 49.13, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 68.18], ["speech", 17.81], ["busy signal", 7.51]], null, null, null, null, null, null, null, null, null, [["speech", 58.01], ["sidetone", 20.28], ["fart", 8.87]], null, null], "duration": [0.66, 1.29, 0.29, 2.63, 2.29, 1.38, 1.76, 2.11, 17.44, 2.73, 2.04, 2.49, 0.84, 1.97, 1.4, 0.2, 0.63, 11.34, 0.61, 0.44, 1.1, 4.4, 1.36, 1.09]} \ No newline at end of file diff --git a/annotations_filtered/w9sO9o8LNvQ_filtered.json b/annotations_filtered/w9sO9o8LNvQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58edb48ca8a8d7afaae44c2bd6293d91197a557a --- /dev/null +++ b/annotations_filtered/w9sO9o8LNvQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 9.61], [122.0, 126.4]], "keep_status": [false, true], "silence_prob": [32.76, 30.6], "audiomae_on_audioset": [[["music", 48.92], ["throbbing", 24.54], ["hum", 9.91]], [["throbbing", 31.49], ["hum", 19.43], ["music", 11.5]]], "duration": [8.61, 4.4]} \ No newline at end of file diff --git a/annotations_filtered/wAE0vlaKvkM_filtered.json b/annotations_filtered/wAE0vlaKvkM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..373bb55a63c41525819f1d473a7e345228e75753 --- /dev/null +++ b/annotations_filtered/wAE0vlaKvkM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.07], [10.0, 14.42], [29.0, 32.37], [46.0, 47.58], [52.0, 52.78], [59.0, 59.71], [65.0, 65.18], [80.0, 82.66], [89.0, 89.94], [93.0, 94.95], [99.0, 100.47], [104.0, 104.89], [110.0, 110.4], [112.0, 113.63], [119.0, 120.09], [120.0, 122.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [80.46, 38.37, 90.78, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.53], "audiomae_on_audioset": [null, [["speech", 82.92], ["boing", 3.08], ["hum", 2.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.07, 4.42, 3.37, 1.58, 0.78, 0.71, 0.18, 2.66, 0.94, 1.95, 1.47, 0.89, 0.4, 1.63, 1.09, 2.15]} \ No newline at end of file diff --git a/annotations_filtered/wAE_PelhISM_filtered.json b/annotations_filtered/wAE_PelhISM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7542b18fffd012d12b419f87ef0072effec3183f --- /dev/null +++ b/annotations_filtered/wAE_PelhISM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.71], [9.0, 9.91], [11.0, 15.84], [19.0, 18.84], [19.0, 19.82], [20.0, 19.95], [20.0, 20.07], [20.0, 31.45], [34.0, 36.29], [38.0, 39.26], [45.0, 51.54], [52.0, 55.26], [64.0, 65.13], [66.0, 68.69], [71.0, 74.22], [83.0, 114.94], [115.0, 128.09]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, true, false, false, true, false, true], "silence_prob": [0.0, 0.0, 29.44, 0.0, 0.0, 0.0, 0.0, 28.57, 30.12, 0.0, 35.89, 29.74, 0.0, 28.94, 28.82, 0.0, 28.96], "audiomae_on_audioset": [null, null, [["speech", 56.55], ["music", 6.2], ["hum", 6.08]], null, null, null, null, [["cattle, bovinae", 37.14], ["livestock, farm animals, working animals", 34.25], ["moo", 21.1]], [["music", 18.74], ["explosion", 15.23], ["speech", 12.49]], null, [["music", 67.84], ["hum", 5.45], ["didgeridoo", 4.95]], [["speech", 28.87], ["music", 21.6], ["didgeridoo", 6.17]], null, [["livestock, farm animals, working animals", 49.89], ["moo", 18.44], ["cattle, bovinae", 17.07]], [["speech", 60.79], ["electric shaver, electric razor", 4.0], ["livestock, farm animals, working animals", 3.74]], null, [["animal", 23.28], ["music", 10.22], ["livestock, farm animals, working animals", 10.22]]], "duration": [0.71, 0.91, 4.84, -0.16, 0.82, -0.05, 0.07, 11.45, 2.29, 1.26, 6.54, 3.26, 1.13, 2.69, 3.22, 31.94, 13.09]} \ No newline at end of file diff --git a/annotations_filtered/wAJQ-yWgSJs_filtered.json b/annotations_filtered/wAJQ-yWgSJs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a890685024d9b58d9ecdf383915f7bef5b8178ca --- /dev/null +++ b/annotations_filtered/wAJQ-yWgSJs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.4], [16.0, 16.53], [19.0, 19.3], [23.0, 22.84], [24.0, 26.35], [28.0, 31.16], [34.0, 41.32], [46.0, 46.45], [51.0, 54.41], [87.0, 96.77], [97.0, 98.41], [100.0, 101.68], [109.0, 110.51], [112.0, 117.05], [119.0, 122.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 73.97, 93.76, 96.29, 0.0, 97.92, 67.13, 0.0, 0.0, 0.0, 99.98, 75.39], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.4, 0.53, 0.3, -0.16, 2.35, 3.16, 7.32, 0.45, 3.41, 9.77, 1.41, 1.68, 1.51, 5.05, 3.1]} \ No newline at end of file diff --git a/annotations_filtered/wALbxbEBLU0_filtered.json b/annotations_filtered/wALbxbEBLU0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62a2c6c808c991ee2e9c94cf80e1409b8649a106 --- /dev/null +++ b/annotations_filtered/wALbxbEBLU0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.23], [18.0, 19.28], [20.0, 21.03], [22.0, 26.22], [30.0, 32.48], [33.0, 35.63], [45.0, 48.88], [53.0, 54.72]], "keep_status": [false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 39.17, 30.5, 30.64, 40.28, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 70.0], ["electric shaver, electric razor", 4.62], ["hum", 4.13]], [["speech", 70.52], ["radio", 5.84], ["telephone", 4.93]], [["boing", 20.9], ["speech", 12.3], ["snicker", 8.87]], [["speech", 38.7], ["hum", 21.4], ["throbbing", 8.77]], null], "duration": [1.23, 1.28, 1.03, 4.22, 2.48, 2.63, 3.88, 1.72]} \ No newline at end of file diff --git a/annotations_filtered/wAZ6dSIMivk_filtered.json b/annotations_filtered/wAZ6dSIMivk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae2d1ea34b7c018f54af71b816c32d344ddc445e --- /dev/null +++ b/annotations_filtered/wAZ6dSIMivk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 13.74], [15.0, 16.41], [20.0, 20.85], [22.0, 22.71], [25.0, 25.42], [31.0, 31.72], [35.0, 35.06], [40.0, 40.91], [42.0, 43.75], [45.0, 46.9], [48.0, 48.12], [50.0, 50.63], [54.0, 54.82], [57.0, 58.48], [64.0, 64.62], [73.0, 74.7], [75.0, 77.87], [79.0, 86.75], [91.0, 104.87], [106.0, 113.86]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [40.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48, 79.59, 46.97, 44.26], "audiomae_on_audioset": [[["music", 22.22], ["cowbell", 21.95], ["livestock, farm animals, working animals", 18.46]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.15], ["theremin", 19.2], ["livestock, farm animals, working animals", 9.04]], [["cowbell", 20.7], ["livestock, farm animals, working animals", 20.39], ["insect", 13.35]]], "duration": [8.74, 1.41, 0.85, 0.71, 0.42, 0.72, 0.06, 0.91, 1.75, 1.9, 0.12, 0.63, 0.82, 1.48, 0.62, 1.7, 2.87, 7.75, 13.87, 7.86]} \ No newline at end of file diff --git a/annotations_filtered/wAadouGkwMQ_filtered.json b/annotations_filtered/wAadouGkwMQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..437a8ea6db410c230fefbd7be544e374afded149 --- /dev/null +++ b/annotations_filtered/wAadouGkwMQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 36.49], [47.0, 49.37], [55.0, 55.53], [58.0, 59.58], [61.0, 62.61], [64.0, 68.18], [69.0, 70.77], [72.0, 72.13], [72.0, 73.52], [74.0, 75.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.97, 60.32, 0.0, 0.0, 0.0, 57.09, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 75.1], ["video game music", 2.66], ["musical instrument", 2.43]], null, null, null, null, null, null, null, null, null], "duration": [10.49, 2.37, 0.53, 1.58, 1.61, 4.18, 1.77, 0.13, 1.52, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/wAjHfBk-ZeY_filtered.json b/annotations_filtered/wAjHfBk-ZeY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ccb9060dc6d152cef66c7d52a97612873ef7cb8e --- /dev/null +++ b/annotations_filtered/wAjHfBk-ZeY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.43], [6.0, 6.32], [7.0, 8.46], [9.0, 10.27], [11.0, 12.12], [13.0, 14.76], [17.0, 17.68], [19.0, 23.63], [25.0, 25.73], [28.0, 30.32], [34.0, 33.84], [36.0, 37.77], [41.0, 41.54], [42.0, 41.62], [43.0, 43.23], [45.0, 45.82], [49.0, 49.99], [52.0, 53.5], [56.0, 55.9], [58.0, 58.73], [63.0, 64.03], [66.0, 66.83], [69.0, 69.96], [80.0, 81.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.16, 0.0, 54.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.43, 0.32, 1.46, 1.27, 1.12, 1.76, 0.68, 4.63, 0.73, 2.32, -0.16, 1.77, 0.54, -0.38, 0.23, 0.82, 0.99, 1.5, -0.1, 0.73, 1.03, 0.83, 0.96, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/wAuzCjipF00_filtered.json b/annotations_filtered/wAuzCjipF00_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce1fcc5158dfb02ce6ce8c2ede5f327224b433e2 --- /dev/null +++ b/annotations_filtered/wAuzCjipF00_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 34.16], [36.0, 37.44], [39.0, 41.23], [42.0, 43.07], [44.0, 47.58], [48.0, 50.43], [51.0, 77.87], [80.0, 83.93], [84.0, 87.29], [89.0, 91.42], [94.0, 94.41], [96.0, 95.99], [101.0, 110.4], [114.0, 114.29], [116.0, 116.95], [118.0, 118.29], [121.0, 122.4], [126.0, 126.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 99.97, 99.9, 99.21, 92.64, 99.85, 100.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 1.44, 2.23, 1.07, 3.58, 2.43, 26.87, 3.93, 3.29, 2.42, 0.41, -0.01, 9.4, 0.29, 0.95, 0.29, 1.4, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/wB-4zgJ2LLs_filtered.json b/annotations_filtered/wB-4zgJ2LLs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ab6b6e1ce87c9acaf2c80b93470325f1e13859b --- /dev/null +++ b/annotations_filtered/wB-4zgJ2LLs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.46], [9.0, 9.31], [10.0, 12.77], [14.0, 15.31], [16.0, 18.35], [21.0, 23.03], [35.0, 35.92], [37.0, 38.5], [63.0, 65.26], [67.0, 68.86], [70.0, 94.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.88, 0.0, 98.73, 0.0, 98.86, 94.22, 0.0, 0.0, 88.64, 0.0, 30.58], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 59.55], ["speech", 9.95], ["boing", 2.99]]], "duration": [3.46, 0.31, 2.77, 1.31, 2.35, 2.03, 0.92, 1.5, 2.26, 1.86, 24.9]} \ No newline at end of file diff --git a/annotations_filtered/wB2w4t9dr0Y_filtered.json b/annotations_filtered/wB2w4t9dr0Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5405cf09c95a7e8dcaaa8a1550e9263b877d5875 --- /dev/null +++ b/annotations_filtered/wB2w4t9dr0Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.22]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.22]} \ No newline at end of file diff --git a/annotations_filtered/wBIVUUflNb4_filtered.json b/annotations_filtered/wBIVUUflNb4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa35e903fb50bad1193917398a4b9240a32ebb4c --- /dev/null +++ b/annotations_filtered/wBIVUUflNb4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.61], [13.0, 13.44], [14.0, 14.59], [15.0, 15.89], [17.0, 19.03], [20.0, 20.49], [23.0, 23.77], [25.0, 25.47], [33.0, 34.77], [39.0, 39.9], [60.0, 61.1], [64.0, 64.89], [77.0, 76.99], [98.0, 98.39], [120.0, 120.85], [128.0, 128.38], [142.0, 142.64], [211.0, 210.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 53.07], ["throbbing", 10.76], ["hum", 6.41]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.61, 0.44, 0.59, 0.89, 2.03, 0.49, 0.77, 0.47, 1.77, 0.9, 1.1, 0.89, -0.01, 0.39, 0.85, 0.38, 0.64, -0.14]} \ No newline at end of file diff --git a/annotations_filtered/wBM9Aa_HG8g_filtered.json b/annotations_filtered/wBM9Aa_HG8g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8502f9b2beb62829ddb88211fce67a491f2b4ac5 --- /dev/null +++ b/annotations_filtered/wBM9Aa_HG8g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.24], [11.0, 11.57], [12.0, 12.06], [19.0, 19.53], [23.0, 25.32], [28.0, 29.42], [33.0, 32.64], [39.0, 41.23], [42.0, 42.53], [44.0, 44.22], [46.0, 51.46], [53.0, 53.69], [56.0, 56.74], [60.0, 60.79], [62.0, 62.16], [71.0, 72.52], [74.0, 75.36], [76.0, 76.76], [79.0, 80.32], [82.0, 82.32], [83.0, 84.1], [86.0, 87.18], [96.0, 96.48], [98.0, 100.53], [101.0, 101.41], [103.0, 103.59], [104.0, 106.25], [108.0, 108.18], [110.0, 111.7], [112.0, 113.39], [114.0, 114.74], [115.0, 116.01], [117.0, 117.32]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.18, 0.0, 0.0, 0.0, 45.49, 0.0, 0.0, 99.95, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 26.78], ["noise", 5.39], ["crushing", 4.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.24, 0.57, 0.06, 0.53, 2.32, 1.42, -0.36, 2.23, 0.53, 0.22, 5.46, 0.69, 0.74, 0.79, 0.16, 1.52, 1.36, 0.76, 1.32, 0.32, 1.1, 1.18, 0.48, 2.53, 0.41, 0.59, 2.25, 0.18, 1.7, 1.39, 0.74, 1.01, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/wBxRwF4qnhU_filtered.json b/annotations_filtered/wBxRwF4qnhU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ef2c883ab75c85e68bce4f50b4a0aff4b1b5228 --- /dev/null +++ b/annotations_filtered/wBxRwF4qnhU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.71], [18.0, 19.57], [22.0, 22.42], [32.0, 33.64], [36.0, 36.46], [39.0, 41.18], [42.0, 43.02], [44.0, 44.0], [45.0, 73.92], [76.0, 76.52], [78.0, 79.54], [82.0, 83.07], [85.0, 85.31], [86.0, 86.0], [89.0, 89.02], [91.0, 91.5], [92.0, 93.48], [98.0, 108.77], [110.0, 110.93], [112.0, 116.23], [121.0, 121.47], [122.0, 125.2], [127.0, 127.43], [130.0, 129.74], [134.0, 136.85], [139.0, 139.35], [140.0, 140.07], [141.0, 142.92]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 40.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.5, 0.0, 32.21, 0.0, 45.33, 0.0, 0.0, 35.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 19.55], ["noise", 11.07], ["radio", 10.59]], null, null, null, null, null, null, null, null, [["speech", 81.89], ["music", 6.53], ["knock", 2.77]], null, [["knock", 27.23], ["speech", 19.62], ["beatboxing", 9.93]], null, [["speech", 14.98], ["frog", 11.91], ["telephone", 8.05]], null, null, [["speech", 70.55], ["wail, moan", 8.18], ["radio", 3.24]], null, null, null], "duration": [1.71, 1.57, 0.42, 1.64, 0.46, 2.18, 1.02, 0.0, 28.92, 0.52, 1.54, 1.07, 0.31, 0.0, 0.02, 0.5, 1.48, 10.77, 0.93, 4.23, 0.47, 3.2, 0.43, -0.26, 2.85, 0.35, 0.07, 1.92]} \ No newline at end of file diff --git a/annotations_filtered/wC4MzUvxVa0_filtered.json b/annotations_filtered/wC4MzUvxVa0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6f2213a2d90ea33346db7b34863ae0cecc02df7 --- /dev/null +++ b/annotations_filtered/wC4MzUvxVa0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.74], [8.0, 9.69], [13.0, 13.76], [26.0, 26.7], [28.0, 29.51], [32.0, 34.11], [55.0, 56.78], [59.0, 59.14], [76.0, 76.94], [81.0, 83.35]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 89.19, 0.0, 0.0, 0.0, 47.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 43.26], ["musical instrument", 13.49], ["guitar", 11.86]]], "duration": [0.74, 1.69, 0.76, 0.7, 1.51, 2.11, 1.78, 0.14, 0.94, 2.35]} \ No newline at end of file diff --git a/annotations_filtered/wCL3OtOzYuQ_filtered.json b/annotations_filtered/wCL3OtOzYuQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf55738d624c3ee48e55b01e9b652f0134fdcdde --- /dev/null +++ b/annotations_filtered/wCL3OtOzYuQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 43.28], [47.0, 47.29], [53.0, 54.94], [59.0, 63.14]], "keep_status": [true, false, false, true], "silence_prob": [35.07, 0.0, 0.0, 35.79], "audiomae_on_audioset": [[["music", 29.75], ["speech", 24.02], ["synthesizer", 6.74]], null, null, [["music", 15.63], ["fly, housefly", 13.97], ["mosquito", 10.65]]], "duration": [2.28, 0.29, 1.94, 4.14]} \ No newline at end of file diff --git a/annotations_filtered/wD8pQ5eDneo_filtered.json b/annotations_filtered/wD8pQ5eDneo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b328eee1a8094978d32443693f826cd6d9483dc9 --- /dev/null +++ b/annotations_filtered/wD8pQ5eDneo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.04], [5.0, 6.89], [9.0, 11.38], [13.0, 13.54], [17.0, 19.53], [21.0, 24.21], [26.0, 28.17], [28.0, 29.93], [30.0, 30.89], [32.0, 33.54], [34.0, 35.28], [36.0, 36.54], [37.0, 38.18], [41.0, 42.23], [44.0, 44.86], [45.0, 46.25], [48.0, 48.1], [50.0, 50.5], [51.0, 52.41], [53.0, 54.43], [58.0, 58.19], [61.0, 64.0], [65.0, 66.18], [68.0, 68.82], [70.0, 70.63], [72.0, 72.5], [74.0, 74.46], [76.0, 77.4], [85.0, 85.85], [87.0, 88.59], [92.0, 92.84], [94.0, 94.71], [96.0, 96.79], [98.0, 99.72], [104.0, 104.8], [107.0, 106.73], [108.0, 108.82], [110.0, 111.3], [114.0, 115.32], [117.0, 118.88], [121.0, 122.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 100.0, 100.0, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.04, 1.89, 2.38, 0.54, 2.53, 3.21, 2.17, 1.93, 0.89, 1.54, 1.28, 0.54, 1.18, 1.23, 0.86, 1.25, 0.1, 0.5, 1.41, 1.43, 0.19, 3.0, 1.18, 0.82, 0.63, 0.5, 0.46, 1.4, 0.85, 1.59, 0.84, 0.71, 0.79, 1.72, 0.8, -0.27, 0.82, 1.3, 1.32, 1.88, 1.2]} \ No newline at end of file diff --git a/annotations_filtered/wDFOO-dC-Nw_filtered.json b/annotations_filtered/wDFOO-dC-Nw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18c4c46c5e4ff31fba8d658a060aaf38bf7c59f0 --- /dev/null +++ b/annotations_filtered/wDFOO-dC-Nw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.14], [19.0, 22.44], [25.0, 24.95], [28.0, 36.15], [37.0, 37.89], [39.0, 41.23], [42.0, 42.9], [44.0, 44.19], [45.0, 46.09], [47.0, 51.33], [55.0, 55.49], [56.0, 56.86], [60.0, 82.68], [85.0, 86.04], [87.0, 88.43], [92.0, 93.88], [97.0, 97.36], [98.0, 98.17], [102.0, 103.92], [109.0, 120.58], [122.0, 130.64], [132.0, 142.62], [144.0, 148.19], [157.0, 161.5], [162.0, 163.78]], "keep_status": [false, false, false, true, false, true, false, false, false, true, false, false, true, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 48.56, 0.0, 31.88, 0.0, 34.85, 0.0, 0.0, 0.0, 31.07, 0.0, 0.0, 44.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.16, 44.69, 62.07, 63.64, 32.16, 0.0], "audiomae_on_audioset": [null, [["music", 65.65], ["throbbing", 6.74], ["synthesizer", 4.33]], null, [["music", 60.92], ["guitar", 2.84], ["musical instrument", 2.76]], null, [["music", 40.92], ["speech", 22.99], ["electronic music", 2.41]], null, null, null, [["music", 45.46], ["hum", 10.25], ["throbbing", 5.61]], null, null, [["fly, housefly", 26.36], ["insect", 16.01], ["hum", 11.55]], null, null, null, null, null, null, [["breaking", 50.36], ["sine wave", 8.79], ["glass", 3.41]], [["hum", 26.21], ["noise", 18.72], ["mains hum", 17.33]], null, null, [["music", 51.38], ["didgeridoo", 11.93], ["synthesizer", 7.12]], null], "duration": [0.14, 3.44, -0.05, 8.15, 0.89, 2.23, 0.9, 0.19, 1.09, 4.33, 0.49, 0.86, 22.68, 1.04, 1.43, 1.88, 0.36, 0.17, 1.92, 11.58, 8.64, 10.62, 4.19, 4.5, 1.78]} \ No newline at end of file diff --git a/annotations_filtered/wDZyu8jYw90_filtered.json b/annotations_filtered/wDZyu8jYw90_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..996c1436190ee09e1acdc5c63655190fd4d1a161 --- /dev/null +++ b/annotations_filtered/wDZyu8jYw90_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 17.49], [18.0, 19.25], [26.0, 27.62], [29.0, 30.43], [35.0, 36.31], [42.0, 42.4], [55.0, 62.95], [63.0, 65.72], [70.0, 71.0], [72.0, 72.74], [85.0, 100.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 96.17, 82.43, 0.0, 0.0, 34.14], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["thunk", 41.17], ["breaking", 15.82], ["music", 13.01]]], "duration": [6.49, 1.25, 1.62, 1.43, 1.31, 0.4, 7.95, 2.72, 1.0, 0.74, 15.89]} \ No newline at end of file diff --git a/annotations_filtered/wDsYB_uRbaE_filtered.json b/annotations_filtered/wDsYB_uRbaE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75e6e22d5ce3ead49e3052754ec34c9ce8d6a40e --- /dev/null +++ b/annotations_filtered/wDsYB_uRbaE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.47], [5.0, 8.56], [10.0, 11.89], [13.0, 16.95], [19.0, 19.68], [20.0, 21.52], [26.0, 26.65], [33.0, 34.26], [43.0, 44.17], [45.0, 46.11], [47.0, 47.43], [48.0, 48.15], [50.0, 52.88], [62.0, 64.59], [66.0, 68.55], [70.0, 70.46], [71.0, 78.71], [80.0, 80.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 86.09, 0.0, 98.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.75, 61.67, 64.52, 0.0, 47.5, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 21.47], ["hum", 17.59], ["music", 16.63]], null], "duration": [0.47, 3.56, 1.89, 3.95, 0.68, 1.52, 0.65, 1.26, 1.17, 1.11, 0.43, 0.15, 2.88, 2.59, 2.55, 0.46, 7.71, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/wEByIZn5qeU_filtered.json b/annotations_filtered/wEByIZn5qeU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..299382f4720c1a90863db1d5548e91026ba81f01 --- /dev/null +++ b/annotations_filtered/wEByIZn5qeU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.95], [11.0, 13.46], [17.0, 20.24], [21.0, 22.54], [25.0, 26.89], [27.0, 29.51], [31.0, 33.03], [53.0, 53.79], [55.0, 55.22], [58.0, 58.97], [61.0, 62.34], [63.0, 64.52], [66.0, 72.4], [75.0, 76.4], [78.0, 79.08], [81.0, 82.05]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 67.0, 40.12, 0.0, 0.0, 70.16, 42.98, 0.0, 0.0, 0.0, 0.0, 0.0, 34.21, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 19.96], ["speech", 17.15], ["goat", 7.52]], null, null, null, [["speech", 20.97], ["music", 9.57], ["musical instrument", 4.65]], null, null, null, null, null, [["music", 14.93], ["hum", 9.46], ["noise", 8.13]], null, null, null], "duration": [1.95, 2.46, 3.24, 1.54, 1.89, 2.51, 2.03, 0.79, 0.22, 0.97, 1.34, 1.52, 6.4, 1.4, 1.08, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/wEE-EVC0P8M_filtered.json b/annotations_filtered/wEE-EVC0P8M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b511a5c01b2534e22fa2e919e8c8497c654960d --- /dev/null +++ b/annotations_filtered/wEE-EVC0P8M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 14.03], [16.0, 16.16], [21.0, 21.1], [23.0, 25.96], [34.0, 34.45], [35.0, 36.12], [42.0, 44.41], [53.0, 53.7], [54.0, 54.6], [60.0, 60.99], [64.0, 68.13], [76.0, 76.05], [78.0, 83.93], [85.0, 88.55], [90.0, 93.02], [98.0, 99.0], [101.0, 100.92], [101.0, 105.9], [107.0, 111.72], [117.0, 120.46], [124.0, 123.6], [126.0, 126.89]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.72, 0.0, 0.0, 34.44, 0.0, 0.0, 41.4, 0.0, 0.0, 0.0, 35.52, 0.0, 60.05, 93.76, 93.91, 0.0, 0.0, 72.6, 62.89, 90.95, 0.0, 0.0], "audiomae_on_audioset": [[["music", 66.96], ["musical instrument", 3.06], ["rock music", 2.69]], null, null, [["music", 61.76], ["speech", 6.29], ["musical instrument", 6.17]], null, null, [["music", 51.44], ["guitar", 4.53], ["synthesizer", 4.19]], null, null, null, [["music", 56.74], ["didgeridoo", 8.33], ["speech", 6.14]], null, null, null, null, null, null, null, null, null, null, null], "duration": [9.03, 0.16, 0.1, 2.96, 0.45, 1.12, 2.41, 0.7, 0.6, 0.99, 4.13, 0.05, 5.93, 3.55, 3.02, 1.0, -0.08, 4.9, 4.72, 3.46, -0.4, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/wEPZVYQqdMY_filtered.json b/annotations_filtered/wEPZVYQqdMY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af204800bb6e4533dca9a02192109d0d5d1e98b9 --- /dev/null +++ b/annotations_filtered/wEPZVYQqdMY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.25], [6.0, 143.65], [145.0, 152.44], [153.0, 155.29], [157.0, 159.39]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 0.0, 34.02, 38.54, 68.41], "audiomae_on_audioset": [null, null, [["music", 76.19], ["synthesizer", 4.28], ["hum", 2.75]], [["speech", 17.29], ["boing", 8.3], ["music", 5.17]], null], "duration": [1.25, 137.65, 7.44, 2.29, 2.39]} \ No newline at end of file diff --git a/annotations_filtered/wEUwtFg7PeI_filtered.json b/annotations_filtered/wEUwtFg7PeI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f0436dae9bea59e7f572e95ed06358cc7951529 --- /dev/null +++ b/annotations_filtered/wEUwtFg7PeI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 70.97], [78.0, 91.45], [94.0, 117.41], [119.0, 136.43]], "keep_status": [false, true, true, true], "silence_prob": [0.0, 30.99, 30.12, 30.69], "audiomae_on_audioset": [null, [["speech", 27.03], ["music", 16.68], ["vehicle", 6.29]], [["music", 29.66], ["speech", 24.04], ["vehicle", 3.82]], [["music", 31.27], ["hum", 7.03], ["speech", 5.62]]], "duration": [51.97, 13.45, 23.41, 17.43]} \ No newline at end of file diff --git a/annotations_filtered/wEnaRGQc8Ls_filtered.json b/annotations_filtered/wEnaRGQc8Ls_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4ab6a9a19c2ce24d5bee75abb965b5b3ede83d2 --- /dev/null +++ b/annotations_filtered/wEnaRGQc8Ls_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 20.87], [21.0, 22.05], [23.0, 29.32], [31.0, 36.17], [36.0, 44.63], [46.0, 51.49], [60.0, 60.15], [63.0, 64.39], [66.0, 67.36], [70.0, 74.76], [78.0, 81.82], [84.0, 84.3], [92.0, 92.13], [97.0, 96.94], [98.0, 100.99], [103.0, 103.65], [105.0, 106.27], [107.0, 111.6], [115.0, 117.68], [119.0, 122.89], [124.0, 129.22]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [73.82, 0.0, 94.81, 97.33, 47.01, 58.05, 0.0, 0.0, 0.0, 49.87, 51.02, 0.0, 0.0, 0.0, 34.57, 0.0, 0.0, 39.38, 53.78, 60.6, 69.88], "audiomae_on_audioset": [null, null, null, null, [["speech", 20.35], ["music", 18.34], ["fly, housefly", 11.52]], null, null, null, null, [["speech", 25.31], ["music", 19.89], ["hum", 10.86]], null, null, null, null, [["foghorn", 38.88], ["music", 21.86], ["speech", 11.03]], null, null, [["foghorn", 32.55], ["music", 20.62], ["speech", 8.98]], null, null, null], "duration": [9.87, 1.05, 6.32, 5.17, 8.63, 5.49, 0.15, 1.39, 1.36, 4.76, 3.82, 0.3, 0.13, -0.06, 2.99, 0.65, 1.27, 4.6, 2.68, 3.89, 5.22]} \ No newline at end of file diff --git a/annotations_filtered/wEvSZB_Dhqc_filtered.json b/annotations_filtered/wEvSZB_Dhqc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2226672dcee08d27b94c1ee94fef5230d1adf1ee --- /dev/null +++ b/annotations_filtered/wEvSZB_Dhqc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.96], [18.0, 19.35], [22.0, 24.66], [28.0, 33.94], [34.0, 34.13], [36.0, 44.46], [49.0, 49.92], [55.0, 60.0], [71.0, 83.89], [89.0, 103.01], [106.0, 106.96], [113.0, 119.28], [139.0, 149.54], [151.0, 151.44], [156.0, 156.29], [157.0, 158.89], [165.0, 174.12], [178.0, 178.83], [181.0, 199.39], [200.0, 203.81], [205.0, 206.47], [213.0, 224.01]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, true], "silence_prob": [32.74, 0.0, 32.8, 32.34, 0.0, 30.84, 0.0, 31.15, 31.36, 31.36, 0.0, 31.69, 31.28, 0.0, 0.0, 0.0, 30.38, 0.0, 31.63, 56.4, 0.0, 41.46], "audiomae_on_audioset": [[["music", 36.49], ["hum", 15.96], ["throbbing", 11.78]], null, [["music", 39.11], ["speech", 12.65], ["throbbing", 8.88]], [["music", 58.28], ["sidetone", 15.6], ["boing", 3.78]], null, [["music", 42.28], ["throbbing", 16.54], ["hum", 12.51]], null, [["speech", 50.79], ["music", 34.93], ["boing", 2.88]], [["music", 57.16], ["speech", 15.12], ["electronic music", 3.38]], [["music", 75.99], ["speech", 2.84], ["boing", 2.6]], null, [["throbbing", 24.61], ["music", 24.21], ["hum", 9.99]], [["music", 34.09], ["speech", 28.14], ["sidetone", 9.46]], null, null, null, [["speech", 51.0], ["music", 27.01], ["electronic music", 2.01]], null, [["music", 49.25], ["didgeridoo", 8.71], ["livestock, farm animals, working animals", 4.44]], null, null, [["sidetone", 27.38], ["fly, housefly", 16.61], ["speech", 12.94]]], "duration": [3.96, 1.35, 2.66, 5.94, 0.13, 8.46, 0.92, 5.0, 12.89, 14.01, 0.96, 6.28, 10.54, 0.44, 0.29, 1.89, 9.12, 0.83, 18.39, 3.81, 1.47, 11.01]} \ No newline at end of file diff --git a/annotations_filtered/wEzZX_MFu4w_filtered.json b/annotations_filtered/wEzZX_MFu4w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1beb1229a4fe217dc33947c526d8eac5d7cea49c --- /dev/null +++ b/annotations_filtered/wEzZX_MFu4w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.88], [10.0, 16.21], [25.0, 29.78], [30.0, 31.11], [34.0, 33.66], [34.0, 34.2], [35.0, 36.53], [39.0, 39.99], [66.0, 66.8], [67.0, 68.52], [69.0, 70.23], [72.0, 73.75]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [30.03, 30.34, 34.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 46.47], ["speech", 28.7], ["boing", 3.01]], [["music", 74.44], ["musical instrument", 7.02], ["plucked string instrument", 2.47]], [["speech", 30.1], ["music", 9.15], ["musical instrument", 6.96]], null, null, null, null, null, null, null, null, null], "duration": [3.88, 6.21, 4.78, 1.11, -0.34, 0.2, 1.53, 0.99, 0.8, 1.52, 1.23, 1.75]} \ No newline at end of file diff --git a/annotations_filtered/wF6xVdnFJho_filtered.json b/annotations_filtered/wF6xVdnFJho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25dc9f06fc53d0800aaba2c500e225583c774561 --- /dev/null +++ b/annotations_filtered/wF6xVdnFJho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 21.15], [22.0, 54.87], [56.0, 56.93], [58.0, 58.51], [61.0, 61.94], [68.0, 71.98], [73.0, 79.49], [84.0, 84.97], [86.0, 89.16], [93.0, 95.69], [105.0, 109.12], [111.0, 113.58], [116.0, 118.81], [119.0, 124.23], [125.0, 131.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [29.81, 0.0, 0.0, 0.0, 0.0, 99.56, 97.43, 0.0, 99.71, 99.95, 99.85, 57.56, 56.18, 40.92, 39.21], "audiomae_on_audioset": [[["music", 56.93], ["theremin", 8.41], ["synthesizer", 8.11]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.51], ["musical instrument", 6.93], ["effects unit", 5.3]], [["throbbing", 18.94], ["music", 17.24], ["echo", 15.94]]], "duration": [12.15, 32.87, 0.93, 0.51, 0.94, 3.98, 6.49, 0.97, 3.16, 2.69, 4.12, 2.58, 2.81, 5.23, 6.01]} \ No newline at end of file diff --git a/annotations_filtered/wFSWmfqMp7o_filtered.json b/annotations_filtered/wFSWmfqMp7o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f47dbc4d517aa3d9fe83323df0e9215e91f5133 --- /dev/null +++ b/annotations_filtered/wFSWmfqMp7o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.71], [2.0, 9.66], [25.0, 35.38], [40.0, 40.71], [44.0, 49.0], [56.0, 60.69], [79.0, 84.77], [89.0, 98.71], [102.0, 104.19], [109.0, 119.5]], "keep_status": [false, true, true, false, false, false, false, true, true, true], "silence_prob": [0.0, 36.89, 33.75, 0.0, 36.79, 34.77, 33.81, 32.01, 32.66, 32.23], "audiomae_on_audioset": [null, [["theremin", 12.11], ["music", 12.1], ["hum", 7.58]], [["speech", 35.01], ["throbbing", 13.12], ["hum", 10.92]], null, [["speech", 60.24], ["music", 7.88], ["moo", 2.16]], [["speech", 61.46], ["radio", 7.04], ["music", 3.09]], [["cattle, bovinae", 35.36], ["moo", 34.81], ["livestock, farm animals, working animals", 21.34]], [["vehicle", 21.09], ["cacophony", 5.52], ["frog", 5.31]], [["speech", 39.77], ["crowd", 8.52], ["fly, housefly", 6.86]], [["speech", 11.71], ["sheep", 10.79], ["buzz", 9.86]]], "duration": [-0.29, 7.66, 10.38, 0.71, 5.0, 4.69, 5.77, 9.71, 2.19, 10.5]} \ No newline at end of file diff --git a/annotations_filtered/wF_UpYqYJuY_filtered.json b/annotations_filtered/wF_UpYqYJuY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..69bacbbb525e49e5a2a1c8a57cddba876609968d --- /dev/null +++ b/annotations_filtered/wF_UpYqYJuY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 13.14], [14.0, 14.61], [17.0, 17.59], [22.0, 23.23], [25.0, 26.69], [30.0, 31.56], [35.0, 37.08], [39.0, 79.2]], "keep_status": [true, false, false, false, false, false, true, false], "silence_prob": [37.63, 0.0, 0.0, 0.0, 0.0, 0.0, 49.04, 0.0], "audiomae_on_audioset": [[["music", 26.5], ["hum", 9.95], ["sine wave", 9.12]], null, null, null, null, null, [["music", 46.18], ["hum", 6.0], ["synthesizer", 3.74]], null], "duration": [9.14, 0.61, 0.59, 1.23, 1.69, 1.56, 2.08, 40.2]} \ No newline at end of file diff --git a/annotations_filtered/wFg1qWPryvI_filtered.json b/annotations_filtered/wFg1qWPryvI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c25abf5add042d033b6ce4f9fe09ead85f175bb9 --- /dev/null +++ b/annotations_filtered/wFg1qWPryvI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.47], [24.0, 24.71], [26.0, 28.43], [30.0, 35.36], [37.0, 38.6], [39.0, 40.69], [43.0, 46.45], [48.0, 49.1], [52.0, 52.64], [56.0, 55.81], [57.0, 58.43], [60.0, 61.13], [63.0, 64.23], [66.0, 67.09], [73.0, 77.03], [78.0, 79.02], [80.0, 80.59], [84.0, 84.86], [88.0, 89.09], [91.0, 93.56], [94.0, 97.85], [99.0, 103.0], [112.0, 112.26], [113.0, 113.68], [117.0, 134.22], [135.0, 141.22], [145.0, 154.52], [155.0, 154.57], [155.0, 155.61], [158.0, 159.43], [160.0, 161.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 69.07, 45.59, 0.0, 0.0, 69.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.31, 0.0, 0.0, 0.0, 0.0, 35.47, 40.14, 39.55, 0.0, 0.0, 44.55, 33.25, 35.71, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["whale vocalization", 51.71], ["speech", 25.98], ["music", 11.6]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.84], ["music", 10.27], ["hum", 10.01]], [["music", 35.06], ["rumble", 12.48], ["speech", 6.48]], [["music", 47.02], ["speech", 30.98], ["hum", 5.61]], null, null, [["music", 51.32], ["throbbing", 18.55], ["hum", 9.78]], [["hum", 45.53], ["throbbing", 18.8], ["mains hum", 17.16]], [["hum", 51.04], ["throbbing", 19.36], ["mains hum", 19.13]], null, null, null, null], "duration": [1.47, 0.71, 2.43, 5.36, 1.6, 1.69, 3.45, 1.1, 0.64, -0.19, 1.43, 1.13, 1.23, 1.09, 4.03, 1.02, 0.59, 0.86, 1.09, 2.56, 3.85, 4.0, 0.26, 0.68, 17.22, 6.22, 9.52, -0.43, 0.61, 1.43, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/wG5Lt-pineg_filtered.json b/annotations_filtered/wG5Lt-pineg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..794732f3d0c2ca3b3afb8cdf63285e28d968ad37 --- /dev/null +++ b/annotations_filtered/wG5Lt-pineg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 24.21], [24.0, 24.95], [27.0, 32.78], [35.0, 43.51]], "keep_status": [false, false, true, true], "silence_prob": [31.13, 0.0, 33.84, 28.7], "audiomae_on_audioset": [[["speech", 50.8], ["music", 29.97], ["didgeridoo", 1.67]], null, [["music", 54.72], ["hum", 5.97], ["didgeridoo", 4.76]], [["mosquito", 27.42], ["fly, housefly", 24.86], ["music", 14.43]]], "duration": [9.21, 0.95, 5.78, 8.51]} \ No newline at end of file diff --git a/annotations_filtered/wG6wio8azyE_filtered.json b/annotations_filtered/wG6wio8azyE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e44e654fd7b7e09fe529a2cd48aeda5ece29a047 --- /dev/null +++ b/annotations_filtered/wG6wio8azyE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.55], [14.0, 15.42], [19.0, 20.63], [25.0, 28.61], [34.0, 36.41], [40.0, 41.84], [45.0, 54.38], [55.0, 55.85], [56.0, 57.84], [60.0, 60.13], [61.0, 64.18], [65.0, 66.55], [68.0, 68.07], [70.0, 70.17], [72.0, 71.71], [75.0, 76.23], [77.0, 77.99], [79.0, 79.74], [82.0, 82.46], [83.0, 83.98]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 53.72, 42.33, 0.0, 69.07, 0.0, 0.0, 0.0, 51.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 40.47], ["didgeridoo", 7.02], ["theremin", 6.63]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.55, 1.42, 1.63, 3.61, 2.41, 1.84, 9.38, 0.85, 1.84, 0.13, 3.18, 1.55, 0.07, 0.17, -0.29, 1.23, 0.99, 0.74, 0.46, 0.98]} \ No newline at end of file diff --git a/annotations_filtered/wGvGiFhbmwg_filtered.json b/annotations_filtered/wGvGiFhbmwg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/wGvGiFhbmwg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/wH-i4ImreXs_filtered.json b/annotations_filtered/wH-i4ImreXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1456753ff89aad89f71702d71e471965ed7077e3 --- /dev/null +++ b/annotations_filtered/wH-i4ImreXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.0], [3.0, 3.59], [5.0, 5.88], [7.0, 8.33], [10.0, 10.96], [12.0, 12.39], [15.0, 15.3], [20.0, 22.06], [23.0, 23.41], [25.0, 25.54], [26.0, 26.43], [28.0, 29.73], [30.0, 32.7], [34.0, 34.69], [36.0, 36.32], [38.0, 38.92], [41.0, 42.36], [44.0, 44.17], [45.0, 45.44], [46.0, 47.73], [48.0, 49.59], [51.0, 51.34], [53.0, 58.95], [59.0, 59.93], [63.0, 64.32], [65.0, 65.01], [66.0, 68.27], [70.0, 70.63], [73.0, 74.09], [75.0, 75.66], [78.0, 78.04], [79.0, 80.25], [82.0, 82.11], [83.0, 83.98], [85.0, 85.83], [87.0, 90.95], [92.0, 93.51], [94.0, 95.4], [96.0, 100.11], [102.0, 106.02], [106.0, 114.35], [116.0, 115.94], [117.0, 117.86], [119.0, 119.94], [121.0, 121.9], [123.0, 127.06], [127.0, 128.6], [129.0, 131.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 66.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.31, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 99.62, 76.04, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 57.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 0.59, 0.88, 1.33, 0.96, 0.39, 0.3, 2.06, 0.41, 0.54, 0.43, 1.73, 2.7, 0.69, 0.32, 0.92, 1.36, 0.17, 0.44, 1.73, 1.59, 0.34, 5.95, 0.93, 1.32, 0.01, 2.27, 0.63, 1.09, 0.66, 0.04, 1.25, 0.11, 0.98, 0.83, 3.95, 1.51, 1.4, 4.11, 4.02, 8.35, -0.06, 0.86, 0.94, 0.9, 4.06, 1.6, 2.85]} \ No newline at end of file diff --git a/annotations_filtered/wHSH-NpCQOw_filtered.json b/annotations_filtered/wHSH-NpCQOw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..685bc1a44c20536d9fb278bddbc4e9c6df6dcf0b --- /dev/null +++ b/annotations_filtered/wHSH-NpCQOw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.62], [5.0, 7.6], [9.0, 9.78], [13.0, 13.91], [17.0, 17.49], [19.0, 22.13], [22.0, 23.19], [28.0, 29.07], [31.0, 31.51], [34.0, 34.59], [39.0, 39.02], [46.0, 47.21], [49.0, 51.43], [52.0, 54.31], [56.0, 59.46], [60.0, 63.75], [69.0, 72.44], [77.0, 78.17], [90.0, 90.09], [98.0, 98.66], [100.0, 104.77], [106.0, 108.82], [110.0, 111.62], [112.0, 116.7], [118.0, 119.97], [122.0, 122.47], [124.0, 127.33]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [99.56, 61.67, 0.0, 0.0, 0.0, 41.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.59, 96.89, 90.78, 86.27, 62.17, 0.0, 0.0, 0.0, 97.43, 95.37, 0.0, 49.78, 0.0, 0.0, 83.88], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 34.15], ["speech", 14.51], ["sidetone", 13.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 47.59], ["hum", 11.29], ["telephone", 11.03]], null, null, null], "duration": [2.62, 2.6, 0.78, 0.91, 0.49, 3.13, 1.19, 1.07, 0.51, 0.59, 0.02, 1.21, 2.43, 2.31, 3.46, 3.75, 3.44, 1.17, 0.09, 0.66, 4.77, 2.82, 1.62, 4.7, 1.97, 0.47, 3.33]} \ No newline at end of file diff --git a/annotations_filtered/wHfXZ9jcX3A_filtered.json b/annotations_filtered/wHfXZ9jcX3A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6729513a8811c77ea6cbf5e7fa4129306fa57de5 --- /dev/null +++ b/annotations_filtered/wHfXZ9jcX3A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.68], [15.0, 22.38], [23.0, 30.4], [33.0, 46.35], [47.0, 54.3], [58.0, 58.5], [60.0, 64.94], [66.0, 66.61], [74.0, 75.69], [79.0, 79.32], [81.0, 81.65], [83.0, 97.38], [100.0, 102.63], [105.0, 112.9], [114.0, 134.81], [136.0, 136.05], [138.0, 138.96], [141.0, 144.29], [145.0, 147.63], [149.0, 160.27], [161.0, 161.57], [162.0, 163.71]], "keep_status": [true, true, false, true, false, false, false, false, false, false, false, false, true, true, true, false, false, true, true, false, false, false], "silence_prob": [29.37, 29.57, 29.65, 29.93, 30.02, 0.0, 30.37, 0.0, 0.0, 0.0, 0.0, 31.66, 30.4, 30.4, 30.75, 0.0, 0.0, 30.01, 31.03, 29.77, 0.0, 0.0], "audiomae_on_audioset": [[["music", 46.14], ["noise", 10.04], ["hum", 6.99]], [["speech", 31.35], ["explosion", 12.62], ["music", 9.22]], [["speech", 52.73], ["vehicle", 19.48], ["car", 12.76]], [["speech", 30.87], ["music", 30.85], ["vehicle", 7.04]], [["throbbing", 61.18], ["music", 22.91], ["hum", 8.33]], null, [["music", 79.47], ["throbbing", 3.35], ["hum", 2.46]], null, null, null, null, [["music", 42.47], ["speech", 24.34], ["hum", 12.6]], [["race car, auto racing", 20.08], ["vehicle", 18.43], ["skidding", 16.75]], [["music", 24.85], ["mains hum", 21.96], ["hum", 17.03]], [["music", 51.91], ["car", 7.65], ["vehicle", 4.52]], null, null, [["music", 39.49], ["hum", 13.18], ["cacophony", 9.7]], [["mains hum", 16.53], ["buzz", 15.82], ["hum", 12.49]], [["throbbing", 32.46], ["hum", 26.05], ["mains hum", 17.07]], null, null], "duration": [3.68, 7.38, 7.4, 13.35, 7.3, 0.5, 4.94, 0.61, 1.69, 0.32, 0.65, 14.38, 2.63, 7.9, 20.81, 0.05, 0.96, 3.29, 2.63, 11.27, 0.57, 1.71]} \ No newline at end of file diff --git a/annotations_filtered/wHqQzF4JXdE_filtered.json b/annotations_filtered/wHqQzF4JXdE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b12f3b83cc04554bedaf8bf49f572957e0d61d21 --- /dev/null +++ b/annotations_filtered/wHqQzF4JXdE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 44.27], [46.0, 121.29], [125.0, 125.81], [127.0, 128.38], [129.0, 130.37], [133.0, 133.54], [139.0, 139.6], [141.0, 142.06], [149.0, 150.09], [152.0, 152.46], [155.0, 156.36], [157.0, 162.14], [172.0, 173.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.83, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 51.63], ["music", 13.75], ["whale vocalization", 9.55]], null], "duration": [38.27, 75.29, 0.81, 1.38, 1.37, 0.54, 0.6, 1.06, 1.09, 0.46, 1.36, 5.14, 1.65]} \ No newline at end of file diff --git a/annotations_filtered/wI1LRBDvSFs_filtered.json b/annotations_filtered/wI1LRBDvSFs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eba56edeee4b59447ddbeb6f31ee2ca8045725ab --- /dev/null +++ b/annotations_filtered/wI1LRBDvSFs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 32.12], [38.0, 38.53], [44.0, 44.44], [46.0, 46.47], [59.0, 59.1], [60.0, 60.89], [64.0, 65.25], [67.0, 68.84], [70.0, 70.02], [71.0, 71.46], [75.0, 76.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [51.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [6.12, 0.53, 0.44, 0.47, 0.1, 0.89, 1.25, 1.84, 0.02, 0.46, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/wICMOVrSal0_filtered.json b/annotations_filtered/wICMOVrSal0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2322737bbce0d94bb0230488ed4f0a91fba2b60c --- /dev/null +++ b/annotations_filtered/wICMOVrSal0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 15.47], [24.0, 24.98], [26.0, 27.36], [29.0, 29.84], [36.0, 38.1], [50.0, 52.46], [57.0, 61.67], [67.0, 67.8], [68.0, 71.09], [84.0, 84.54], [88.0, 89.06], [90.0, 91.03], [108.0, 116.06], [123.0, 123.16], [126.0, 126.79]], "keep_status": [false, false, false, false, true, true, true, false, false, false, false, false, true, false, false], "silence_prob": [55.96, 0.0, 0.0, 0.0, 45.88, 42.22, 35.16, 0.0, 35.23, 0.0, 0.0, 0.0, 38.71, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["hum", 17.09], ["music", 12.0], ["throbbing", 11.26]], [["clang", 9.61], ["ding", 8.73], ["domestic animals, pets", 8.14]], [["speech", 41.16], ["music", 6.6], ["fly, housefly", 5.58]], null, [["fly, housefly", 43.2], ["insect", 21.3], ["mosquito", 15.09]], null, null, null, [["speech", 44.88], ["buzz", 9.96], ["throbbing", 3.97]], null, null], "duration": [4.47, 0.98, 1.36, 0.84, 2.1, 2.46, 4.67, 0.8, 3.09, 0.54, 1.06, 1.03, 8.06, 0.16, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/wIb3cRvQYw8_filtered.json b/annotations_filtered/wIb3cRvQYw8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e5a992fddadc0a4b3152ddd5697c07f5b8abb52 --- /dev/null +++ b/annotations_filtered/wIb3cRvQYw8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.32], [27.0, 26.84], [35.0, 35.4], [60.0, 60.69], [62.0, 61.77], [77.0, 77.9], [80.0, 79.88], [91.0, 91.02], [93.0, 93.12], [94.0, 95.32], [118.0, 118.45], [140.0, 140.54], [149.0, 148.86], [166.0, 166.38], [170.0, 171.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.32, -0.16, 0.4, 0.69, -0.23, 0.9, -0.12, 0.02, 0.12, 1.32, 0.45, 0.54, -0.14, 0.38, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/wIloYFMzS6M_filtered.json b/annotations_filtered/wIloYFMzS6M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e34a5f5749884102f1d155d77da4aeec3934a295 --- /dev/null +++ b/annotations_filtered/wIloYFMzS6M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[77.0, 104.13], [106.0, 106.74], [108.0, 108.62], [110.0, 110.54], [112.0, 111.94], [112.0, 117.41], [119.0, 118.96], [120.0, 122.08], [126.0, 127.9], [128.0, 129.64], [130.0, 145.29], [146.0, 162.36], [165.0, 173.1], [174.0, 174.23], [174.0, 180.76], [187.0, 187.57], [192.0, 193.68], [195.0, 196.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [90.25, 0.0, 0.0, 0.0, 0.0, 61.67, 0.0, 100.0, 0.0, 0.0, 99.71, 97.0, 66.27, 0.0, 44.09, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 67.46], ["telephone", 7.73], ["music", 5.9]], null, null, null], "duration": [27.13, 0.74, 0.62, 0.54, -0.06, 5.41, -0.04, 2.08, 1.9, 1.64, 15.29, 16.36, 8.1, 0.23, 6.76, 0.57, 1.68, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/wIqMqkMIjEE_filtered.json b/annotations_filtered/wIqMqkMIjEE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f446954cf698af360e425041658b6b53ffd9032d --- /dev/null +++ b/annotations_filtered/wIqMqkMIjEE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.58], [8.0, 14.52], [16.0, 16.41], [18.0, 18.94], [24.0, 35.53], [45.0, 45.15], [45.0, 52.88], [54.0, 56.22], [57.0, 62.04], [63.0, 66.88], [68.0, 69.7], [71.0, 73.63], [75.0, 85.97], [88.0, 90.64], [98.0, 99.2], [100.0, 114.24]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 70.02, 0.0, 0.0, 42.39, 0.0, 52.56, 67.0, 63.1, 62.37, 0.0, 72.75, 48.27, 54.63, 0.0, 48.14], "audiomae_on_audioset": [null, null, null, null, [["music", 22.73], ["breaking", 19.31], ["hum", 8.97]], null, null, null, null, null, null, null, [["music", 71.4], ["didgeridoo", 11.46], ["musical instrument", 3.56]], null, null, [["music", 72.34], ["didgeridoo", 17.27], ["throbbing", 1.28]]], "duration": [0.58, 6.52, 0.41, 0.94, 11.53, 0.15, 7.88, 2.22, 5.04, 3.88, 1.7, 2.63, 10.97, 2.64, 1.2, 14.24]} \ No newline at end of file diff --git a/annotations_filtered/wIrUoTYd9hA_filtered.json b/annotations_filtered/wIrUoTYd9hA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..268c24dbb90799b777e66a76d3dea7636d46afa4 --- /dev/null +++ b/annotations_filtered/wIrUoTYd9hA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 42.16], [43.0, 44.83], [46.0, 45.99], [46.0, 46.04], [46.0, 46.74], [54.0, 54.67], [56.0, 57.32], [58.0, 59.21], [62.0, 62.28], [68.0, 69.06], [72.0, 72.06], [74.0, 74.53], [77.0, 77.3], [80.0, 80.99], [83.0, 84.77], [86.0, 87.08], [89.0, 91.93], [94.0, 95.35], [96.0, 98.1], [100.0, 100.97], [102.0, 102.39], [103.0, 104.73], [108.0, 107.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [36.16, 1.83, -0.01, 0.04, 0.74, 0.67, 1.32, 1.21, 0.28, 1.06, 0.06, 0.53, 0.3, 0.99, 1.77, 1.08, 2.93, 1.35, 2.1, 0.97, 0.39, 1.73, -0.43]} \ No newline at end of file diff --git a/annotations_filtered/wJCqOhdzatA_filtered.json b/annotations_filtered/wJCqOhdzatA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ff60a2b58d40d82aab79895b33016f2981d6d4c --- /dev/null +++ b/annotations_filtered/wJCqOhdzatA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.69], [17.0, 17.19], [21.0, 22.55], [25.0, 25.24], [26.0, 30.23], [32.0, 33.99], [37.0, 37.57], [42.0, 43.43], [44.0, 44.54], [45.0, 45.91], [48.0, 48.34], [51.0, 53.64], [55.0, 59.39], [60.0, 61.35], [63.0, 67.29], [68.0, 74.68], [77.0, 78.02], [80.0, 80.62], [82.0, 83.27], [84.0, 84.79], [87.0, 88.28], [90.0, 90.26], [95.0, 97.53], [101.0, 101.06], [122.0, 122.54], [124.0, 124.58], [126.0, 127.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 44.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.86, 78.72, 0.0, 93.29, 41.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.98, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 40.12], ["speech", 37.13], ["radio", 10.67]], null, null, null, null, null, null, [["speech", 54.83], ["sine wave", 11.97], ["chirp tone", 11.5]], null, null, null, [["speech", 49.6], ["fart", 25.82], ["stomach rumble", 5.58]], null, null, null, null, null, null, [["speech", 57.94], ["dial tone", 17.14], ["busy signal", 6.57]], null, null, null, null], "duration": [1.69, 0.19, 1.55, 0.24, 4.23, 1.99, 0.57, 1.43, 0.54, 0.91, 0.34, 2.64, 4.39, 1.35, 4.29, 6.68, 1.02, 0.62, 1.27, 0.79, 1.28, 0.26, 2.53, 0.06, 0.54, 0.58, 1.82]} \ No newline at end of file diff --git a/annotations_filtered/wJJ2RLLVzcU_filtered.json b/annotations_filtered/wJJ2RLLVzcU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ddf08ff2431258aaafff1e38a036719acde92c0 --- /dev/null +++ b/annotations_filtered/wJJ2RLLVzcU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.89], [25.0, 25.69], [29.0, 29.15], [44.0, 44.88], [46.0, 46.14], [48.0, 52.89], [54.0, 53.74], [60.0, 60.24], [63.0, 62.7], [63.0, 63.39], [64.0, 64.57], [65.0, 66.43], [69.0, 69.26], [71.0, 71.93], [75.0, 74.83], [79.0, 79.41], [81.0, 81.7], [85.0, 86.39], [87.0, 92.26], [94.0, 94.66], [100.0, 99.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 53.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 0.69, 0.15, 0.88, 0.14, 4.89, -0.26, 0.24, -0.3, 0.39, 0.57, 1.43, 0.26, 0.93, -0.17, 0.41, 0.7, 1.39, 5.26, 0.66, -0.04]} \ No newline at end of file diff --git a/annotations_filtered/wJJDM675Ypw_filtered.json b/annotations_filtered/wJJDM675Ypw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d93e98991cd87653ca4a7bb5c7b5f804be08123 --- /dev/null +++ b/annotations_filtered/wJJDM675Ypw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 56.42], [59.0, 78.06], [79.0, 85.08], [87.0, 87.42], [91.0, 93.43], [94.0, 99.54], [104.0, 111.55], [117.0, 118.99]], "keep_status": [false, false, false, false, false, true, false, false], "silence_prob": [0.0, 39.28, 54.43, 0.0, 98.36, 33.81, 57.25, 0.0], "audiomae_on_audioset": [null, [["throbbing", 38.91], ["hum", 37.04], ["mains hum", 7.01]], null, null, null, [["animal", 23.53], ["whale vocalization", 10.31], ["cattle, bovinae", 6.07]], null, null], "duration": [30.42, 19.06, 6.08, 0.42, 2.43, 5.54, 7.55, 1.99]} \ No newline at end of file diff --git a/annotations_filtered/wJZHc5SJ9eE_filtered.json b/annotations_filtered/wJZHc5SJ9eE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8fc5506e25f5f0af7102c2e78318bcdf46cf29d --- /dev/null +++ b/annotations_filtered/wJZHc5SJ9eE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.79], [7.0, 22.84], [25.0, 39.51], [44.0, 95.12], [99.0, 111.84], [112.0, 114.76]], "keep_status": [false, true, true, false, true, false], "silence_prob": [0.0, 33.03, 31.9, 0.0, 31.22, 31.86], "audiomae_on_audioset": [null, [["music", 42.98], ["fly, housefly", 9.7], ["mosquito", 8.58]], [["speech", 61.77], ["vehicle", 3.7], ["outside, rural or natural", 3.46]], null, [["music", 50.92], ["whip", 3.8], ["speech", 3.24]], [["cattle, bovinae", 49.24], ["moo", 19.93], ["livestock, farm animals, working animals", 16.04]]], "duration": [-0.21, 15.84, 14.51, 51.12, 12.84, 2.76]} \ No newline at end of file diff --git a/annotations_filtered/wJZP20y0R2Q_filtered.json b/annotations_filtered/wJZP20y0R2Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f19d24ba92b686cc0ea4f4cf7bde600c615e86f8 --- /dev/null +++ b/annotations_filtered/wJZP20y0R2Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.34], [27.0, 29.49], [34.0, 44.73], [48.0, 63.78], [70.0, 70.75], [72.0, 72.2], [74.0, 74.04], [85.0, 85.7], [86.0, 91.66], [92.0, 108.9], [109.0, 109.68], [111.0, 111.52], [112.0, 114.15], [119.0, 119.77], [120.0, 136.24], [146.0, 146.58], [151.0, 151.75]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 39.78, 33.03, 31.65, 0.0, 0.0, 0.0, 0.0, 94.07, 33.64, 0.0, 0.0, 31.3, 0.0, 31.16, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 30.41], ["hum", 10.86], ["speech", 10.42]], [["music", 81.59], ["speech", 3.47], ["radio", 1.32]], [["music", 62.58], ["speech", 16.87], ["buzz", 1.59]], null, null, null, null, null, [["music", 72.15], ["synthesizer", 8.22], ["electronic music", 2.69]], null, null, [["music", 62.77], ["didgeridoo", 3.23], ["electronic music", 2.09]], null, [["music", 76.44], ["didgeridoo", 4.15], ["musical instrument", 1.57]], null, null], "duration": [0.34, 2.49, 10.73, 15.78, 0.75, 0.2, 0.04, 0.7, 5.66, 16.9, 0.68, 0.52, 2.15, 0.77, 16.24, 0.58, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/wJmIEj-uVYk_filtered.json b/annotations_filtered/wJmIEj-uVYk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..306cf1138feebc983913fcb831727c11b241c747 --- /dev/null +++ b/annotations_filtered/wJmIEj-uVYk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.13], [9.0, 9.39], [12.0, 15.28], [16.0, 16.73], [37.0, 37.77], [43.0, 43.66], [59.0, 60.18], [62.0, 62.5], [68.0, 67.76], [70.0, 71.73], [73.0, 73.77], [82.0, 82.7], [91.0, 92.21], [94.0, 94.02], [96.0, 96.04], [97.0, 97.19], [99.0, 99.45], [106.0, 105.73], [106.0, 106.78], [112.0, 112.97], [114.0, 114.22], [121.0, 121.41], [136.0, 136.93], [138.0, 139.28], [141.0, 141.17], [147.0, 148.0], [156.0, 155.93], [157.0, 157.54], [158.0, 159.36], [164.0, 165.5], [167.0, 169.91], [172.0, 172.49], [174.0, 175.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 32.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.26, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["dishes, pots, and pans", 34.27], ["speech", 31.59], ["cutlery, silverware", 14.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["squish", 21.99], ["drip", 15.11], ["hum", 12.24]], null, null], "duration": [0.13, 0.39, 3.28, 0.73, 0.77, 0.66, 1.18, 0.5, -0.24, 1.73, 0.77, 0.7, 1.21, 0.02, 0.04, 0.19, 0.45, -0.27, 0.78, 0.97, 0.22, 0.41, 0.93, 1.28, 0.17, 1.0, -0.07, 0.54, 1.36, 1.5, 2.91, 0.49, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/wJnVVC4784c_filtered.json b/annotations_filtered/wJnVVC4784c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..899db6267d5a3acb4111ebcaae181d638292dbbb --- /dev/null +++ b/annotations_filtered/wJnVVC4784c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.38], [24.0, 24.66], [25.0, 31.45], [38.0, 39.31], [40.0, 42.67], [53.0, 54.63], [57.0, 58.55]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.91, 0.0, 31.32, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 39.72], ["speech", 35.55], ["throbbing", 3.44]], null, [["music", 58.41], ["hum", 8.43], ["throbbing", 6.25]], null, null], "duration": [1.38, 0.66, 6.45, 1.31, 2.67, 1.63, 1.55]} \ No newline at end of file diff --git a/annotations_filtered/wKIL7__ybL0_filtered.json b/annotations_filtered/wKIL7__ybL0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58e3537e7b4dbadca8498e0f4df64b2d65c16940 --- /dev/null +++ b/annotations_filtered/wKIL7__ybL0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.17], [7.0, 8.46], [11.0, 13.26], [16.0, 22.06], [25.0, 43.78], [45.0, 45.17], [47.0, 51.97], [55.0, 58.41], [63.0, 63.88], [65.0, 78.06], [79.0, 109.61], [111.0, 126.45]], "keep_status": [false, false, true, true, true, false, true, true, false, true, false, false], "silence_prob": [37.81, 0.0, 31.63, 30.46, 31.99, 0.0, 31.08, 45.95, 0.0, 31.03, 0.0, 31.17], "audiomae_on_audioset": [[["music", 64.41], ["musical instrument", 3.66], ["guitar", 3.08]], null, [["music", 14.19], ["boing", 10.56], ["hum", 5.91]], [["music", 24.25], ["throbbing", 9.58], ["hum", 7.8]], [["music", 34.4], ["speech", 8.53], ["fart", 3.74]], null, [["music", 49.7], ["speech", 12.24], ["didgeridoo", 7.44]], [["cattle, bovinae", 22.41], ["music", 15.5], ["livestock, farm animals, working animals", 13.76]], null, [["music", 32.37], ["speech", 12.87], ["fart", 3.13]], null, [["music", 72.58], ["didgeridoo", 6.1], ["synthesizer", 4.85]]], "duration": [2.17, 1.46, 2.26, 6.06, 18.78, 0.17, 4.97, 3.41, 0.88, 13.06, 30.61, 15.45]} \ No newline at end of file diff --git a/annotations_filtered/wKPbi9oL5xU_filtered.json b/annotations_filtered/wKPbi9oL5xU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6207bb143f97d60aea408e4e26324abe218c0ecb --- /dev/null +++ b/annotations_filtered/wKPbi9oL5xU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.27], [25.0, 25.71], [28.0, 30.21], [31.0, 32.58], [36.0, 36.39], [37.0, 39.06], [40.0, 40.76], [42.0, 43.78], [45.0, 45.77], [47.0, 49.69], [51.0, 53.08], [54.0, 67.04], [67.0, 67.1], [68.0, 84.74], [85.0, 135.84], [137.0, 137.12], [137.0, 139.78], [140.0, 152.1], [153.0, 154.9], [155.0, 160.05], [160.0, 166.5], [168.0, 169.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 98.36, 0.0, 0.0, 99.8, 0.0, 0.0, 0.0, 64.97, 100.0, 100.0, 0.0, 99.05, 0.0, 0.0, 91.81, 78.89, 0.0, 99.96, 77.2, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.27, 0.71, 2.21, 1.58, 0.39, 2.06, 0.76, 1.78, 0.77, 2.69, 2.08, 13.04, 0.1, 16.74, 50.84, 0.12, 2.78, 12.1, 1.9, 5.05, 6.5, 1.74]} \ No newline at end of file diff --git a/annotations_filtered/wKiW5OYjels_filtered.json b/annotations_filtered/wKiW5OYjels_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..327e00660f70a55abfb32584788b1a647ff6e93a --- /dev/null +++ b/annotations_filtered/wKiW5OYjels_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.3], [3.0, 6.94], [8.0, 8.34], [11.0, 12.24], [27.0, 27.13], [34.0, 35.28], [36.0, 36.37], [44.0, 57.96], [60.0, 61.06], [62.0, 63.12], [65.0, 71.68], [72.0, 72.79], [75.0, 76.01], [80.0, 82.8], [92.0, 92.99], [94.0, 97.5], [98.0, 100.41], [101.0, 102.83], [105.0, 107.23], [108.0, 108.97], [110.0, 111.3], [112.0, 113.68], [120.0, 120.56], [125.0, 128.21]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.66, 42.65, 0.0, 0.0, 0.0, 0.0, 0.0, 34.6, 0.0, 0.0, 97.54, 0.0, 0.0, 95.23, 0.0, 99.71, 96.29, 0.0, 88.28, 0.0, 0.0, 0.0, 0.0, 77.7], "audiomae_on_audioset": [[["music", 29.66], ["speech", 15.65], ["cattle, bovinae", 8.63]], [["mains hum", 33.28], ["hum", 14.74], ["electric shaver, electric razor", 11.28]], null, null, null, null, null, [["music", 72.44], ["electronic music", 6.86], ["throbbing", 2.44]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.3, 3.94, 0.34, 1.24, 0.13, 1.28, 0.37, 13.96, 1.06, 1.12, 6.68, 0.79, 1.01, 2.8, 0.99, 3.5, 2.41, 1.83, 2.23, 0.97, 1.3, 1.68, 0.56, 3.21]} \ No newline at end of file diff --git a/annotations_filtered/wLGpzRMJsVE_filtered.json b/annotations_filtered/wLGpzRMJsVE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a50a57f094954ca21a98c1b22a67cb534482a16d --- /dev/null +++ b/annotations_filtered/wLGpzRMJsVE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.78], [7.0, 8.45], [12.0, 12.55], [15.0, 14.77], [17.0, 17.46], [20.0, 21.19], [26.0, 27.21], [27.0, 29.3], [33.0, 48.27], [49.0, 49.25], [52.0, 52.74], [53.0, 86.88], [89.0, 96.89], [98.0, 124.19], [139.0, 139.68]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.07, 29.5, 0.0, 0.0, 0.0, 28.48, 28.4, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["frog", 23.07], ["hum", 21.37], ["rumble", 8.97]], [["mains hum", 42.1], ["hum", 29.08], ["throbbing", 10.04]], null, null, null, [["speech", 35.91], ["music", 22.13], ["whale vocalization", 5.07]], [["music", 61.66], ["didgeridoo", 20.08], ["synthesizer", 4.25]], null], "duration": [0.78, 1.45, 0.55, -0.23, 0.46, 1.19, 1.21, 2.3, 15.27, 0.25, 0.74, 33.88, 7.89, 26.19, 0.68]} \ No newline at end of file diff --git a/annotations_filtered/wLuRwDl3MrE_filtered.json b/annotations_filtered/wLuRwDl3MrE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e891d406794db68f990a612cdc38fef14c43417 --- /dev/null +++ b/annotations_filtered/wLuRwDl3MrE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.24], [8.0, 9.07], [11.0, 12.01], [15.0, 15.67], [19.0, 20.75], [29.0, 33.76], [39.0, 39.01], [48.0, 48.02], [52.0, 55.56], [60.0, 60.84], [71.0, 72.82], [84.0, 85.48], [94.0, 94.0], [99.0, 99.23], [114.0, 116.14], [122.0, 122.64], [131.0, 131.14], [140.0, 141.37], [150.0, 150.31], [159.0, 159.53], [165.0, 165.3], [167.0, 167.26]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 46.43, 0.0, 0.0, 31.62, 0.0, 0.0, 0.0, 0.0, 0.0, 40.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 32.03], ["music", 22.81], ["throbbing", 10.69]], null, null, [["music", 41.85], ["hum", 16.17], ["mains hum", 7.32]], null, null, null, null, null, [["music", 29.57], ["marimba, xylophone", 10.65], ["musical instrument", 9.34]], null, null, null, null, null, null, null], "duration": [0.24, 1.07, 1.01, 0.67, 1.75, 4.76, 0.01, 0.02, 3.56, 0.84, 1.82, 1.48, 0.0, 0.23, 2.14, 0.64, 0.14, 1.37, 0.31, 0.53, 0.3, 0.26]} \ No newline at end of file diff --git a/annotations_filtered/wM2NQimHkTY_filtered.json b/annotations_filtered/wM2NQimHkTY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d6cd5ea94a294c8027dd195b4706ebce57a9b20 --- /dev/null +++ b/annotations_filtered/wM2NQimHkTY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.57], [5.0, 5.76], [7.0, 7.21], [12.0, 11.89], [17.0, 17.52], [18.0, 17.93], [18.0, 18.57], [22.0, 22.27], [23.0, 25.39], [27.0, 27.11], [29.0, 29.37], [32.0, 33.29], [37.0, 37.49], [40.0, 40.49], [41.0, 41.39], [42.0, 43.68], [44.0, 44.73], [48.0, 48.49], [59.0, 59.04], [60.0, 61.57], [67.0, 68.69], [70.0, 70.56], [73.0, 76.44], [77.0, 77.58], [81.0, 81.18], [85.0, 85.48], [88.0, 88.8], [90.0, 92.31], [93.0, 95.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.86, 0.0, 0.0, 0.0, 0.0, 47.39, 99.96], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["baby laughter", 33.43], ["speech", 28.01], ["laughter", 18.86]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 74.98], ["inside, small room", 1.99], ["stomach rumble", 1.49]], null, null, null, null, [["speech", 53.24], ["inside, small room", 4.58], ["boiling", 1.7]], null], "duration": [0.57, 0.76, 0.21, -0.11, 0.52, -0.07, 0.57, 0.27, 2.39, 0.11, 0.37, 1.29, 0.49, 0.49, 0.39, 1.68, 0.73, 0.49, 0.04, 1.57, 1.69, 0.56, 3.44, 0.58, 0.18, 0.48, 0.8, 2.31, 2.5]} \ No newline at end of file diff --git a/annotations_filtered/wM5rRXQZvjU_filtered.json b/annotations_filtered/wM5rRXQZvjU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..170014aa540a244fad8715c14ebfc08fd8b7416d --- /dev/null +++ b/annotations_filtered/wM5rRXQZvjU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 31.4], [37.0, 37.5], [39.0, 41.77], [46.0, 46.65], [49.0, 49.87], [52.0, 55.93], [58.0, 58.02], [60.0, 61.96], [63.0, 66.21], [70.0, 70.26], [77.0, 116.99], [117.0, 128.66]], "keep_status": [true, false, false, false, false, true, false, false, true, false, false, true], "silence_prob": [29.98, 0.0, 55.04, 0.0, 0.0, 42.65, 0.0, 0.0, 30.59, 0.0, 0.0, 31.12], "audiomae_on_audioset": [[["music", 35.79], ["fly, housefly", 13.21], ["speech", 10.76]], null, null, null, null, [["music", 27.98], ["speech", 11.06], ["hum", 9.42]], null, null, [["music", 43.66], ["hum", 8.15], ["throbbing", 5.6]], null, null, [["noise", 40.21], ["music", 11.62], ["sound effect", 4.93]]], "duration": [12.4, 0.5, 2.77, 0.65, 0.87, 3.93, 0.02, 1.96, 3.21, 0.26, 39.99, 11.66]} \ No newline at end of file diff --git a/annotations_filtered/wMZ5UJRpxfk_filtered.json b/annotations_filtered/wMZ5UJRpxfk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfc2895f4b42b8c44523fafbd6dd1aed9dd51c8c --- /dev/null +++ b/annotations_filtered/wMZ5UJRpxfk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 30.92], [35.0, 39.75], [40.0, 40.63], [43.0, 44.63], [52.0, 58.9], [61.0, 62.75], [67.0, 68.37], [69.0, 79.3], [81.0, 80.77], [83.0, 85.83]], "keep_status": [true, true, false, false, false, false, false, true, false, false], "silence_prob": [32.15, 43.98, 0.0, 0.0, 53.34, 0.0, 0.0, 32.54, 0.0, 34.18], "audiomae_on_audioset": [[["music", 22.62], ["mains hum", 6.87], ["speech", 6.78]], [["speech", 26.66], ["cattle, bovinae", 18.37], ["moo", 17.76]], null, null, null, null, null, [["music", 29.04], ["speech", 25.13], ["buzz", 5.31]], null, [["hum", 34.07], ["music", 33.26], ["mains hum", 14.01]]], "duration": [24.92, 4.75, 0.63, 1.63, 6.9, 1.75, 1.37, 10.3, -0.23, 2.83]} \ No newline at end of file diff --git a/annotations_filtered/wMgKj3QGv2o_filtered.json b/annotations_filtered/wMgKj3QGv2o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0af31238f3e72510487bf39eeede44ddd9ea5c2c --- /dev/null +++ b/annotations_filtered/wMgKj3QGv2o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.86], [8.0, 37.39], [42.0, 62.13], [66.0, 76.6], [82.0, 82.11], [82.0, 83.13], [85.0, 87.83], [89.0, 108.67], [111.0, 111.87], [113.0, 154.47], [155.0, 155.92], [161.0, 162.08], [171.0, 170.82], [172.0, 174.87]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 30.83, 30.75, 30.31, 0.0, 0.0, 30.34, 30.22, 0.0, 0.0, 0.0, 0.0, 0.0, 31.85], "audiomae_on_audioset": [null, [["music", 73.5], ["didgeridoo", 3.62], ["quack", 2.71]], [["music", 68.23], ["speech", 10.91], ["synthesizer", 3.84]], [["music", 73.41], ["speech", 9.5], ["didgeridoo", 2.41]], null, null, [["music", 16.02], ["fly, housefly", 11.94], ["whack, thwack", 11.44]], [["music", 56.95], ["didgeridoo", 6.8], ["speech", 6.27]], null, null, null, null, null, [["speech", 49.52], ["vehicle", 12.38], ["engine", 5.29]]], "duration": [0.86, 29.39, 20.13, 10.6, 0.11, 1.13, 2.83, 19.67, 0.87, 41.47, 0.92, 1.08, -0.18, 2.87]} \ No newline at end of file diff --git a/annotations_filtered/wMr2d10-xf0_filtered.json b/annotations_filtered/wMr2d10-xf0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1cdcfd8eea68ae665709000c297a1de80317a1af --- /dev/null +++ b/annotations_filtered/wMr2d10-xf0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.23], [10.0, 21.27], [30.0, 33.52], [35.0, 34.97], [36.0, 36.9], [40.0, 41.5], [43.0, 47.07], [49.0, 49.54], [51.0, 52.62], [54.0, 54.19], [56.0, 61.62], [63.0, 69.2], [77.0, 79.3], [86.0, 86.8], [91.0, 105.97], [111.0, 117.36], [122.0, 125.04], [136.0, 138.57], [142.0, 142.52], [144.0, 151.97]], "keep_status": [true, false, true, false, false, false, true, false, false, false, true, true, true, false, false, true, true, true, false, false], "silence_prob": [29.08, 28.76, 28.97, 0.0, 0.0, 0.0, 29.65, 0.0, 0.0, 0.0, 30.11, 29.73, 29.83, 0.0, 28.89, 29.28, 29.56, 33.19, 0.0, 28.78], "audiomae_on_audioset": [[["music", 29.03], ["speech", 22.34], ["foghorn", 17.3]], [["music", 30.35], ["speech", 29.47], ["throbbing", 19.12]], [["music", 27.72], ["speech", 6.06], ["musical instrument", 5.31]], null, null, null, [["music", 43.15], ["didgeridoo", 10.15], ["cattle, bovinae", 3.85]], null, null, null, [["music", 41.58], ["livestock, farm animals, working animals", 6.8], ["moo", 6.18]], [["speech", 37.87], ["hum", 10.3], ["music", 10.25]], [["music", 44.31], ["speech", 18.01], ["boing", 7.53]], null, [["music", 60.52], ["speech", 10.51], ["animal", 4.56]], [["music", 52.19], ["throbbing", 7.69], ["hum", 3.52]], [["speech", 31.37], ["music", 21.72], ["vehicle", 8.18]], [["grunt", 27.98], ["music", 21.58], ["speech", 6.67]], null, [["music", 63.17], ["speech", 11.32], ["didgeridoo", 7.61]]], "duration": [5.23, 11.27, 3.52, -0.03, 0.9, 1.5, 4.07, 0.54, 1.62, 0.19, 5.62, 6.2, 2.3, 0.8, 14.97, 6.36, 3.04, 2.57, 0.52, 7.97]} \ No newline at end of file diff --git a/annotations_filtered/wMvTR012Dmg_filtered.json b/annotations_filtered/wMvTR012Dmg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d370c538a133758759fca355644e258fea1642b --- /dev/null +++ b/annotations_filtered/wMvTR012Dmg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.55], [8.0, 59.81], [62.0, 106.12]], "keep_status": [false, false, false], "silence_prob": [77.7, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [2.55, 51.81, 44.12]} \ No newline at end of file diff --git a/annotations_filtered/wN1iAzPTBbM_filtered.json b/annotations_filtered/wN1iAzPTBbM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae52102a4c3b25baa7bfe0a30d7b8681f265a159 --- /dev/null +++ b/annotations_filtered/wN1iAzPTBbM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.12], [15.0, 14.88], [18.0, 19.75], [23.0, 23.3], [38.0, 38.33], [42.0, 42.42], [44.0, 45.13], [46.0, 47.39], [48.0, 47.7], [52.0, 53.05], [54.0, 54.95], [79.0, 79.86], [88.0, 88.06]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 24.62], ["grunt", 10.55], ["boing", 5.78]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.12, -0.12, 1.75, 0.3, 0.33, 0.42, 1.13, 1.39, -0.3, 1.05, 0.95, 0.86, 0.06]} \ No newline at end of file diff --git a/annotations_filtered/wNRvgeiaVXA_filtered.json b/annotations_filtered/wNRvgeiaVXA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0ca16dc580679ffa77c9723f9a111f79f87c35d --- /dev/null +++ b/annotations_filtered/wNRvgeiaVXA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.77], [14.0, 15.4], [25.0, 25.51], [26.0, 25.88], [33.0, 34.26], [48.0, 48.17], [49.0, 49.59], [54.0, 54.9], [55.0, 57.06], [61.0, 63.02], [80.0, 80.97], [93.0, 93.41], [97.0, 98.64], [111.0, 112.77], [131.0, 134.01], [136.0, 143.24]], "keep_status": [true, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false], "silence_prob": [32.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.37, 44.6, 0.0, 0.0, 0.0, 0.0, 30.97, 31.05], "audiomae_on_audioset": [[["music", 41.93], ["speech", 5.82], ["musical instrument", 4.6]], null, null, null, null, null, null, null, [["music", 21.35], ["speech", 17.57], ["synthesizer", 11.26]], [["music", 41.06], ["musical instrument", 9.74], ["effects unit", 7.65]], null, null, null, null, [["music", 47.48], ["speech", 6.93], ["yodeling", 4.81]], [["moo", 35.84], ["cattle, bovinae", 31.35], ["livestock, farm animals, working animals", 15.37]]], "duration": [3.77, 1.4, 0.51, -0.12, 1.26, 0.17, 0.59, 0.9, 2.06, 2.02, 0.97, 0.41, 1.64, 1.77, 3.01, 7.24]} \ No newline at end of file diff --git a/annotations_filtered/wNWaYfZI3Ak_filtered.json b/annotations_filtered/wNWaYfZI3Ak_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82d36e485e0e3f922a5c3fe1cff90bc5c9c23dd5 --- /dev/null +++ b/annotations_filtered/wNWaYfZI3Ak_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 22.52], [23.0, 33.39], [34.0, 35.9], [38.0, 65.94]], "keep_status": [false, false, false, false], "silence_prob": [59.96, 33.94, 0.0, 37.77], "audiomae_on_audioset": [null, [["music", 61.49], ["whale vocalization", 6.56], ["sound effect", 4.15]], null, [["music", 78.22], ["ambient music", 6.18], ["electronic music", 2.52]]], "duration": [20.52, 10.39, 1.9, 27.94]} \ No newline at end of file diff --git a/annotations_filtered/wNWy3YmM3Kw_filtered.json b/annotations_filtered/wNWy3YmM3Kw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b58722310dde81901e4f59ecb66b989df0209f6 --- /dev/null +++ b/annotations_filtered/wNWy3YmM3Kw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 29.13], [41.0, 40.9], [43.0, 56.91], [61.0, 71.44], [85.0, 85.31], [86.0, 86.17], [86.0, 86.22], [86.0, 87.05], [88.0, 88.79], [92.0, 97.5], [98.0, 98.83], [99.0, 99.79], [100.0, 99.91], [100.0, 99.99], [100.0, 104.14], [111.0, 111.74], [115.0, 117.24], [123.0, 123.72]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [34.88, 0.0, 67.76, 53.16, 0.0, 0.0, 0.0, 0.0, 0.0, 45.69, 0.0, 0.0, 0.0, 0.0, 42.35, 0.0, 33.63, 0.0], "audiomae_on_audioset": [[["music", 51.45], ["didgeridoo", 13.44], ["musical instrument", 6.62]], null, null, null, null, null, null, null, null, [["beatboxing", 16.11], ["whale vocalization", 9.93], ["didgeridoo", 8.68]], null, null, null, null, [["snicker", 51.55], ["chuckle, chortle", 15.35], ["laughter", 10.18]], null, [["whale vocalization", 18.81], ["animal", 16.9], ["speech", 10.02]], null], "duration": [28.13, -0.1, 13.91, 10.44, 0.31, 0.17, 0.22, 1.05, 0.79, 5.5, 0.83, 0.79, -0.09, -0.01, 4.14, 0.74, 2.24, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/wNbKp6IGhrc_filtered.json b/annotations_filtered/wNbKp6IGhrc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0816ed8a18ed525b6d2083c1e081f1cb887da2b2 --- /dev/null +++ b/annotations_filtered/wNbKp6IGhrc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.44], [3.0, 4.68], [12.0, 11.94], [14.0, 14.96], [17.0, 17.36], [19.0, 22.69], [26.0, 28.48], [29.0, 31.33], [34.0, 35.5], [36.0, 37.15], [37.0, 39.18], [39.0, 41.35], [49.0, 50.23], [52.0, 54.33], [56.0, 57.25], [64.0, 63.76], [66.0, 68.49], [70.0, 89.72], [91.0, 94.12], [96.0, 99.28], [100.0, 107.81], [109.0, 112.92], [115.0, 117.44], [126.0, 127.62], [128.0, 134.69], [136.0, 141.66], [145.0, 146.4], [148.0, 160.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [51.71, 0.0, 0.0, 0.0, 0.0, 99.99, 97.92, 99.9, 0.0, 0.0, 32.78, 36.65, 0.0, 99.94, 0.0, 0.0, 79.07, 99.91, 99.96, 53.16, 55.81, 99.96, 52.92, 0.0, 98.44, 73.21, 0.0, 99.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["bow-wow", 30.59], ["bark", 18.82], ["animal", 9.09]], [["sine wave", 28.02], ["sidetone", 25.43], ["speech", 14.91]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.44, 1.68, -0.06, 0.96, 0.36, 3.69, 2.48, 2.33, 1.5, 1.15, 2.18, 2.35, 1.23, 2.33, 1.25, -0.24, 2.49, 19.72, 3.12, 3.28, 7.81, 3.92, 2.44, 1.62, 6.69, 5.66, 1.4, 12.19]} \ No newline at end of file diff --git a/annotations_filtered/wNibi-NWW4o_filtered.json b/annotations_filtered/wNibi-NWW4o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8eacea5eb2225e64e8211e4d1078efa1e872c709 --- /dev/null +++ b/annotations_filtered/wNibi-NWW4o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.5], [17.0, 17.46], [19.0, 19.84], [21.0, 21.09], [24.0, 24.7], [33.0, 33.27], [36.0, 36.27], [37.0, 46.01], [51.0, 51.92], [53.0, 68.4], [69.0, 90.58], [94.0, 107.55], [109.0, 110.1], [113.0, 114.83], [116.0, 117.19], [119.0, 130.1], [131.0, 132.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.7, 0.0, 60.32, 94.37, 43.93, 0.0, 0.0, 0.0, 69.61, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 59.88], ["didgeridoo", 12.14], ["speech", 3.01]], null, null, null, null, null], "duration": [1.5, 0.46, 0.84, 0.09, 0.7, 0.27, 0.27, 9.01, 0.92, 15.4, 21.58, 13.55, 1.1, 1.83, 1.19, 11.1, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/wNqqn5NPJ8k_filtered.json b/annotations_filtered/wNqqn5NPJ8k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f0dbfe2e28b1f6140daa3e336d3867eb1ae49ea --- /dev/null +++ b/annotations_filtered/wNqqn5NPJ8k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.38], [7.0, 7.53], [8.0, 11.1], [14.0, 15.09], [19.0, 21.27], [24.0, 32.75], [34.0, 35.51], [39.0, 38.7], [39.0, 44.02]], "keep_status": [false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 53.72, 0.0, 39.6, 35.33, 0.0, 0.0, 45.85], "audiomae_on_audioset": [null, null, null, null, [["burping, eructation", 49.16], ["music", 24.91], ["grunt", 4.41]], [["speech", 62.49], ["music", 21.21], ["burping, eructation", 7.26]], null, null, [["speech", 17.63], ["music", 5.7], ["snicker", 5.03]]], "duration": [0.38, 0.53, 3.1, 1.09, 2.27, 8.75, 1.51, -0.3, 5.02]} \ No newline at end of file diff --git a/annotations_filtered/wO1s5eRplKs_filtered.json b/annotations_filtered/wO1s5eRplKs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..501c8344e3800b3d1b88883518c5e7688e5c6e63 --- /dev/null +++ b/annotations_filtered/wO1s5eRplKs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.51], [3.0, 5.29], [6.0, 8.29], [9.0, 11.48], [13.0, 25.78], [26.0, 56.0], [56.0, 56.81], [58.0, 70.97], [74.0, 88.03], [90.0, 90.53]], "keep_status": [false, false, true, true, false, true, false, true, true, false], "silence_prob": [0.0, 78.38, 39.22, 32.34, 36.25, 35.49, 0.0, 33.78, 30.44, 0.0], "audiomae_on_audioset": [null, null, [["music", 52.9], ["musical instrument", 7.48], ["theremin", 7.07]], [["music", 43.81], ["clarinet", 9.73], ["musical instrument", 8.45]], [["music", 38.93], ["theremin", 26.26], ["singing bowl", 8.39]], [["music", 45.01], ["speech", 19.65], ["musical instrument", 3.8]], null, [["whack, thwack", 26.45], ["basketball bounce", 9.87], ["speech", 6.68]], [["fart", 33.8], ["didgeridoo", 22.11], ["cacophony", 8.75]], null], "duration": [1.51, 2.29, 2.29, 2.48, 12.78, 30.0, 0.81, 12.97, 14.03, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/wO4P6Yz_LZg_filtered.json b/annotations_filtered/wO4P6Yz_LZg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..556c902b86c918b6a1171e584b001a952c6a08c8 --- /dev/null +++ b/annotations_filtered/wO4P6Yz_LZg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 26.96], [29.0, 34.16], [38.0, 64.77], [76.0, 78.11], [79.0, 79.64], [81.0, 104.68], [107.0, 123.01], [123.0, 147.21], [148.0, 149.18], [150.0, 153.32]], "keep_status": [false, false, true, false, false, false, true, true, false, true], "silence_prob": [66.39, 31.65, 28.99, 55.11, 0.0, 30.16, 42.81, 42.84, 0.0, 41.42], "audiomae_on_audioset": [null, [["music", 51.25], ["noise", 15.05], ["musical instrument", 6.8]], [["throbbing", 26.75], ["music", 26.42], ["hum", 11.97]], null, null, [["hum", 46.0], ["throbbing", 24.67], ["mains hum", 16.24]], [["hum", 28.6], ["whack, thwack", 12.21], ["music", 7.84]], [["chime", 23.45], ["wind chime", 20.64], ["music", 15.31]], null, [["music", 45.51], ["rumble", 8.19], ["hum", 4.63]]], "duration": [11.96, 5.16, 26.77, 2.11, 0.64, 23.68, 16.01, 24.21, 1.18, 3.32]} \ No newline at end of file diff --git a/annotations_filtered/wOSP7YOuOH4_filtered.json b/annotations_filtered/wOSP7YOuOH4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2382a606099af23f0e073b32ca4f119847793088 --- /dev/null +++ b/annotations_filtered/wOSP7YOuOH4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.18], [0.0, 0.33], [17.0, 18.4], [22.0, 22.84], [31.0, 31.97], [33.0, 33.89], [36.0, 36.44], [44.0, 44.88], [46.0, 47.29], [53.0, 55.05], [56.0, 56.51], [60.0, 60.4], [61.0, 61.64], [64.0, 63.56], [69.0, 70.5], [71.0, 72.66], [73.0, 75.27], [78.0, 78.07], [79.0, 79.74], [82.0, 82.12], [85.0, 87.4], [91.0, 98.2], [103.0, 102.83]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.42, 0.0, 0.0, 0.0, 39.64, 40.79, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 46.27], ["didgeridoo", 9.72], ["guitar", 7.32]], null, null, null, null, null, null, [["music", 88.25], ["musical instrument", 2.67], ["guitar", 0.8]], null, null, null, [["music", 73.37], ["musical instrument", 4.11], ["guitar", 2.61]], [["music", 69.08], ["boing", 3.08], ["music for children", 2.73]], null], "duration": [0.18, 0.33, 1.4, 0.84, 0.97, 0.89, 0.44, 0.88, 1.29, 2.05, 0.51, 0.4, 0.64, -0.44, 1.5, 1.66, 2.27, 0.07, 0.74, 0.12, 2.4, 7.2, -0.17]} \ No newline at end of file diff --git a/annotations_filtered/wOp2t0IKnUo_filtered.json b/annotations_filtered/wOp2t0IKnUo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e7b2cb0bea2b68662da7b88be09e327ae0fca42 --- /dev/null +++ b/annotations_filtered/wOp2t0IKnUo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.64], [4.0, 4.73], [6.0, 6.22], [8.0, 11.82], [15.0, 14.66], [23.0, 23.62], [26.0, 26.45], [28.0, 29.64], [35.0, 42.74], [44.0, 85.8], [88.0, 87.67], [89.0, 94.64]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.49, 0.0, 0.0, 0.0, 0.0, 32.61, 0.0, 0.0, 34.66], "audiomae_on_audioset": [null, null, null, [["music", 26.05], ["speech", 14.88], ["radio", 6.08]], null, null, null, null, [["music", 28.98], ["speech", 22.05], ["sidetone", 8.57]], null, null, [["insect", 39.31], ["fly, housefly", 35.47], ["mosquito", 7.47]]], "duration": [1.64, 0.73, 0.22, 3.82, -0.34, 0.62, 0.45, 1.64, 7.74, 41.8, -0.33, 5.64]} \ No newline at end of file diff --git a/annotations_filtered/wOuk6V3Dj5A_filtered.json b/annotations_filtered/wOuk6V3Dj5A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b43881801ca70ad9f4b3abd0d663d14080085b91 --- /dev/null +++ b/annotations_filtered/wOuk6V3Dj5A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[122.0, 124.01], [128.0, 127.95]], "keep_status": [true, false], "silence_prob": [46.4, 0.0], "audiomae_on_audioset": [[["frog", 18.15], ["crow", 16.06], ["caw", 14.63]], null], "duration": [2.01, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/wOzRG7N8_Ic_filtered.json b/annotations_filtered/wOzRG7N8_Ic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f47a3d515d489b8a09a7357f1f70c19ed3c0369 --- /dev/null +++ b/annotations_filtered/wOzRG7N8_Ic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.13], [5.0, 5.73], [8.0, 8.63], [11.0, 11.13], [11.0, 11.96], [13.0, 13.41], [15.0, 14.88], [16.0, 16.21], [17.0, 17.42], [20.0, 20.83], [21.0, 23.85], [24.0, 24.95], [27.0, 27.99], [32.0, 33.42], [34.0, 34.91], [36.0, 36.95], [39.0, 39.06], [40.0, 41.94], [43.0, 43.17], [44.0, 43.92], [45.0, 45.79], [47.0, 47.48], [49.0, 49.01], [51.0, 53.91], [55.0, 56.34], [58.0, 64.86], [66.0, 66.5], [67.0, 68.08], [70.0, 76.84], [78.0, 80.13], [81.0, 82.7], [85.0, 85.53], [86.0, 86.8], [89.0, 89.4], [90.0, 90.66], [91.0, 93.16], [94.0, 96.15], [97.0, 97.48], [98.0, 98.25], [99.0, 100.9], [102.0, 104.57], [109.0, 111.23], [113.0, 113.51], [114.0, 114.35], [117.0, 117.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.39, 100.0, 0.0, 0.0, 0.0, 64.75, 76.04, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.13, 0.73, 0.63, 0.13, 0.96, 0.41, -0.12, 0.21, 0.42, 0.83, 2.85, 0.95, 0.99, 1.42, 0.91, 0.95, 0.06, 1.94, 0.17, -0.08, 0.79, 0.48, 0.01, 2.91, 1.34, 6.86, 0.5, 1.08, 6.84, 2.13, 1.7, 0.53, 0.8, 0.4, 0.66, 2.16, 2.15, 0.48, 0.25, 1.9, 2.57, 2.23, 0.51, 0.35, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/wPO6KyIYst4_filtered.json b/annotations_filtered/wPO6KyIYst4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3565c5716c597036c5a501ab04a24b44ccc5dc21 --- /dev/null +++ b/annotations_filtered/wPO6KyIYst4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.63], [19.0, 19.95], [26.0, 26.52], [31.0, 31.08], [38.0, 39.24], [41.0, 42.35], [47.0, 49.11], [50.0, 50.45], [50.0, 63.71], [93.0, 96.21], [97.0, 96.74], [99.0, 100.9], [108.0, 109.05], [113.0, 114.3], [116.0, 117.95], [123.0, 124.12], [127.0, 131.46], [134.0, 137.37], [164.0, 166.31], [169.0, 171.51], [178.0, 178.77], [183.0, 183.91], [186.0, 187.98], [193.0, 194.1], [198.0, 198.86], [199.0, 211.91], [214.0, 224.41], [225.0, 225.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [52.56, 0.0, 0.0, 0.0, 0.0, 0.0, 32.4, 0.0, 39.37, 35.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.97, 36.25, 32.31, 31.3, 0.0, 0.0, 0.0, 0.0, 0.0, 34.7, 38.52, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 69.1], ["carnatic music", 7.09], ["theremin", 3.4]], null, [["music", 60.84], ["theremin", 8.1], ["musical instrument", 5.51]], [["music", 73.77], ["theremin", 5.64], ["carnatic music", 5.63]], null, null, null, null, null, null, [["music", 54.66], ["speech", 4.36], ["hum", 2.68]], [["music", 51.01], ["synthesizer", 14.22], ["musical instrument", 8.7]], [["music", 73.52], ["theremin", 4.99], ["mantra", 1.87]], [["music", 53.92], ["theremin", 27.65], ["musical instrument", 1.93]], null, null, null, null, null, [["music", 72.88], ["didgeridoo", 3.07], ["speech", 3.06]], [["music", 55.54], ["didgeridoo", 6.84], ["theremin", 5.89]], null], "duration": [3.63, 0.95, 0.52, 0.08, 1.24, 1.35, 2.11, 0.45, 13.71, 3.21, -0.26, 1.9, 1.05, 1.3, 1.95, 1.12, 4.46, 3.37, 2.31, 2.51, 0.77, 0.91, 1.98, 1.1, 0.86, 12.91, 10.41, 0.0]} \ No newline at end of file diff --git a/annotations_filtered/wPSEC3PpLuM_filtered.json b/annotations_filtered/wPSEC3PpLuM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c444a9ff8a0d7f9455e6488f6a43ee2bb93af4f --- /dev/null +++ b/annotations_filtered/wPSEC3PpLuM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.9], [8.0, 15.53], [16.0, 17.52], [19.0, 21.27], [22.0, 22.06], [22.0, 46.97], [47.0, 47.98], [49.0, 49.59], [51.0, 50.9], [53.0, 52.86], [55.0, 60.93], [62.0, 62.83], [64.0, 64.57], [66.0, 67.31], [68.0, 69.53], [70.0, 74.21], [75.0, 74.92], [77.0, 77.06], [79.0, 79.25], [79.0, 79.29], [82.0, 86.66], [91.0, 92.01], [97.0, 98.91], [103.0, 105.83], [118.0, 120.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.8, 54.9, 0.0, 39.05, 0.0, 34.53, 0.0, 0.0, 0.0, 0.0, 64.97, 0.0, 0.0, 0.0, 0.0, 70.72, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.1, 45.72], "audiomae_on_audioset": [null, null, null, [["music", 54.0], ["theremin", 12.27], ["musical instrument", 4.85]], null, [["music", 48.47], ["theremin", 19.78], ["musical instrument", 4.9]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.86], ["boing", 11.8], ["speech", 10.64]]], "duration": [3.9, 7.53, 1.52, 2.27, 0.06, 24.97, 0.98, 0.59, -0.1, -0.14, 5.93, 0.83, 0.57, 1.31, 1.53, 4.21, -0.08, 0.06, 0.25, 0.29, 4.66, 1.01, 1.91, 2.83, 2.02]} \ No newline at end of file diff --git a/annotations_filtered/wPT49WXC0Zo_filtered.json b/annotations_filtered/wPT49WXC0Zo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a67fbfb42c796e9f2894a4232faeaaea65c75c0 --- /dev/null +++ b/annotations_filtered/wPT49WXC0Zo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.15], [11.0, 12.07], [13.0, 14.07], [16.0, 17.04], [31.0, 31.56], [37.0, 37.72], [39.0, 39.21], [40.0, 40.31], [42.0, 42.82], [45.0, 44.98], [47.0, 49.74], [50.0, 51.65], [56.0, 57.01], [60.0, 62.94], [65.0, 65.94], [67.0, 67.32], [72.0, 72.77], [74.0, 74.21], [75.0, 78.14], [79.0, 80.23], [81.0, 82.14], [83.0, 83.27], [85.0, 85.18], [86.0, 87.1], [89.0, 89.67], [91.0, 91.49], [93.0, 95.23], [97.0, 99.45], [100.0, 101.83], [104.0, 104.72], [106.0, 107.27], [109.0, 108.85], [124.0, 125.05], [127.0, 134.05], [135.0, 134.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.23, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.88, 56.03, 0.0, 0.0, 0.0, 0.0, 0.0, 97.54, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.15, 1.07, 1.07, 1.04, 0.56, 0.72, 0.21, 0.31, 0.82, -0.02, 2.74, 1.65, 1.01, 2.94, 0.94, 0.32, 0.77, 0.21, 3.14, 1.23, 1.14, 0.27, 0.18, 1.1, 0.67, 0.49, 2.23, 2.45, 1.83, 0.72, 1.27, -0.15, 1.05, 7.05, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/wPmTp9up26w_filtered.json b/annotations_filtered/wPmTp9up26w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6fde655398aec2bb2ab45c3bbff8a0eff9aa9b7d --- /dev/null +++ b/annotations_filtered/wPmTp9up26w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.23], [7.0, 7.52], [8.0, 9.91], [12.0, 12.58], [14.0, 15.62], [17.0, 18.3], [21.0, 21.66], [22.0, 23.84], [29.0, 30.38], [33.0, 33.61], [36.0, 36.24], [39.0, 39.23], [41.0, 49.37], [50.0, 52.2], [54.0, 56.83], [58.0, 57.87], [59.0, 60.76], [61.0, 61.64], [62.0, 64.17], [66.0, 67.36], [68.0, 71.56], [75.0, 76.27], [79.0, 79.34], [80.0, 80.57], [83.0, 84.32], [86.0, 87.29], [88.0, 88.52], [89.0, 90.66], [92.0, 95.28], [96.0, 98.17], [98.0, 101.43], [103.0, 103.62], [105.0, 104.8], [106.0, 110.4], [111.0, 112.41], [113.0, 117.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.47, 98.36, 99.21, 0.0, 0.0, 0.0, 32.73, 0.0, 54.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.94, 54.36, 76.37, 0.0, 0.0, 98.27, 0.0, 41.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["moo", 22.74], ["livestock, farm animals, working animals", 20.86], ["cattle, bovinae", 20.05]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 21.8], ["hum", 13.49], ["insect", 12.03]]], "duration": [1.23, 0.52, 1.91, 0.58, 1.62, 1.3, 0.66, 1.84, 1.38, 0.61, 0.24, 0.23, 8.37, 2.2, 2.83, -0.13, 1.76, 0.64, 2.17, 1.36, 3.56, 1.27, 0.34, 0.57, 1.32, 1.29, 0.52, 1.66, 3.28, 2.17, 3.43, 0.62, -0.2, 4.4, 1.41, 4.48]} \ No newline at end of file diff --git a/annotations_filtered/wPmgfWpamb0_filtered.json b/annotations_filtered/wPmgfWpamb0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c64457c19d32d9db8bff666afa7776d0443e9eb6 --- /dev/null +++ b/annotations_filtered/wPmgfWpamb0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 26.81], [29.0, 30.72], [32.0, 48.56], [50.0, 51.11], [52.0, 53.05], [54.0, 62.75], [74.0, 83.08], [87.0, 87.99], [92.0, 94.83], [97.0, 103.27], [112.0, 115.5]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 44.81, 0.0, 0.0, 42.19, 35.34, 0.0, 84.25, 44.9, 28.99], "audiomae_on_audioset": [null, null, [["music", 43.14], ["hum", 16.99], ["ambient music", 10.44]], null, null, [["music", 71.73], ["ambient music", 5.14], ["theremin", 4.49]], [["music", 34.52], ["hum", 16.02], ["throbbing", 9.54]], null, null, [["speech", 31.19], ["timpani", 12.39], ["music", 6.67]], [["music", 64.95], ["quack", 5.82], ["duck", 2.55]]], "duration": [1.81, 1.72, 16.56, 1.11, 1.05, 8.75, 9.08, 0.99, 2.83, 6.27, 3.5]} \ No newline at end of file diff --git a/annotations_filtered/wQ5uso-R6aY_filtered.json b/annotations_filtered/wQ5uso-R6aY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be70464bc75518c24a987a01f7958a2ea9436839 --- /dev/null +++ b/annotations_filtered/wQ5uso-R6aY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.64], [5.0, 5.53], [7.0, 7.84], [8.0, 9.14], [11.0, 11.58], [13.0, 14.0], [15.0, 15.65], [20.0, 21.05], [22.0, 23.73], [28.0, 29.2], [39.0, 40.39], [42.0, 42.52], [46.0, 46.57], [52.0, 52.12], [55.0, 56.29], [60.0, 60.42], [64.0, 64.72], [69.0, 70.71], [76.0, 76.87], [80.0, 81.19], [84.0, 84.96], [93.0, 94.91], [101.0, 101.39], [103.0, 103.44], [109.0, 112.56], [115.0, 117.39], [118.0, 120.09], [125.0, 125.49], [127.0, 128.85], [130.0, 138.55], [140.0, 141.08], [142.0, 144.48], [145.0, 159.54], [162.0, 165.32], [168.0, 167.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 92.15, 78.72, 0.0, 0.0, 44.57, 0.0, 46.15, 29.89, 31.2, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 20.38], ["speech", 8.56], ["musical instrument", 3.04]], null, [["music", 54.91], ["hum", 5.1], ["mains hum", 3.44]], [["music", 30.49], ["electric shaver, electric razor", 15.38], ["speech", 15.3]], [["throbbing", 20.71], ["music", 20.37], ["pulse", 14.95]], null], "duration": [0.64, 0.53, 0.84, 1.14, 0.58, 1.0, 0.65, 1.05, 1.73, 1.2, 1.39, 0.52, 0.57, 0.12, 1.29, 0.42, 0.72, 1.71, 0.87, 1.19, 0.96, 1.91, 0.39, 0.44, 3.56, 2.39, 2.09, 0.49, 1.85, 8.55, 1.08, 2.48, 14.54, 3.32, -0.34]} \ No newline at end of file diff --git a/annotations_filtered/wQc-GpTtnR0_filtered.json b/annotations_filtered/wQc-GpTtnR0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92aed9b459e12c1f885b06e71e8ed91558b9383c --- /dev/null +++ b/annotations_filtered/wQc-GpTtnR0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.11], [8.0, 8.88], [11.0, 11.79], [17.0, 25.37], [30.0, 30.43], [35.0, 34.84], [47.0, 48.1], [63.0, 63.34], [64.0, 64.34], [67.0, 67.69], [69.0, 70.01], [70.0, 70.56], [77.0, 77.67], [82.0, 82.83], [85.0, 85.65], [89.0, 88.94], [108.0, 108.77], [110.0, 112.89], [114.0, 115.79], [117.0, 120.82], [122.0, 124.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.9, 0.0, 0.0, 82.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 0.0, 89.36, 82.79], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.11, 0.88, 0.79, 8.37, 0.43, -0.16, 1.1, 0.34, 0.34, 0.69, 1.01, 0.56, 0.67, 0.83, 0.65, -0.06, 0.77, 2.89, 1.79, 3.82, 2.11]} \ No newline at end of file diff --git a/annotations_filtered/wQhcRCuORak_filtered.json b/annotations_filtered/wQhcRCuORak_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e2ff04cdaaabf31b4d2ce66a0687620bc576569 --- /dev/null +++ b/annotations_filtered/wQhcRCuORak_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 7.32], [14.0, 14.18], [16.0, 16.66], [21.0, 22.01], [23.0, 24.44]], "keep_status": [true, false, false, false, false], "silence_prob": [44.69, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 29.97], ["ding", 9.95], ["clang", 9.77]], null, null, null, null], "duration": [7.32, 0.18, 0.66, 1.01, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/wQj8uFwQP2A_filtered.json b/annotations_filtered/wQj8uFwQP2A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b8cf43db9e20026af8e524b9bb3cd15c4d26a68 --- /dev/null +++ b/annotations_filtered/wQj8uFwQP2A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.12], [15.0, 16.29], [21.0, 21.57], [24.0, 24.26], [27.0, 26.99], [27.0, 28.44], [29.0, 31.41], [40.0, 40.49], [58.0, 64.2], [72.0, 76.67], [78.0, 81.65], [83.0, 83.35], [87.0, 88.26], [89.0, 90.75], [91.0, 91.3], [99.0, 105.6], [117.0, 127.55]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.5, 0.0, 36.06, 59.96, 51.44, 0.0, 0.0, 0.0, 0.0, 31.06, 31.68], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 41.9], ["speech", 24.29], ["didgeridoo", 3.28]], null, [["moo", 23.71], ["cattle, bovinae", 23.07], ["livestock, farm animals, working animals", 16.52]], null, null, null, null, null, null, [["music", 63.95], ["didgeridoo", 6.7], ["singing", 2.61]], [["music", 35.09], ["speech", 12.85], ["fart", 10.64]]], "duration": [1.12, 1.29, 0.57, 0.26, -0.01, 1.44, 2.41, 0.49, 6.2, 4.67, 3.65, 0.35, 1.26, 1.75, 0.3, 6.6, 10.55]} \ No newline at end of file diff --git a/annotations_filtered/wRN8Q_Lts7k_filtered.json b/annotations_filtered/wRN8Q_Lts7k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f46311611dacae5bf687186d0722ce592d5a5670 --- /dev/null +++ b/annotations_filtered/wRN8Q_Lts7k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.4], [11.0, 12.45], [13.0, 18.77], [20.0, 20.65], [22.0, 22.77], [23.0, 34.77], [37.0, 37.79], [39.0, 40.41], [41.0, 43.12], [45.0, 48.9], [52.0, 77.43], [80.0, 104.95], [106.0, 107.97]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 73.82, 0.0, 0.0, 62.37, 0.0, 0.0, 51.66, 37.41, 35.59, 89.01, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 25.38], ["hum", 9.2], ["throbbing", 4.51]], [["music", 46.7], ["didgeridoo", 9.34], ["hum", 5.48]], null, null], "duration": [0.4, 1.45, 5.77, 0.65, 0.77, 11.77, 0.79, 1.41, 2.12, 3.9, 25.43, 24.95, 1.97]} \ No newline at end of file diff --git a/annotations_filtered/wR_e9lxh7Ds_filtered.json b/annotations_filtered/wR_e9lxh7Ds_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5185758de67992af46ece4567ef04c26f8ecdd7 --- /dev/null +++ b/annotations_filtered/wR_e9lxh7Ds_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.66], [8.0, 8.9], [13.0, 14.94], [16.0, 21.42], [22.0, 25.0], [27.0, 28.21], [32.0, 32.26], [36.0, 36.34], [46.0, 46.68], [52.0, 52.22], [63.0, 66.85], [97.0, 99.05], [101.0, 108.89], [112.0, 114.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.59, 96.77, 0.0, 0.0, 0.0, 0.0, 0.0, 38.78, 86.64, 54.76, 43.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 24.41], ["cattle, bovinae", 11.22], ["livestock, farm animals, working animals", 9.33]], null, null, [["music", 59.83], ["speech", 24.34], ["musical instrument", 2.52]]], "duration": [0.66, 0.9, 1.94, 5.42, 3.0, 1.21, 0.26, 0.34, 0.68, 0.22, 3.85, 2.05, 7.89, 2.99]} \ No newline at end of file diff --git a/annotations_filtered/wRbKDoyN5oc_filtered.json b/annotations_filtered/wRbKDoyN5oc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4947c1e201adc18efade5d2c99bd5cc4f677d7a3 --- /dev/null +++ b/annotations_filtered/wRbKDoyN5oc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.94], [4.0, 5.56], [7.0, 8.29], [10.0, 10.32], [11.0, 13.54], [16.0, 16.82], [18.0, 20.22], [21.0, 22.35], [24.0, 24.75], [26.0, 26.57], [29.0, 29.89], [31.0, 31.43], [35.0, 35.72], [38.0, 38.23], [40.0, 40.09], [42.0, 42.16], [43.0, 43.66], [44.0, 45.62], [46.0, 46.38], [47.0, 52.12], [53.0, 54.01], [55.0, 57.11], [58.0, 60.59], [62.0, 72.18], [73.0, 74.17], [76.0, 79.0], [81.0, 82.78], [116.0, 117.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 84.8, 62.89, 0.0, 67.25, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.94, 1.56, 1.29, 0.32, 2.54, 0.82, 2.22, 1.35, 0.75, 0.57, 0.89, 0.43, 0.72, 0.23, 0.09, 0.16, 0.66, 1.62, 0.38, 5.12, 1.01, 2.11, 2.59, 10.18, 1.17, 3.0, 1.78, 1.39]} \ No newline at end of file diff --git a/annotations_filtered/wReulnRQA-Y_filtered.json b/annotations_filtered/wReulnRQA-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7406b15881f8bc8d0407b074b25ddeda20c40f92 --- /dev/null +++ b/annotations_filtered/wReulnRQA-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[61.0, 74.51], [75.0, 76.25], [77.0, 76.96], [78.0, 86.22], [88.0, 89.68], [91.0, 91.13], [92.0, 93.02], [98.0, 98.47], [99.0, 100.06], [104.0, 108.9], [112.0, 134.03], [135.0, 136.36], [141.0, 149.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.97, 0.0, 0.0, 36.75, 0.0, 0.0, 0.0, 0.0, 0.0, 33.12, 30.99, 0.0, 38.72], "audiomae_on_audioset": [[["throbbing", 45.5], ["hum", 24.15], ["music", 21.7]], null, null, [["hum", 32.45], ["throbbing", 23.02], ["music", 22.11]], null, null, null, null, null, [["hum", 35.23], ["throbbing", 31.56], ["music", 9.41]], [["speech", 44.7], ["music", 32.75], ["throbbing", 7.45]], null, [["hum", 46.78], ["mains hum", 41.75], ["creak", 1.31]]], "duration": [13.51, 1.25, -0.04, 8.22, 1.68, 0.13, 1.02, 0.47, 1.06, 4.9, 22.03, 1.36, 8.64]} \ No newline at end of file diff --git a/annotations_filtered/wS9RtY8dVpo_filtered.json b/annotations_filtered/wS9RtY8dVpo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02e63454b2a6801df6d416e14b3a83c094f25d61 --- /dev/null +++ b/annotations_filtered/wS9RtY8dVpo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 35.36], [36.0, 61.1], [62.0, 90.36]], "keep_status": [true, false, true], "silence_prob": [30.47, 32.2, 34.86], "audiomae_on_audioset": [[["music", 26.11], ["cattle, bovinae", 12.41], ["groan", 10.85]], [["music", 36.85], ["mains hum", 22.56], ["hum", 15.42]], [["hum", 33.46], ["buzz", 14.95], ["mains hum", 9.18]]], "duration": [11.36, 25.1, 28.36]} \ No newline at end of file diff --git a/annotations_filtered/wSOMPH85zvQ_filtered.json b/annotations_filtered/wSOMPH85zvQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf723f98ecaf533321115bfc8c221251e0fe6d21 --- /dev/null +++ b/annotations_filtered/wSOMPH85zvQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.11], [6.0, 6.84], [8.0, 9.63], [11.0, 12.75], [16.0, 19.74], [20.0, 21.41], [27.0, 30.77], [35.0, 38.87], [41.0, 41.17], [44.0, 47.93], [55.0, 57.08], [58.0, 59.58], [65.0, 65.91], [67.0, 67.19], [72.0, 74.31], [84.0, 87.76], [91.0, 100.53], [103.0, 139.8], [141.0, 142.35], [146.0, 148.54], [153.0, 157.99], [164.0, 178.01], [179.0, 205.07], [206.0, 209.85], [210.0, 214.05], [216.0, 223.92], [226.0, 228.82]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 56.33, 0.0, 56.86, 54.76, 0.0, 44.9, 48.69, 0.0, 0.0, 0.0, 34.49, 36.77, 35.88, 0.0, 0.0, 34.42, 34.31, 45.24, 97.11, 96.29, 71.14, 60.79, 74.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 32.36], ["piano", 11.98], ["musical instrument", 10.81]], [["music", 28.69], ["bow-wow", 5.86], ["dog", 5.84]], null, null, null, [["music", 56.38], ["musical instrument", 10.25], ["guitar", 8.02]], [["music", 49.87], ["musical instrument", 10.1], ["piano", 6.34]], [["music", 62.94], ["musical instrument", 5.39], ["guitar", 4.08]], null, null, [["music", 49.36], ["brass instrument", 11.39], ["trombone", 6.19]], [["music", 59.54], ["musical instrument", 6.71], ["synthesizer", 2.79]], [["music", 66.63], ["musical instrument", 3.81], ["keyboard (musical)", 2.59]], null, null, null, null, null], "duration": [1.11, 0.84, 1.63, 1.75, 3.74, 1.41, 3.77, 3.87, 0.17, 3.93, 2.08, 1.58, 0.91, 0.19, 2.31, 3.76, 9.53, 36.8, 1.35, 2.54, 4.99, 14.01, 26.07, 3.85, 4.05, 7.92, 2.82]} \ No newline at end of file diff --git a/annotations_filtered/wSPAPeO17Zk_filtered.json b/annotations_filtered/wSPAPeO17Zk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54513b6f1182c9a827b463f5dac422473d5c6e38 --- /dev/null +++ b/annotations_filtered/wSPAPeO17Zk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 19.79], [22.0, 26.3], [35.0, 47.02], [49.0, 52.71], [56.0, 61.82]], "keep_status": [true, true, true, false, true], "silence_prob": [30.92, 30.09, 30.43, 32.09, 30.54], "audiomae_on_audioset": [[["music", 35.32], ["hum", 23.86], ["throbbing", 7.19]], [["vehicle", 19.8], ["car", 17.34], ["music", 15.39]], [["music", 21.16], ["vehicle", 11.11], ["car", 10.95]], [["music", 65.16], ["theremin", 2.91], ["musical instrument", 2.89]], [["sidetone", 23.76], ["music", 21.31], ["mains hum", 17.85]]], "duration": [16.79, 4.3, 12.02, 3.71, 5.82]} \ No newline at end of file diff --git a/annotations_filtered/wSdltnqDWV0_filtered.json b/annotations_filtered/wSdltnqDWV0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7a7da89a84ef06d00ab78442b3e2b8b0265f3a9 --- /dev/null +++ b/annotations_filtered/wSdltnqDWV0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.31], [9.0, 11.75], [14.0, 15.38], [16.0, 20.41], [21.0, 31.16], [35.0, 39.95], [40.0, 41.69], [44.0, 44.2], [45.0, 45.86], [52.0, 52.39], [58.0, 59.41], [60.0, 60.27], [66.0, 67.19], [72.0, 72.74], [75.0, 75.83], [80.0, 80.43], [85.0, 86.39], [91.0, 93.51], [96.0, 98.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.09, 100.0, 0.0, 61.57, 81.89, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.95, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.31, 2.75, 1.38, 4.41, 10.16, 4.95, 1.69, 0.2, 0.86, 0.39, 1.41, 0.27, 1.19, 0.74, 0.83, 0.43, 1.39, 2.51, 2.52]} \ No newline at end of file diff --git a/annotations_filtered/wTGRsKLqkGM_filtered.json b/annotations_filtered/wTGRsKLqkGM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9574f8b10fe5671fc2f7f0ec489c0ecff10ca23 --- /dev/null +++ b/annotations_filtered/wTGRsKLqkGM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 80.2], [83.0, 83.03], [84.0, 84.54], [92.0, 143.23]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [33.2, 0.03, 0.54, 51.23]} \ No newline at end of file diff --git a/annotations_filtered/wTLo8CdhxGs_filtered.json b/annotations_filtered/wTLo8CdhxGs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52c057c08cbba4c0162dbc73f390032710735024 --- /dev/null +++ b/annotations_filtered/wTLo8CdhxGs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[75.0, 91.07], [96.0, 98.1], [103.0, 108.6], [109.0, 108.63], [123.0, 122.79], [129.0, 129.52]], "keep_status": [false, false, false, false, false, false], "silence_prob": [29.97, 30.73, 29.86, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 68.55], ["moo", 7.68], ["cattle, bovinae", 4.09]], [["music", 72.4], ["musical instrument", 3.03], ["salsa music", 2.02]], [["music", 57.55], ["speech", 10.96], ["synthesizer", 2.2]], null, null, null], "duration": [16.07, 2.1, 5.6, -0.37, -0.21, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/wTP_SdjD5ms_filtered.json b/annotations_filtered/wTP_SdjD5ms_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/wTP_SdjD5ms_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/wTf4njh9TnE_filtered.json b/annotations_filtered/wTf4njh9TnE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0949aba5eb3acd48751731dda4113158e95b5218 --- /dev/null +++ b/annotations_filtered/wTf4njh9TnE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 20.66], [22.0, 22.89], [26.0, 29.74], [33.0, 35.11], [39.0, 39.75], [43.0, 44.69], [55.0, 55.75], [60.0, 60.42], [62.0, 69.53], [72.0, 72.67], [76.0, 76.84], [78.0, 79.78], [84.0, 87.1], [90.0, 91.88], [94.0, 96.23], [98.0, 98.59], [103.0, 108.28], [110.0, 114.4], [116.0, 118.76], [121.0, 121.39], [126.0, 127.53], [130.0, 131.14]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [50.31, 0.0, 44.2, 61.67, 0.0, 0.0, 0.0, 0.0, 37.72, 0.0, 0.0, 0.0, 37.59, 0.0, 33.97, 0.0, 34.86, 29.51, 32.18, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["throbbing", 29.38], ["hum", 26.86], ["music", 22.21]], null, null, null, null, null, [["speech", 33.63], ["bee, wasp, etc.", 9.21], ["insect", 8.78]], null, null, null, [["music", 56.4], ["throbbing", 15.72], ["hum", 8.48]], null, [["hum", 28.09], ["throbbing", 27.37], ["music", 17.39]], null, [["music", 52.39], ["hum", 9.19], ["throbbing", 8.73]], [["fly, housefly", 19.63], ["insect", 14.44], ["bee, wasp, etc.", 10.53]], [["music", 31.4], ["throbbing", 26.12], ["hum", 24.04]], null, null, null], "duration": [11.66, 0.89, 3.74, 2.11, 0.75, 1.69, 0.75, 0.42, 7.53, 0.67, 0.84, 1.78, 3.1, 1.88, 2.23, 0.59, 5.28, 4.4, 2.76, 0.39, 1.53, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/wTfbHs4HlPo_filtered.json b/annotations_filtered/wTfbHs4HlPo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1d975516b81052fbe398ddc130539a5bb2b5c01 --- /dev/null +++ b/annotations_filtered/wTfbHs4HlPo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.91], [5.0, 5.37], [8.0, 8.56], [11.0, 11.57], [15.0, 16.34], [19.0, 19.04], [20.0, 21.24], [22.0, 24.09], [25.0, 25.41], [26.0, 26.69], [29.0, 29.1], [33.0, 33.94], [39.0, 39.46], [40.0, 51.39], [52.0, 53.47], [55.0, 55.07], [58.0, 58.82], [61.0, 61.72], [63.0, 62.78], [68.0, 71.12], [75.0, 76.54], [78.0, 77.84], [79.0, 79.69], [80.0, 82.93], [87.0, 87.42], [89.0, 89.95], [91.0, 93.58], [95.0, 96.96], [99.0, 103.65], [108.0, 113.83], [114.0, 115.45], [119.0, 120.09], [123.0, 124.87], [127.0, 128.17], [129.0, 130.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, true, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.2, 0.0, 0.0, 0.0, 0.0, 0.0, 54.5, 0.0, 0.0, 0.0, 0.0, 0.0, 31.17, 0.0, 0.0, 0.0, 33.37, 0.0, 0.0, 34.43, 0.0, 33.04, 33.91, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["chirp tone", 16.08], ["sine wave", 14.8], ["whale vocalization", 13.1]], null, null, null, [["music", 32.09], ["speech", 7.46], ["musical instrument", 5.31]], null, null, [["music", 51.91], ["synthesizer", 6.33], ["electronic music", 5.35]], null, [["hum", 26.61], ["speech", 24.87], ["rumble", 11.0]], [["music", 36.01], ["speech", 7.62], ["knock", 5.98]], null, null, null, null, null], "duration": [0.91, 0.37, 0.56, 0.57, 1.34, 0.04, 1.24, 2.09, 0.41, 0.69, 0.1, 0.94, 0.46, 11.39, 1.47, 0.07, 0.82, 0.72, -0.22, 3.12, 1.54, -0.16, 0.69, 2.93, 0.42, 0.95, 2.58, 1.96, 4.65, 5.83, 1.45, 1.09, 1.87, 1.17, 1.4]} \ No newline at end of file diff --git a/annotations_filtered/wTk1noW_8Lo_filtered.json b/annotations_filtered/wTk1noW_8Lo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c8c776ca069bd6c618723cabe6ea82cac9d8a23 --- /dev/null +++ b/annotations_filtered/wTk1noW_8Lo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.11], [2.0, 3.21], [4.0, 4.46], [6.0, 6.42], [8.0, 7.86], [9.0, 10.39], [12.0, 12.01], [13.0, 13.41], [14.0, 14.88], [15.0, 18.93], [21.0, 21.14], [24.0, 24.21], [29.0, 29.93], [31.0, 35.26], [40.0, 40.0], [43.0, 49.54], [50.0, 52.44], [53.0, 55.95], [59.0, 61.55], [64.0, 69.55], [70.0, 70.82], [71.0, 71.44], [72.0, 72.47], [73.0, 73.55], [84.0, 100.9], [103.0, 103.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.4, 0.0, 0.0, 0.0, 56.86, 0.0, 54.36, 62.78, 61.37, 63.64, 50.86, 0.0, 0.0, 0.0, 0.0, 78.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 47.63], ["breaking", 38.1], ["glass", 4.78]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.11, 1.21, 0.46, 0.42, -0.14, 1.39, 0.01, 0.41, 0.88, 3.93, 0.14, 0.21, 0.93, 4.26, 0.0, 6.54, 2.44, 2.95, 2.55, 5.55, 0.82, 0.44, 0.47, 0.55, 16.9, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/wTqLwoaEUmU_filtered.json b/annotations_filtered/wTqLwoaEUmU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51ca80850d053e7713f2e3f47fa64890fc3ee7a0 --- /dev/null +++ b/annotations_filtered/wTqLwoaEUmU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.55], [10.0, 14.18], [15.0, 15.89], [16.0, 17.64], [18.0, 22.77], [26.0, 26.55], [28.0, 29.81], [30.0, 30.94], [32.0, 32.09], [34.0, 34.65], [38.0, 39.29], [41.0, 41.71], [42.0, 42.8], [44.0, 44.54], [47.0, 46.7], [49.0, 49.15], [53.0, 54.3], [56.0, 57.37], [58.0, 59.85], [65.0, 68.62], [71.0, 71.31], [73.0, 75.37], [77.0, 78.02], [80.0, 80.5], [82.0, 81.78], [94.0, 95.17], [98.0, 102.32], [103.0, 103.62], [105.0, 105.63], [107.0, 108.21], [109.0, 109.71], [112.0, 112.09], [113.0, 114.71], [127.0, 127.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 56.55, 0.0, 0.0, 56.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.52, 0.0, 69.74, 0.0, 0.0, 0.0, 0.0, 61.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.55, 4.18, 0.89, 1.64, 4.77, 0.55, 1.81, 0.94, 0.09, 0.65, 1.29, 0.71, 0.8, 0.54, -0.3, 0.15, 1.3, 1.37, 1.85, 3.62, 0.31, 2.37, 1.02, 0.5, -0.22, 1.17, 4.32, 0.62, 0.63, 1.21, 0.71, 0.09, 1.71, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/wTz_kSiZaIM_filtered.json b/annotations_filtered/wTz_kSiZaIM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..352fea0f9c6923d2a6486999dbbe9e3dda90dad2 --- /dev/null +++ b/annotations_filtered/wTz_kSiZaIM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[93.0, 93.63], [95.0, 125.59], [128.0, 128.7], [132.0, 136.31], [140.0, 143.07]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 49.73, 81.35], "audiomae_on_audioset": [null, null, null, [["crushing", 25.72], ["music", 25.56], ["wood", 16.91]], null], "duration": [0.63, 30.59, 0.7, 4.31, 3.07]} \ No newline at end of file diff --git a/annotations_filtered/wTzfJT3zGz0_filtered.json b/annotations_filtered/wTzfJT3zGz0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74f93a445cafa48e39d741f88e3348a32ed71ba4 --- /dev/null +++ b/annotations_filtered/wTzfJT3zGz0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.62], [23.0, 23.21], [38.0, 52.15], [56.0, 61.28], [65.0, 76.99], [79.0, 79.32], [80.0, 86.73], [92.0, 97.38], [98.0, 101.04], [110.0, 121.26], [124.0, 127.79]], "keep_status": [false, false, true, true, false, false, true, false, false, false, true], "silence_prob": [37.9, 0.0, 31.39, 32.02, 33.72, 0.0, 34.96, 35.18, 35.66, 33.48, 30.22], "audiomae_on_audioset": [[["hum", 39.93], ["throbbing", 27.94], ["music", 10.53]], null, [["cattle, bovinae", 19.77], ["livestock, farm animals, working animals", 16.49], ["moo", 16.46]], [["music", 30.27], ["speech", 17.16], ["mains hum", 14.98]], [["music", 32.29], ["throbbing", 31.45], ["hum", 15.18]], null, [["music", 38.85], ["throbbing", 22.3], ["hum", 6.55]], [["throbbing", 46.5], ["music", 36.69], ["hum", 9.92]], [["music", 54.91], ["throbbing", 14.32], ["hum", 7.77]], [["hum", 37.39], ["speech", 18.98], ["throbbing", 15.09]], [["music", 20.77], ["throbbing", 19.19], ["hum", 17.96]]], "duration": [2.62, 0.21, 14.15, 5.28, 11.99, 0.32, 6.73, 5.38, 3.04, 11.26, 3.79]} \ No newline at end of file diff --git a/annotations_filtered/wU7TupjcCbo_filtered.json b/annotations_filtered/wU7TupjcCbo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0cc3d5600e918053a9f3a0d41e6f145f73b84b6 --- /dev/null +++ b/annotations_filtered/wU7TupjcCbo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.8], [13.0, 14.66], [15.0, 20.06], [24.0, 28.81], [62.0, 63.12], [64.0, 65.4], [67.0, 69.99], [73.0, 73.28], [86.0, 85.83]], "keep_status": [false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 28.98, 29.05, 0.0, 0.0, 29.49, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 76.9], ["drum and bass", 4.07], ["didgeridoo", 1.99]], [["music", 50.01], ["electric shaver, electric razor", 7.41], ["drum and bass", 6.43]], null, null, [["music", 36.24], ["drum and bass", 14.07], ["didgeridoo", 6.89]], null, null], "duration": [1.8, 1.66, 5.06, 4.81, 1.12, 1.4, 2.99, 0.28, -0.17]} \ No newline at end of file diff --git a/annotations_filtered/wUEYIhP_9ag_filtered.json b/annotations_filtered/wUEYIhP_9ag_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4b09686eb759b9d259c0c3611392fd8e03a8603 --- /dev/null +++ b/annotations_filtered/wUEYIhP_9ag_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.33], [14.0, 27.04], [31.0, 32.37], [45.0, 45.52], [48.0, 48.05], [50.0, 50.75], [54.0, 54.26], [63.0, 63.51], [69.0, 69.09], [73.0, 81.82], [82.0, 82.95], [85.0, 91.1], [93.0, 119.08], [121.0, 126.76], [127.0, 128.51], [129.0, 130.45], [135.0, 138.42], [142.0, 146.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [38.55, 32.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.74, 0.0, 32.95, 32.92, 33.6, 0.0, 0.0, 46.02, 46.86], "audiomae_on_audioset": [[["music", 59.73], ["musical instrument", 6.59], ["synthesizer", 5.29]], [["music", 77.35], ["throbbing", 2.9], ["electronic music", 2.68]], null, null, null, null, null, null, null, [["music", 78.11], ["theremin", 8.23], ["opera", 4.72]], null, [["music", 80.91], ["opera", 8.68], ["singing", 2.43]], [["music", 83.25], ["theremin", 4.65], ["classical music", 2.5]], [["music", 78.99], ["theremin", 5.53], ["opera", 3.15]], null, null, [["music", 48.7], ["yodeling", 10.17], ["singing", 4.8]], [["music", 58.24], ["theremin", 10.65], ["mantra", 3.96]]], "duration": [2.33, 13.04, 1.37, 0.52, 0.05, 0.75, 0.26, 0.51, 0.09, 8.82, 0.95, 6.1, 26.08, 5.76, 1.51, 1.45, 3.42, 4.58]} \ No newline at end of file diff --git a/annotations_filtered/wUJccK4lV74_filtered.json b/annotations_filtered/wUJccK4lV74_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25267da637126443b9cca58f9d60967570080176 --- /dev/null +++ b/annotations_filtered/wUJccK4lV74_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.21], [6.0, 8.53], [18.0, 19.2], [24.0, 24.46], [25.0, 26.86], [30.0, 30.7], [32.0, 33.25], [34.0, 34.59], [50.0, 50.38], [53.0, 54.72], [59.0, 60.79], [69.0, 69.7], [77.0, 80.16], [81.0, 81.97], [83.0, 83.89], [85.0, 85.97], [91.0, 93.33], [94.0, 96.21], [98.0, 114.66], [115.0, 122.91], [123.0, 128.49], [129.0, 131.75], [132.0, 133.41], [134.0, 138.06], [140.0, 141.57], [143.0, 143.95], [144.0, 144.81], [146.0, 146.79], [148.0, 148.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 99.97, 100.0, 54.04, 93.76, 99.96, 98.93, 0.0, 99.05, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.21, 2.53, 1.2, 0.46, 1.86, 0.7, 1.25, 0.59, 0.38, 1.72, 1.79, 0.7, 3.16, 0.97, 0.89, 0.97, 2.33, 2.21, 16.66, 7.91, 5.49, 2.75, 1.41, 4.06, 1.57, 0.95, 0.81, 0.79, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/wUP31hGC1A0_filtered.json b/annotations_filtered/wUP31hGC1A0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6cb4548d1f9374925df180259e4e837f75ea381 --- /dev/null +++ b/annotations_filtered/wUP31hGC1A0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.47], [34.0, 33.78], [44.0, 44.63], [53.0, 54.09], [55.0, 55.7], [57.0, 57.6], [61.0, 61.75], [65.0, 71.83], [74.0, 75.56]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.47, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.47, -0.22, 0.63, 1.09, 0.7, 0.6, 0.75, 6.83, 1.56]} \ No newline at end of file diff --git a/annotations_filtered/wUPc7frUlD8_filtered.json b/annotations_filtered/wUPc7frUlD8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04e2f7fd1188daab5a2e762f2d4136c81e50727c --- /dev/null +++ b/annotations_filtered/wUPc7frUlD8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.13], [8.0, 29.05], [30.0, 31.36], [32.0, 32.22], [33.0, 33.49], [36.0, 39.9], [42.0, 42.96], [47.0, 48.88], [52.0, 54.3], [56.0, 56.15], [57.0, 59.39], [62.0, 61.7], [63.0, 64.15], [65.0, 67.83], [69.0, 69.77], [73.0, 73.82], [84.0, 84.25], [89.0, 89.02], [91.0, 94.56], [95.0, 97.43], [102.0, 102.59], [105.0, 106.0], [114.0, 114.17], [115.0, 115.52], [116.0, 116.53], [118.0, 122.18]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 42.0, 0.0, 0.0, 0.0, 76.7, 0.0, 0.0, 90.25, 0.0, 33.04, 0.0, 0.0, 92.8, 0.0, 0.0, 0.0, 0.0, 82.61, 80.11, 0.0, 0.0, 0.0, 0.0, 0.0, 33.33], "audiomae_on_audioset": [null, [["music", 53.8], ["effects unit", 7.36], ["didgeridoo", 4.23]], null, null, null, null, null, null, null, null, [["speech", 25.68], ["mains hum", 14.6], ["hum", 13.07]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.61], ["hum", 11.18], ["mains hum", 4.83]]], "duration": [1.13, 21.05, 1.36, 0.22, 0.49, 3.9, 0.96, 1.88, 2.3, 0.15, 2.39, -0.3, 1.15, 2.83, 0.77, 0.82, 0.25, 0.02, 3.56, 2.43, 0.59, 1.0, 0.17, 0.52, 0.53, 4.18]} \ No newline at end of file diff --git a/annotations_filtered/wUZxSf_P2r0_filtered.json b/annotations_filtered/wUZxSf_P2r0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c26fad05573e29af043e7c0ef28d81ba88aac13d --- /dev/null +++ b/annotations_filtered/wUZxSf_P2r0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.54], [4.0, 3.99], [6.0, 8.24], [9.0, 10.5], [14.0, 13.83], [15.0, 15.28], [16.0, 16.14], [19.0, 20.65], [22.0, 23.55], [24.0, 24.85], [25.0, 26.5], [27.0, 28.39], [30.0, 30.08], [33.0, 33.37], [36.0, 37.99], [41.0, 41.76], [46.0, 47.29], [48.0, 49.54], [53.0, 53.28], [56.0, 57.69], [60.0, 61.64], [65.0, 66.29], [70.0, 71.29], [72.0, 72.5], [74.0, 74.09], [74.0, 75.03], [76.0, 76.06], [78.0, 78.11], [84.0, 86.43], [91.0, 92.1], [95.0, 95.01], [96.0, 98.46], [101.0, 101.36], [103.0, 107.5], [108.0, 110.0], [110.0, 112.29], [114.0, 115.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 81.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0, 41.09, 0.0, 43.82, 38.88, 41.34, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 30.23], ["chirp tone", 13.38], ["sine wave", 11.62]], null, [["speech", 70.8], ["helicopter", 5.53], ["sidetone", 5.29]], [["speech", 27.61], ["insect", 5.22], ["mechanical fan", 4.72]], [["speech", 63.52], ["vehicle", 5.04], ["hum", 3.03]], null], "duration": [1.54, -0.01, 2.24, 1.5, -0.17, 0.28, 0.14, 1.65, 1.55, 0.85, 1.5, 1.39, 0.08, 0.37, 1.99, 0.76, 1.29, 1.54, 0.28, 1.69, 1.64, 1.29, 1.29, 0.5, 0.09, 1.03, 0.06, 0.11, 2.43, 1.1, 0.01, 2.46, 0.36, 4.5, 2.0, 2.29, 1.21]} \ No newline at end of file diff --git a/annotations_filtered/wV-0rTzEedk_filtered.json b/annotations_filtered/wV-0rTzEedk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2bc6f087f95d4806ec6cc666e1bdc874b75d0de --- /dev/null +++ b/annotations_filtered/wV-0rTzEedk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 13.66], [17.0, 26.23], [30.0, 37.02]], "keep_status": [false, false, false], "silence_prob": [29.0, 29.22, 29.34], "audiomae_on_audioset": [[["music", 85.98], ["hip hop music", 4.38], ["rapping", 2.01]], [["music", 91.66], ["hip hop music", 2.09], ["rapping", 1.22]], [["music", 93.78], ["hip hop music", 2.2], ["rapping", 1.15]]], "duration": [6.66, 9.23, 7.02]} \ No newline at end of file diff --git a/annotations_filtered/wV7vM4-FzJM_filtered.json b/annotations_filtered/wV7vM4-FzJM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6710e42b6835bb53dcead3ea23afafef6148144 --- /dev/null +++ b/annotations_filtered/wV7vM4-FzJM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.95], [2.0, 3.62], [6.0, 7.92], [8.0, 9.29], [15.0, 15.16], [19.0, 20.01], [29.0, 30.74], [31.0, 32.21], [50.0, 50.8], [52.0, 51.83], [54.0, 53.84], [58.0, 58.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.05, 1.62, 1.92, 1.29, 0.16, 1.01, 1.74, 1.21, 0.8, -0.17, -0.16, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/wVAL10Zb9Q4_filtered.json b/annotations_filtered/wVAL10Zb9Q4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0958696ad9d990ebd667c387e75ee2f646782800 --- /dev/null +++ b/annotations_filtered/wVAL10Zb9Q4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.15], [12.0, 12.56], [13.0, 13.54], [15.0, 15.09], [16.0, 16.21], [20.0, 20.24], [27.0, 27.85], [29.0, 28.71], [33.0, 33.72], [44.0, 44.14], [46.0, 46.97], [48.0, 48.1], [52.0, 70.19], [74.0, 79.78], [98.0, 101.56], [104.0, 104.95], [106.0, 107.55], [110.0, 112.02], [115.0, 116.14], [117.0, 123.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.27, 30.2, 29.16, 0.0, 0.0, 71.72, 0.0, 30.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.34], ["fart", 10.31], ["bouncing", 6.55]], [["explosion", 48.68], ["speech", 30.2], ["burst, pop", 15.39]], [["explosion", 25.32], ["speech", 24.51], ["burst, pop", 16.85]], null, null, null, null, [["speech", 42.72], ["explosion", 22.35], ["burst, pop", 12.07]]], "duration": [1.15, 0.56, 0.54, 0.09, 0.21, 0.24, 0.85, -0.29, 0.72, 0.14, 0.97, 0.1, 18.19, 5.78, 3.56, 0.95, 1.55, 2.02, 1.14, 6.06]} \ No newline at end of file diff --git a/annotations_filtered/wVFNjHAnpcI_filtered.json b/annotations_filtered/wVFNjHAnpcI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf9cdb9c54d63ebfd1cd56231ca55ec2b6fe4198 --- /dev/null +++ b/annotations_filtered/wVFNjHAnpcI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.81], [4.0, 3.75], [4.0, 9.07], [14.0, 15.69], [18.0, 18.71], [36.0, 35.94], [36.0, 43.98], [49.0, 49.74], [52.0, 51.76], [52.0, 53.64], [56.0, 56.05], [58.0, 58.55], [63.0, 66.06], [93.0, 97.09]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.42, 0.0, 0.0, 0.0, 36.36, 0.0, 0.0, 0.0, 0.0, 0.0, 40.41, 99.71], "audiomae_on_audioset": [null, null, [["speech", 44.69], ["computer keyboard", 10.57], ["typewriter", 10.21]], null, null, null, [["speech", 68.54], ["noise", 17.93], ["telephone", 2.66]], null, null, null, null, null, [["speech", 59.73], ["telephone", 8.25], ["radio", 4.52]], null], "duration": [0.81, -0.25, 5.07, 1.69, 0.71, -0.06, 7.98, 0.74, -0.24, 1.64, 0.05, 0.55, 3.06, 4.09]} \ No newline at end of file diff --git a/annotations_filtered/wVP1wO_E4yk_filtered.json b/annotations_filtered/wVP1wO_E4yk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/wVP1wO_E4yk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/wVWk6IfRuEE_filtered.json b/annotations_filtered/wVWk6IfRuEE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..529d8e3345feca5aa3758fb60b71104795dd2f59 --- /dev/null +++ b/annotations_filtered/wVWk6IfRuEE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.27], [11.0, 11.53], [15.0, 16.01], [18.0, 18.44], [19.0, 19.82], [21.0, 22.44], [25.0, 27.08], [29.0, 29.91], [40.0, 41.28], [43.0, 46.23], [52.0, 53.13], [58.0, 59.14], [59.0, 61.99], [66.0, 65.8], [78.0, 80.79], [85.0, 86.75], [88.0, 89.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.21, 0.0, 0.0, 67.76, 0.0, 0.0, 43.08, 0.0, 59.59, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 22.09], ["whale vocalization", 19.08], ["stomach rumble", 6.02]], null, null, null, null], "duration": [1.27, 0.53, 1.01, 0.44, 0.82, 1.44, 2.08, 0.91, 1.28, 3.23, 1.13, 1.14, 2.99, -0.2, 2.79, 1.75, 1.75]} \ No newline at end of file diff --git a/annotations_filtered/wVpIChmQ7dQ_filtered.json b/annotations_filtered/wVpIChmQ7dQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2ef7dcc2b6d647a86487053c72e03d3181a581c --- /dev/null +++ b/annotations_filtered/wVpIChmQ7dQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.01], [6.0, 8.04], [13.0, 13.9], [19.0, 19.5], [26.0, 26.1], [27.0, 27.8], [30.0, 30.47], [32.0, 35.19], [36.0, 46.48], [51.0, 54.7], [56.0, 57.42], [59.0, 59.04], [61.0, 61.13], [62.0, 63.14], [64.0, 64.99], [66.0, 66.8], [69.0, 70.07], [73.0, 73.68], [76.0, 97.77], [99.0, 100.21], [101.0, 101.34], [102.0, 104.01], [105.0, 107.67], [109.0, 109.66], [110.0, 111.0], [113.0, 113.71], [117.0, 117.21], [120.0, 120.38], [123.0, 125.58], [126.0, 126.67]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 48.95, 35.57, 49.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.38, 0.0, 0.0, 99.36, 59.15, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 31.47], ["music", 25.83], ["gong", 13.66]], [["music", 43.7], ["speech", 16.2], ["theremin", 5.64]], [["theremin", 38.2], ["music", 35.44], ["musical instrument", 3.04]], null, null, null, null, null, null, null, null, [["speech", 49.5], ["radio", 23.21], ["noise", 4.57]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.01, 2.04, 0.9, 0.5, 0.1, 0.8, 0.47, 3.19, 10.48, 3.7, 1.42, 0.04, 0.13, 1.14, 0.99, 0.8, 1.07, 0.68, 21.77, 1.21, 0.34, 2.01, 2.67, 0.66, 1.0, 0.71, 0.21, 0.38, 2.58, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/wVsMJ0ntvmc_filtered.json b/annotations_filtered/wVsMJ0ntvmc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c13c0cb681931983067f381603dd152d5cb5123 --- /dev/null +++ b/annotations_filtered/wVsMJ0ntvmc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.81], [5.0, 8.38], [9.0, 11.82], [13.0, 13.74], [15.0, 15.79], [19.0, 19.01], [20.0, 21.29], [21.0, 22.99], [27.0, 26.97], [32.0, 32.59]], "keep_status": [false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.4, 37.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 30.42], ["whale vocalization", 11.82], ["hiccup", 7.2]], [["bee, wasp, etc.", 57.94], ["fly, housefly", 24.11], ["insect", 11.16]], null, null, null, null, null, null, null], "duration": [0.81, 3.38, 2.82, 0.74, 0.79, 0.01, 1.29, 1.99, -0.03, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/wW0L86VZScs_filtered.json b/annotations_filtered/wW0L86VZScs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfc65ffba17b301ea9f25630feea51e9bc3ecbf7 --- /dev/null +++ b/annotations_filtered/wW0L86VZScs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.31], [24.0, 24.9], [25.0, 25.12], [25.0, 27.33], [30.0, 34.75], [36.0, 36.09], [36.0, 38.18], [39.0, 46.13], [50.0, 58.01], [62.0, 64.62], [66.0, 67.0], [68.0, 70.7], [73.0, 73.38], [75.0, 75.57], [81.0, 88.99], [96.0, 100.09], [100.0, 100.43], [101.0, 100.58], [101.0, 104.95], [108.0, 118.69], [120.0, 122.2], [123.0, 122.81]], "keep_status": [false, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 45.24, 40.01, 0.0, 93.91, 46.05, 57.4, 93.91, 0.0, 95.23, 0.0, 0.0, 33.95, 35.09, 0.0, 0.0, 43.82, 37.01, 39.3, 0.0], "audiomae_on_audioset": [null, null, null, [["fart", 23.96], ["speech", 19.92], ["sine wave", 4.64]], [["fly, housefly", 24.49], ["mosquito", 19.95], ["insect", 11.1]], null, null, [["speech", 23.05], ["hum", 11.95], ["mains hum", 9.44]], null, null, null, null, null, null, [["music", 60.98], ["speech", 9.62], ["didgeridoo", 6.21]], [["cattle, bovinae", 43.95], ["moo", 31.19], ["livestock, farm animals, working animals", 14.82]], null, null, [["speech", 18.57], ["single-lens reflex camera", 15.48], ["music", 7.21]], [["music", 74.98], ["speech", 4.66], ["didgeridoo", 3.56]], [["speech", 41.29], ["music", 28.16], ["boing", 10.65]], null], "duration": [1.31, 0.9, 0.12, 2.33, 4.75, 0.09, 2.18, 7.13, 8.01, 2.62, 1.0, 2.7, 0.38, 0.57, 7.99, 4.09, 0.43, -0.42, 3.95, 10.69, 2.2, -0.19]} \ No newline at end of file diff --git a/annotations_filtered/wW0WRqnLYMw_filtered.json b/annotations_filtered/wW0WRqnLYMw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a211e1713a96952f52572b5df14558aff240ecb8 --- /dev/null +++ b/annotations_filtered/wW0WRqnLYMw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.38], [12.0, 18.77], [20.0, 20.68], [21.0, 30.35], [40.0, 45.64], [85.0, 84.97], [97.0, 102.49], [103.0, 102.86], [103.0, 103.76], [104.0, 103.94], [104.0, 115.26], [116.0, 120.82], [126.0, 126.82], [129.0, 131.26], [133.0, 134.4], [137.0, 138.47], [141.0, 141.2], [143.0, 144.12], [149.0, 149.88], [168.0, 174.66], [177.0, 197.95], [199.0, 200.35], [207.0, 208.62], [210.0, 214.3], [218.0, 219.0]], "keep_status": [false, true, false, true, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [37.49, 43.77, 0.0, 30.49, 43.08, 0.0, 37.58, 0.0, 0.0, 0.0, 36.88, 32.42, 0.0, 90.43, 0.0, 0.0, 0.0, 0.0, 0.0, 52.8, 31.14, 0.0, 0.0, 29.76, 0.0], "audiomae_on_audioset": [[["music", 37.91], ["theremin", 27.39], ["synthesizer", 10.47]], [["music", 22.98], ["hum", 14.83], ["mains hum", 8.81]], null, [["music", 33.29], ["speech", 14.67], ["boing", 6.62]], [["music", 39.76], ["whale vocalization", 10.16], ["didgeridoo", 4.51]], null, [["music", 42.42], ["speech", 15.54], ["musical instrument", 6.74]], null, null, null, [["music", 65.96], ["synthesizer", 7.86], ["electronic music", 5.35]], [["music", 20.87], ["effects unit", 11.03], ["synthesizer", 6.08]], null, null, null, null, null, null, null, null, [["music", 20.49], ["vehicle", 11.33], ["car", 4.9]], null, null, [["civil defense siren", 37.02], ["siren", 23.26], ["speech", 6.2]], null], "duration": [8.38, 6.77, 0.68, 9.35, 5.64, -0.03, 5.49, -0.14, 0.76, -0.06, 11.26, 4.82, 0.82, 2.26, 1.4, 1.47, 0.2, 1.12, 0.88, 6.66, 20.95, 1.35, 1.62, 4.3, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/wWKQ2aOTfN0_filtered.json b/annotations_filtered/wWKQ2aOTfN0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7acb5b7e3c2653d5561201e64d309691d616207c --- /dev/null +++ b/annotations_filtered/wWKQ2aOTfN0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.06], [2.0, 2.61], [5.0, 5.75], [9.0, 10.03], [10.0, 11.03], [15.0, 14.76], [15.0, 16.14], [17.0, 29.35], [32.0, 47.21], [51.0, 113.8], [117.0, 118.18], [119.0, 120.12], [121.0, 124.8], [126.0, 127.36]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.59, 29.38, 0.0, 0.0, 0.0, 85.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 16.42], ["cattle, bovinae", 10.9], ["grunt", 5.7]], [["hum", 35.07], ["mains hum", 16.96], ["throbbing", 14.83]], null, null, null, null, null], "duration": [0.06, 0.61, 0.75, 1.03, 1.03, -0.24, 1.14, 12.35, 15.21, 62.8, 1.18, 1.12, 3.8, 1.36]} \ No newline at end of file diff --git a/annotations_filtered/wWRnv1V8iUY_filtered.json b/annotations_filtered/wWRnv1V8iUY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42e2292c045d97b58181c1108999d09743babed5 --- /dev/null +++ b/annotations_filtered/wWRnv1V8iUY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.73], [8.0, 8.6], [10.0, 13.64], [19.0, 22.62], [26.0, 26.52], [27.0, 28.22], [40.0, 40.56], [43.0, 43.88], [44.0, 46.47], [49.0, 50.99], [51.0, 51.9], [54.0, 56.19], [57.0, 57.65], [59.0, 59.49], [62.0, 63.66], [65.0, 66.82], [68.0, 69.16], [72.0, 73.23], [75.0, 76.5], [81.0, 84.28], [90.0, 90.41], [92.0, 96.82], [103.0, 131.13], [133.0, 136.49], [141.0, 141.69], [146.0, 149.42], [152.0, 152.51], [154.0, 158.45]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, true, false, true, true, false, false, true, false, true], "silence_prob": [0.0, 0.0, 96.89, 34.02, 0.0, 0.0, 0.0, 0.0, 46.29, 0.0, 0.0, 32.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.06, 0.0, 30.37, 29.82, 97.73, 0.0, 30.33, 0.0, 39.46], "audiomae_on_audioset": [null, null, null, [["theremin", 42.52], ["music", 37.2], ["wind instrument, woodwind instrument", 2.14]], null, null, null, null, [["music", 19.56], ["speech", 16.36], ["musical instrument", 2.49]], null, null, [["music", 41.57], ["noise", 9.57], ["fart", 7.64]], null, null, null, null, null, null, null, [["music", 35.04], ["speech", 10.66], ["foghorn", 7.19]], null, [["music", 42.21], ["speech", 7.99], ["didgeridoo", 5.06]], [["speech", 36.37], ["music", 18.02], ["throbbing", 7.55]], null, null, [["music", 20.78], ["whale vocalization", 10.77], ["musical instrument", 7.86]], null, [["music", 24.47], ["speech", 20.52], ["moo", 9.98]]], "duration": [0.73, 0.6, 3.64, 3.62, 0.52, 1.22, 0.56, 0.88, 2.47, 1.99, 0.9, 2.19, 0.65, 0.49, 1.66, 1.82, 1.16, 1.23, 1.5, 3.28, 0.41, 4.82, 28.13, 3.49, 0.69, 3.42, 0.51, 4.45]} \ No newline at end of file diff --git a/annotations_filtered/wWrB-Gbjnik_filtered.json b/annotations_filtered/wWrB-Gbjnik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c93adbe955b44066eedbf044e28439c4074b033 --- /dev/null +++ b/annotations_filtered/wWrB-Gbjnik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.04], [21.0, 21.71], [27.0, 29.39], [38.0, 38.89], [40.0, 40.49], [44.0, 44.58], [49.0, 49.38], [50.0, 51.33], [53.0, 53.76], [73.0, 73.57], [118.0, 118.15], [120.0, 120.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.04, 0.71, 2.39, 0.89, 0.49, 0.58, 0.38, 1.33, 0.76, 0.57, 0.15, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/wWswgKOqkZM_filtered.json b/annotations_filtered/wWswgKOqkZM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5bfcda59d14305e37507a2d533a499b5c95a3f20 --- /dev/null +++ b/annotations_filtered/wWswgKOqkZM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.37], [8.0, 9.36], [10.0, 11.75], [14.0, 15.08], [22.0, 22.18], [26.0, 31.83], [34.0, 37.67], [39.0, 39.6], [42.0, 44.22], [45.0, 47.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.91, 99.8, 0.0, 99.52, 97.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.37, 1.36, 1.75, 1.08, 0.18, 5.83, 3.67, 0.6, 2.22, 2.51]} \ No newline at end of file diff --git a/annotations_filtered/wX2AeW_M-xc_filtered.json b/annotations_filtered/wX2AeW_M-xc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..03a80048085c44889751358850bb5aab809a12c5 --- /dev/null +++ b/annotations_filtered/wX2AeW_M-xc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 17.22], [18.0, 20.04], [24.0, 24.38], [25.0, 26.62], [36.0, 36.24], [36.0, 37.89], [39.0, 60.42], [61.0, 104.26], [105.0, 121.22], [124.0, 124.36], [126.0, 148.63], [156.0, 158.31], [159.0, 161.64], [162.0, 162.5], [169.0, 174.34], [175.0, 177.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 97.22, 0.0, 0.0, 0.0, 0.0, 85.54, 0.0, 100.0, 0.0, 97.11, 100.0, 100.0, 0.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.22, 2.04, 0.38, 1.62, 0.24, 1.89, 21.42, 43.26, 16.22, 0.36, 22.63, 2.31, 2.64, 0.5, 5.34, 2.08]} \ No newline at end of file diff --git a/annotations_filtered/wXDgyuxBuBU_filtered.json b/annotations_filtered/wXDgyuxBuBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a53be61512e7f1bac882c1a8816816be871c94f --- /dev/null +++ b/annotations_filtered/wXDgyuxBuBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.79], [39.0, 39.34], [41.0, 41.69], [42.0, 43.07], [44.0, 45.72], [47.0, 47.11], [48.0, 49.42], [57.0, 57.57], [60.0, 62.68], [63.0, 63.48], [67.0, 66.92], [67.0, 67.95], [78.0, 78.97], [89.0, 89.31], [91.0, 91.2], [92.0, 101.04], [104.0, 108.57], [111.0, 112.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.55, 38.91, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.11], ["speech", 8.71], ["fart", 8.13]], null], "duration": [0.79, 0.34, 0.69, 1.07, 1.72, 0.11, 1.42, 0.57, 2.68, 0.48, -0.08, 0.95, 0.97, 0.31, 0.2, 9.04, 4.57, 1.94]} \ No newline at end of file diff --git a/annotations_filtered/wXLFg03in2U_filtered.json b/annotations_filtered/wXLFg03in2U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd5f6523bcb72dadf24f6b0160abe5ec7a31347c --- /dev/null +++ b/annotations_filtered/wXLFg03in2U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 50.43], [52.0, 52.19], [54.0, 54.87], [57.0, 57.47], [58.0, 88.62], [91.0, 94.61], [96.0, 96.23], [97.0, 99.0], [100.0, 102.39], [104.0, 130.72]], "keep_status": [true, false, false, false, false, false, false, false, false, false], "silence_prob": [30.36, 0.0, 0.0, 0.0, 0.0, 32.36, 0.0, 32.01, 31.4, 30.11], "audiomae_on_audioset": [[["music", 25.7], ["hum", 11.3], ["throbbing", 9.08]], null, null, null, null, [["music", 65.54], ["didgeridoo", 14.17], ["musical instrument", 3.35]], null, [["music", 61.34], ["speech", 17.86], ["throbbing", 9.72]], [["music", 39.64], ["throbbing", 32.07], ["hum", 10.58]], [["music", 54.58], ["speech", 13.34], ["throbbing", 5.78]]], "duration": [11.43, 0.19, 0.87, 0.47, 30.62, 3.61, 0.23, 2.0, 2.39, 26.72]} \ No newline at end of file diff --git a/annotations_filtered/wXQ1EhVW2xQ_filtered.json b/annotations_filtered/wXQ1EhVW2xQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1311b53c1c5588e6f1ed3e6837c290fd55b30480 --- /dev/null +++ b/annotations_filtered/wXQ1EhVW2xQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.94], [4.0, 18.71], [22.0, 24.87], [26.0, 29.05], [30.0, 33.12], [34.0, 36.66], [39.0, 41.34], [42.0, 45.27], [46.0, 49.11], [50.0, 59.98], [60.0, 61.3], [63.0, 65.28], [66.0, 66.72], [67.0, 66.93], [67.0, 70.5], [73.0, 74.09], [76.0, 82.9], [86.0, 90.12], [93.0, 96.52], [97.0, 99.84], [104.0, 105.39], [107.0, 110.51], [119.0, 119.99], [121.0, 121.12], [121.0, 122.18], [124.0, 127.25], [129.0, 130.76], [132.0, 137.59], [138.0, 140.48], [141.0, 144.71], [146.0, 150.06], [152.0, 153.99], [155.0, 156.61], [161.0, 161.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.97, 87.55, 100.0, 100.0, 100.0, 100.0, 99.73, 99.84, 99.4, 0.0, 85.72, 0.0, 0.0, 68.93, 0.0, 97.54, 99.97, 82.07, 99.56, 0.0, 97.22, 0.0, 0.0, 0.0, 96.04, 0.0, 97.11, 90.43, 94.37, 94.22, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.94, 14.71, 2.87, 3.05, 3.12, 2.66, 2.34, 3.27, 3.11, 9.98, 1.3, 2.28, 0.72, -0.07, 3.5, 1.09, 6.9, 4.12, 3.52, 2.84, 1.39, 3.51, 0.99, 0.12, 1.18, 3.25, 1.76, 5.59, 2.48, 3.71, 4.06, 1.99, 1.61, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/wXWoyVboDpI_filtered.json b/annotations_filtered/wXWoyVboDpI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6469459d21941b57d66b8801a5d59aa0e45ebbd2 --- /dev/null +++ b/annotations_filtered/wXWoyVboDpI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 43.39], [45.0, 51.31], [52.0, 53.15], [54.0, 54.9], [56.0, 63.54], [65.0, 66.7], [68.0, 70.83], [73.0, 76.05], [77.0, 79.84], [81.0, 81.73], [82.0, 104.19], [110.0, 112.63], [114.0, 113.7], [116.0, 116.26], [119.0, 119.87], [120.0, 125.2]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [30.88, 34.09, 0.0, 0.0, 33.94, 0.0, 55.04, 56.18, 55.18, 0.0, 32.3, 70.86, 0.0, 0.0, 0.0, 49.87], "audiomae_on_audioset": [[["hum", 25.47], ["mains hum", 16.61], ["music", 15.69]], [["music", 50.05], ["scary music", 11.71], ["hum", 11.48]], null, null, [["music", 27.05], ["hum", 23.9], ["noise", 17.61]], null, null, null, null, null, [["music", 32.02], ["hum", 25.5], ["mains hum", 15.63]], null, null, null, null, [["speech", 35.16], ["music", 15.23], ["hum", 9.49]]], "duration": [16.39, 6.31, 1.15, 0.9, 7.54, 1.7, 2.83, 3.05, 2.84, 0.73, 22.19, 2.63, -0.3, 0.26, 0.87, 5.2]} \ No newline at end of file diff --git a/annotations_filtered/wXYRFo4rrrw_filtered.json b/annotations_filtered/wXYRFo4rrrw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b665b383192788f96f135b7cd88e3ac7b665e98f --- /dev/null +++ b/annotations_filtered/wXYRFo4rrrw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.97], [23.0, 23.57], [31.0, 32.19], [33.0, 36.14], [41.0, 42.35], [47.0, 49.99], [50.0, 51.12], [72.0, 72.69]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 53.72, 0.0, 56.55, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.97, 0.57, 1.19, 3.14, 1.35, 2.99, 1.12, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/wXer1Hj8hR4_filtered.json b/annotations_filtered/wXer1Hj8hR4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e4cf7f0b1ad0e6cc29961fbf3380fb476562ce5 --- /dev/null +++ b/annotations_filtered/wXer1Hj8hR4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.42], [11.0, 12.48], [23.0, 23.8], [24.0, 25.15], [26.0, 26.32], [28.0, 28.81], [31.0, 31.55], [35.0, 35.02], [40.0, 41.34], [46.0, 47.26], [50.0, 50.62], [52.0, 52.64], [60.0, 61.25], [77.0, 78.61], [82.0, 82.85], [83.0, 85.31], [86.0, 86.44], [87.0, 89.67], [90.0, 95.0], [96.0, 97.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.98, 0.0, 56.03, 50.36, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 1.48, 0.8, 1.15, 0.32, 0.81, 0.55, 0.02, 1.34, 1.26, 0.62, 0.64, 1.25, 1.61, 0.85, 2.31, 0.44, 2.67, 5.0, 1.78]} \ No newline at end of file diff --git a/annotations_filtered/wXf_eaQcSdM_filtered.json b/annotations_filtered/wXf_eaQcSdM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..386c0c062296d3b14bb75837dd6000f4f71d979a --- /dev/null +++ b/annotations_filtered/wXf_eaQcSdM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.55], [53.0, 52.91], [65.0, 65.65], [67.0, 66.63], [75.0, 75.61], [77.0, 80.67], [126.0, 127.6]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.85, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.55, -0.09, 0.65, -0.37, 0.61, 3.67, 1.6]} \ No newline at end of file diff --git a/annotations_filtered/wXnYmZhdm04_filtered.json b/annotations_filtered/wXnYmZhdm04_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cf39e704105414aaaca478d4d9e31ac067f094d --- /dev/null +++ b/annotations_filtered/wXnYmZhdm04_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.39], [10.0, 12.14], [16.0, 19.43], [20.0, 19.55], [21.0, 21.47], [22.0, 23.08], [26.0, 25.96], [33.0, 45.5], [46.0, 45.76], [47.0, 47.09], [53.0, 53.45], [61.0, 62.5], [64.0, 70.39], [71.0, 71.36], [72.0, 72.17], [78.0, 79.12], [80.0, 81.14], [82.0, 82.95], [87.0, 89.02], [89.0, 91.79], [93.0, 101.46], [104.0, 110.25], [115.0, 116.45], [117.0, 116.82], [119.0, 119.5], [121.0, 121.09]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 99.95, 44.23, 0.0, 0.0, 0.0, 0.0, 33.18, 0.0, 0.0, 0.0, 0.0, 71.14, 0.0, 0.0, 0.0, 0.0, 0.0, 57.72, 29.44, 52.56, 66.03, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["sidetone", 26.99], ["speech", 21.59], ["animal", 8.58]], null, null, null, null, [["music", 62.02], ["speech", 7.04], ["grunt", 3.79]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 24.88], ["electric shaver, electric razor", 19.84], ["livestock, farm animals, working animals", 6.2]], null, null, null, null, null, null], "duration": [1.39, 2.14, 3.43, -0.45, 0.47, 1.08, -0.04, 12.5, -0.24, 0.09, 0.45, 1.5, 6.39, 0.36, 0.17, 1.12, 1.14, 0.95, 2.02, 2.79, 8.46, 6.25, 1.45, -0.18, 0.5, 0.09]} \ No newline at end of file diff --git a/annotations_filtered/wYEn-ZKSg_I_filtered.json b/annotations_filtered/wYEn-ZKSg_I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df9b1942a32668b88f370ca8308306b2d0b85f0c --- /dev/null +++ b/annotations_filtered/wYEn-ZKSg_I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.82], [6.0, 11.2], [17.0, 21.78], [24.0, 24.34], [26.0, 26.5], [28.0, 28.83], [30.0, 30.59], [33.0, 33.03], [35.0, 35.45], [38.0, 38.03], [41.0, 42.74], [45.0, 51.93], [53.0, 53.72], [55.0, 56.81], [58.0, 59.9], [61.0, 61.79], [67.0, 67.26], [69.0, 71.25], [72.0, 72.49], [74.0, 76.27], [79.0, 80.32], [82.0, 83.89], [85.0, 93.41], [96.0, 96.58], [99.0, 100.94], [110.0, 116.41], [117.0, 121.61], [123.0, 132.26], [133.0, 139.68], [140.0, 140.09], [144.0, 144.19], [150.0, 150.36], [155.0, 155.58], [164.0, 173.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 35.79, 65.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.97, 0.0, 0.0, 0.0, 0.0, 0.0, 81.17, 0.0, 59.77, 0.0, 0.0, 31.2, 0.0, 0.0, 32.62, 34.11, 35.18, 31.44, 0.0, 0.0, 0.0, 0.0, 37.85], "audiomae_on_audioset": [null, [["fly, housefly", 31.0], ["mosquito", 27.76], ["insect", 19.94]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 47.16], ["insect", 28.79], ["mosquito", 14.62]], null, null, [["theremin", 54.16], ["music", 31.83], ["musical instrument", 3.83]], [["theremin", 52.29], ["music", 24.89], ["musical instrument", 5.58]], [["music", 69.51], ["theremin", 10.0], ["musical instrument", 7.76]], [["music", 62.6], ["musical instrument", 6.18], ["speech", 2.94]], null, null, null, null, [["music", 22.6], ["speech", 19.46], ["frog", 9.57]]], "duration": [0.82, 5.2, 4.78, 0.34, 0.5, 0.83, 0.59, 0.03, 0.45, 0.03, 1.74, 6.93, 0.72, 1.81, 1.9, 0.79, 0.26, 2.25, 0.49, 2.27, 1.32, 1.89, 8.41, 0.58, 1.94, 6.41, 4.61, 9.26, 6.68, 0.09, 0.19, 0.36, 0.58, 9.8]} \ No newline at end of file diff --git a/annotations_filtered/wYMJal35N0o_filtered.json b/annotations_filtered/wYMJal35N0o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b15b51a714b0c94ba279e117db50567fb1b42dc --- /dev/null +++ b/annotations_filtered/wYMJal35N0o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[95.0, 94.85], [98.0, 104.38]], "keep_status": [false, false], "silence_prob": [0.0, 44.15], "audiomae_on_audioset": [null, [["hum", 42.48], ["mains hum", 22.71], ["whale vocalization", 12.35]]], "duration": [-0.15, 6.38]} \ No newline at end of file diff --git a/annotations_filtered/wYMfDxQdnUc_filtered.json b/annotations_filtered/wYMfDxQdnUc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..889e5d698adf88dd20692a80242ca6fc82aea13c --- /dev/null +++ b/annotations_filtered/wYMfDxQdnUc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.34], [6.0, 6.54], [16.0, 16.7], [20.0, 20.33], [22.0, 21.91], [24.0, 24.53], [26.0, 27.35], [30.0, 30.11], [32.0, 32.1], [43.0, 43.36], [46.0, 48.79], [53.0, 53.42], [54.0, 54.23], [55.0, 55.09], [56.0, 56.71], [60.0, 61.52], [66.0, 66.26], [68.0, 69.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 44.12], ["boing", 16.28], ["speech", 9.74]], null, null, null, null, null, null, null], "duration": [0.34, 0.54, 0.7, 0.33, -0.09, 0.53, 1.35, 0.11, 0.1, 0.36, 2.79, 0.42, 0.23, 0.09, 0.71, 1.52, 0.26, 1.77]} \ No newline at end of file diff --git a/annotations_filtered/wYSIce1SzFU_filtered.json b/annotations_filtered/wYSIce1SzFU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1dacc336dcb07be4b6bdddf62141e9e0a72253a --- /dev/null +++ b/annotations_filtered/wYSIce1SzFU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.32], [12.0, 14.91], [17.0, 109.61]], "keep_status": [false, false, false], "silence_prob": [71.29, 64.97, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [2.32, 2.91, 92.61]} \ No newline at end of file diff --git a/annotations_filtered/wYwlDchIasw_filtered.json b/annotations_filtered/wYwlDchIasw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..490aed1952e054639ec0b440fde51439079d1337 --- /dev/null +++ b/annotations_filtered/wYwlDchIasw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.18], [21.0, 21.29], [44.0, 44.12], [45.0, 47.97], [49.0, 50.16], [52.0, 53.59], [56.0, 57.4], [58.0, 63.51], [78.0, 78.17], [91.0, 92.21], [102.0, 102.41], [104.0, 108.16], [109.0, 111.27], [112.0, 113.26], [114.0, 113.95], [114.0, 114.94], [116.0, 117.71], [119.0, 119.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.77, 0.0, 0.0, 0.0, 67.0, 0.0, 0.0, 0.0, 76.04, 76.37, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 57.2], ["theremin", 16.44], ["speech", 12.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.18, 0.29, 0.12, 2.97, 1.16, 1.59, 1.4, 5.51, 0.17, 1.21, 0.41, 4.16, 2.27, 1.26, -0.05, 0.94, 1.71, 0.18]} \ No newline at end of file diff --git a/annotations_filtered/wZ30Qxv0vtI_filtered.json b/annotations_filtered/wZ30Qxv0vtI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eacb4a6273520d4172ffdb652e108a624b1926a4 --- /dev/null +++ b/annotations_filtered/wZ30Qxv0vtI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.04], [8.0, 8.29], [11.0, 18.76], [19.0, 18.86], [20.0, 31.09], [33.0, 33.56], [35.0, 49.57], [53.0, 55.29], [56.0, 56.94], [57.0, 58.01], [60.0, 60.0], [61.0, 62.04], [63.0, 114.12]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.84, 0.0, 32.32, 0.0, 32.24, 49.22, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 52.02], ["effects unit", 4.87], ["hum", 4.71]], null, [["music", 68.52], ["musical instrument", 5.56], ["trombone", 4.45]], null, [["music", 49.87], ["throbbing", 7.56], ["speech", 4.9]], [["music", 34.86], ["speech", 34.17], ["guitar", 4.53]], null, null, null, null, null], "duration": [1.04, 0.29, 7.76, -0.14, 11.09, 0.56, 14.57, 2.29, 0.94, 1.01, 0.0, 1.04, 51.12]} \ No newline at end of file diff --git a/annotations_filtered/wZTaXoogvDQ_filtered.json b/annotations_filtered/wZTaXoogvDQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8423f0066be79f6038d028e9188249b5b3b66ee2 --- /dev/null +++ b/annotations_filtered/wZTaXoogvDQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.48], [15.0, 19.84], [21.0, 25.89], [28.0, 33.32], [34.0, 37.56], [40.0, 41.44], [43.0, 45.87], [47.0, 48.34], [50.0, 50.41], [51.0, 52.22], [55.0, 55.8], [59.0, 60.54], [64.0, 64.02], [64.0, 65.53], [76.0, 77.63], [78.0, 83.96], [85.0, 88.1], [89.0, 102.22], [102.0, 106.39], [107.0, 108.99], [110.0, 111.87], [113.0, 114.67], [115.0, 117.51], [118.0, 121.31]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [53.22, 41.54, 54.23, 43.3, 63.64, 0.0, 64.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.89, 65.79, 44.34, 30.56, 0.0, 0.0, 0.0, 72.01, 51.28], "audiomae_on_audioset": [null, [["music", 31.56], ["throbbing", 17.33], ["hum", 15.56]], null, [["hum", 27.08], ["mains hum", 22.3], ["speech", 17.17]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 49.92], ["insect", 15.39], ["speech", 8.99]], [["speech", 54.33], ["fly, housefly", 7.5], ["mains hum", 4.8]], null, null, null, null, null], "duration": [3.48, 4.84, 4.89, 5.32, 3.56, 1.44, 2.87, 1.34, 0.41, 1.22, 0.8, 1.54, 0.02, 1.53, 1.63, 5.96, 3.1, 13.22, 4.39, 1.99, 1.87, 1.67, 2.51, 3.31]} \ No newline at end of file diff --git a/annotations_filtered/wZWNmL5VsIs_filtered.json b/annotations_filtered/wZWNmL5VsIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5ee387c30ad8d04b897430f152514ca7c55057d --- /dev/null +++ b/annotations_filtered/wZWNmL5VsIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.18], [9.0, 22.35], [27.0, 31.23], [39.0, 39.63], [41.0, 42.15], [43.0, 45.15], [56.0, 56.15], [59.0, 77.18], [82.0, 82.8], [90.0, 90.31], [92.0, 122.18], [136.0, 137.74], [141.0, 143.46], [153.0, 155.44], [159.0, 190.24], [196.0, 196.45], [197.0, 199.0], [200.0, 201.02], [202.0, 204.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 34.48, 36.31, 0.0, 0.0, 37.55, 0.0, 34.02, 0.0, 0.0, 0.0, 0.0, 34.75, 31.79, 0.0, 0.0, 65.2, 0.0, 37.88], "audiomae_on_audioset": [null, [["music", 71.29], ["speech", 8.74], ["synthesizer", 4.86]], [["music", 48.03], ["speech", 24.95], ["throbbing", 2.72]], null, null, [["music", 70.48], ["synthesizer", 7.29], ["throbbing", 7.17]], null, [["music", 40.71], ["speech", 38.95], ["quack", 7.92]], null, null, null, null, [["music", 57.49], ["throbbing", 11.76], ["speech", 6.45]], [["music", 35.09], ["throbbing", 20.84], ["speech", 9.81]], null, null, null, null, [["music", 43.92], ["hum", 14.98], ["mains hum", 10.45]]], "duration": [1.18, 13.35, 4.23, 0.63, 1.15, 2.15, 0.15, 18.18, 0.8, 0.31, 30.18, 1.74, 2.46, 2.44, 31.24, 0.45, 2.0, 1.02, 2.16]} \ No newline at end of file diff --git a/annotations_filtered/wZaCK0PDUMI_filtered.json b/annotations_filtered/wZaCK0PDUMI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94746b972e7f4dfde7d2c197f5ff958d824a27d2 --- /dev/null +++ b/annotations_filtered/wZaCK0PDUMI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.7], [7.0, 7.91], [20.0, 20.48], [21.0, 22.03], [27.0, 30.54], [31.0, 31.29], [34.0, 42.9], [44.0, 44.71], [45.0, 50.16], [52.0, 52.59], [54.0, 60.3], [61.0, 63.0], [64.0, 75.22], [76.0, 88.1], [92.0, 94.24], [94.0, 101.07], [103.0, 120.21]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.27, 0.0, 58.22, 0.0, 31.88, 0.0, 81.53, 99.87, 33.15, 31.74, 32.85, 33.37, 34.3], "audiomae_on_audioset": [null, null, null, null, [["speech", 19.03], ["music", 18.14], ["fly, housefly", 13.22]], null, null, null, [["speech", 58.97], ["music", 10.86], ["sidetone", 6.62]], null, null, null, [["speech", 21.18], ["music", 18.01], ["boing", 11.52]], [["music", 58.05], ["speech", 6.8], ["fart", 3.18]], [["music", 75.04], ["boing", 4.6], ["cacophony", 1.57]], [["music", 45.1], ["speech", 19.79], ["musical instrument", 5.23]], [["music", 43.68], ["speech", 11.85], ["hum", 5.12]]], "duration": [1.7, 0.91, 0.48, 1.03, 3.54, 0.29, 8.9, 0.71, 5.16, 0.59, 6.3, 2.0, 11.22, 12.1, 2.24, 7.07, 17.21]} \ No newline at end of file diff --git a/annotations_filtered/wZcRiRs1x-8_filtered.json b/annotations_filtered/wZcRiRs1x-8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9274f272a0ebd915710269d2952b2fafc769df9b --- /dev/null +++ b/annotations_filtered/wZcRiRs1x-8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 36.98], [38.0, 43.85], [45.0, 75.57], [76.0, 87.76], [89.0, 111.64], [116.0, 116.67], [122.0, 139.16]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [70.72, 67.38, 0.0, 61.18, 29.77, 0.0, 28.4], "audiomae_on_audioset": [null, null, null, null, [["music", 86.83], ["swing music", 2.99], ["funk", 1.34]], null, [["cattle, bovinae", 44.11], ["moo", 30.89], ["livestock, farm animals, working animals", 24.5]]], "duration": [16.98, 5.85, 30.57, 11.76, 22.64, 0.67, 17.16]} \ No newline at end of file diff --git a/annotations_filtered/wZheb1gbe58_filtered.json b/annotations_filtered/wZheb1gbe58_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4e3ea22e8bbb97db7880a44829a93edb58c0ae5 --- /dev/null +++ b/annotations_filtered/wZheb1gbe58_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.44], [12.0, 12.31], [13.0, 14.15]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.44, 0.31, 1.15]} \ No newline at end of file diff --git a/annotations_filtered/wZl5uWOpepU_filtered.json b/annotations_filtered/wZl5uWOpepU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a75b3118a28bf199b7edb3de4667edb503c8b7dc --- /dev/null +++ b/annotations_filtered/wZl5uWOpepU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.56], [28.0, 29.22], [39.0, 41.23], [60.0, 61.33], [77.0, 77.58]], "keep_status": [false, false, true, false, false], "silence_prob": [0.0, 0.0, 36.61, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 45.97], ["didgeridoo", 12.42], ["speech", 6.58]], null, null], "duration": [1.56, 1.22, 2.23, 1.33, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/w_5OidjXy5o_filtered.json b/annotations_filtered/w_5OidjXy5o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c0cac86111ba558449ec3d62a34505e890486b36 --- /dev/null +++ b/annotations_filtered/w_5OidjXy5o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 26.64], [33.0, 45.69], [48.0, 48.69], [49.0, 48.79], [49.0, 49.03], [49.0, 49.08], [51.0, 72.39], [73.0, 79.96], [81.0, 90.17], [92.0, 94.91], [96.0, 97.11], [98.0, 117.95], [118.0, 118.44], [118.0, 160.89], [161.0, 161.25], [161.0, 161.33], [161.0, 161.45]], "keep_status": [false, true, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [31.0, 31.21, 0.0, 0.0, 0.0, 0.0, 30.77, 31.67, 31.05, 33.95, 0.0, 31.29, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 29.03], ["throbbing", 23.99], ["mains hum", 19.27]], [["fly, housefly", 22.0], ["music", 20.35], ["buzz", 6.86]], null, null, null, null, [["hum", 36.1], ["music", 23.52], ["throbbing", 14.87]], [["hum", 31.29], ["throbbing", 19.84], ["mains hum", 18.16]], [["hum", 35.35], ["music", 21.01], ["throbbing", 14.85]], [["music", 18.36], ["cacophony", 16.2], ["hum", 10.09]], null, [["hum", 66.65], ["mains hum", 15.8], ["throbbing", 7.85]], null, null, null, null, null], "duration": [16.64, 12.69, 0.69, -0.21, 0.03, 0.08, 21.39, 6.96, 9.17, 2.91, 1.11, 19.95, 0.44, 42.89, 0.25, 0.33, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/w_92-vVfgrw_filtered.json b/annotations_filtered/w_92-vVfgrw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4002d6f0f47947fbb748fd8c899c5d3f884a593f --- /dev/null +++ b/annotations_filtered/w_92-vVfgrw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 33.18], [36.0, 36.78], [39.0, 40.1], [44.0, 45.42], [58.0, 58.62], [74.0, 75.41], [93.0, 93.06], [99.0, 99.03], [102.0, 120.34], [124.0, 132.95], [134.0, 133.95]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.46, 32.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 28.08], ["wind chime", 17.6], ["glockenspiel", 10.78]], [["music", 47.15], ["civil defense siren", 10.42], ["siren", 6.07]], null], "duration": [0.18, 0.78, 1.1, 1.42, 0.62, 1.41, 0.06, 0.03, 18.34, 8.95, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/w_e5kx3ONfs_filtered.json b/annotations_filtered/w_e5kx3ONfs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..185cd6eaa3fef1ca5ef47fe450429423362d9e67 --- /dev/null +++ b/annotations_filtered/w_e5kx3ONfs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.53], [15.0, 17.54], [19.0, 19.5], [21.0, 21.79], [23.0, 24.19], [25.0, 25.91], [27.0, 28.38], [31.0, 31.18], [34.0, 35.55], [37.0, 39.38], [41.0, 43.78], [46.0, 46.23], [49.0, 49.98], [52.0, 56.57], [59.0, 61.42], [64.0, 75.42], [78.0, 91.47], [93.0, 95.67], [97.0, 98.15], [102.0, 103.44], [105.0, 106.49]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 56.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.5, 41.16, 0.0, 0.0, 46.72, 43.53, 45.69, 62.68, 96.54, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 48.42], ["mains hum", 5.46], ["ambient music", 4.96]], [["livestock, farm animals, working animals", 32.02], ["cattle, bovinae", 28.95], ["moo", 21.85]], null, null, [["singing bowl", 36.42], ["music", 32.33], ["tubular bells", 6.41]], [["music", 27.66], ["singing bowl", 18.61], ["speech", 7.53]], [["music", 61.17], ["singing bowl", 10.91], ["bell", 6.01]], null, null, null, null, null], "duration": [1.53, 2.54, 0.5, 0.79, 1.19, 0.91, 1.38, 0.18, 1.55, 2.38, 2.78, 0.23, 0.98, 4.57, 2.42, 11.42, 13.47, 2.67, 1.15, 1.44, 1.49]} \ No newline at end of file diff --git a/annotations_filtered/w_tQqymkPdA_filtered.json b/annotations_filtered/w_tQqymkPdA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e48912e1c5ae0d75f13f6b20c117a2d11acba0bb --- /dev/null +++ b/annotations_filtered/w_tQqymkPdA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.21], [5.0, 6.44], [8.0, 10.15], [11.0, 12.16], [13.0, 14.22], [15.0, 17.54], [19.0, 20.53], [22.0, 23.01], [24.0, 36.73], [38.0, 39.95], [41.0, 42.42], [43.0, 45.94], [47.0, 47.98], [49.0, 50.62], [52.0, 51.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.97, 0.0, 34.38, 0.0, 0.0, 70.44, 0.0, 0.0, 71.0, 0.0, 0.0, 56.18, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 60.12], ["sidetone", 32.65], ["chirp tone", 1.27]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.21, 1.44, 2.15, 1.16, 1.22, 2.54, 1.53, 1.01, 12.73, 1.95, 1.42, 2.94, 0.98, 1.62, -0.34]} \ No newline at end of file diff --git a/annotations_filtered/wa1uJbTy6XE_filtered.json b/annotations_filtered/wa1uJbTy6XE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b616512aed5293d4cffbe113f3a983f2fe26c9e --- /dev/null +++ b/annotations_filtered/wa1uJbTy6XE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.63], [14.0, 18.18], [19.0, 30.43], [38.0, 60.37], [61.0, 62.61], [65.0, 79.39], [84.0, 149.72], [152.0, 152.41], [153.0, 155.19], [157.0, 158.14], [164.0, 164.96], [166.0, 168.0], [169.0, 171.59]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 31.49, 32.57, 31.84, 0.0, 32.92, 0.0, 0.0, 95.64, 0.0, 0.0, 40.29, 48.06], "audiomae_on_audioset": [null, [["speech", 59.83], ["music", 3.77], ["rumble", 2.68]], [["livestock, farm animals, working animals", 56.08], ["music", 15.93], ["cattle, bovinae", 10.82]], [["speech", 48.0], ["music", 24.54], ["buzz", 4.08]], null, [["music", 39.43], ["mains hum", 13.45], ["hum", 11.95]], null, null, null, null, null, [["fart", 19.31], ["mosquito", 10.85], ["hum", 10.6]], [["music", 80.44], ["hum", 2.17], ["musical instrument", 2.15]]], "duration": [1.63, 4.18, 11.43, 22.37, 1.61, 14.39, 65.72, 0.41, 2.19, 1.14, 0.96, 2.0, 2.59]} \ No newline at end of file diff --git a/annotations_filtered/wa5asCQrdPE_filtered.json b/annotations_filtered/wa5asCQrdPE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b648ce6f421f02cb3cd3f033bdce223dce0abf6d --- /dev/null +++ b/annotations_filtered/wa5asCQrdPE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 86.86]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [69.86]} \ No newline at end of file diff --git a/annotations_filtered/waE1U01kwxY_filtered.json b/annotations_filtered/waE1U01kwxY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f06580a25b850d69df531b9c1a10834ce3b1250 --- /dev/null +++ b/annotations_filtered/waE1U01kwxY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 15.9], [24.0, 24.78], [57.0, 59.02], [79.0, 80.89], [83.0, 85.62], [89.0, 92.3], [113.0, 113.44], [115.0, 115.08], [116.0, 116.31], [120.0, 120.87], [129.0, 128.9]], "keep_status": [false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [29.66, 0.0, 31.83, 0.0, 46.05, 38.58, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 78.93], ["drum machine", 7.01], ["sampler", 3.79]], null, [["music", 26.37], ["throbbing", 12.9], ["hum", 6.45]], null, [["sidetone", 94.04], ["music", 2.71], ["speech", 1.37]], [["speech", 52.53], ["shuffling cards", 9.57], ["fly, housefly", 2.76]], null, null, null, null, null], "duration": [7.9, 0.78, 2.02, 1.89, 2.62, 3.3, 0.44, 0.08, 0.31, 0.87, -0.1]} \ No newline at end of file diff --git a/annotations_filtered/wa_9eIwrEK8_filtered.json b/annotations_filtered/wa_9eIwrEK8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fbdb653bfa5675ce117fcdf553f4bdff2d879dd --- /dev/null +++ b/annotations_filtered/wa_9eIwrEK8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.67], [15.0, 22.91], [24.0, 41.91], [44.0, 46.8], [48.0, 69.87], [71.0, 71.56], [79.0, 141.84], [143.0, 142.79], [144.0, 144.78], [145.0, 146.42], [148.0, 148.49], [149.0, 151.09], [152.0, 153.54], [156.0, 164.52]], "keep_status": [true, true, true, true, false, false, false, false, false, false, false, true, false, true], "silence_prob": [30.41, 30.78, 29.78, 28.56, 30.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.43, 0.0, 30.52], "audiomae_on_audioset": [[["music", 46.86], ["speech", 15.03], ["didgeridoo", 5.69]], [["music", 38.03], ["speech", 9.27], ["throbbing", 5.29]], [["music", 27.16], ["buzz", 18.54], ["didgeridoo", 7.37]], [["music", 36.68], ["mains hum", 18.89], ["hum", 10.97]], [["speech", 38.93], ["music", 38.07], ["explosion", 3.18]], null, null, null, null, null, null, [["music", 33.35], ["speech", 22.65], ["whale vocalization", 4.14]], null, [["music", 57.24], ["gunshot, gunfire", 5.17], ["speech", 4.45]]], "duration": [3.67, 7.91, 17.91, 2.8, 21.87, 0.56, 62.84, -0.21, 0.78, 1.42, 0.49, 2.09, 1.54, 8.52]} \ No newline at end of file diff --git a/annotations_filtered/waeNIUB5wz4_filtered.json b/annotations_filtered/waeNIUB5wz4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5a264f5eafe4ba1061bda8d1b909fe5f59a1d24 --- /dev/null +++ b/annotations_filtered/waeNIUB5wz4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.49], [14.0, 14.61], [19.0, 19.01], [28.0, 30.25], [35.0, 36.85], [37.0, 38.2], [39.0, 64.66], [69.0, 78.7], [79.0, 88.28], [96.0, 100.85], [101.0, 103.08], [105.0, 113.09], [116.0, 119.25], [122.0, 122.67], [125.0, 126.22], [127.0, 127.3], [128.0, 128.75]], "keep_status": [true, false, false, true, false, false, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [33.71, 0.0, 0.0, 40.06, 0.0, 0.0, 33.45, 31.37, 31.98, 31.57, 35.4, 33.48, 87.55, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 45.44], ["boing", 6.89], ["musical instrument", 5.14]], null, null, [["cattle, bovinae", 12.29], ["moo", 11.0], ["noise", 10.32]], null, null, [["music", 50.21], ["sidetone", 22.2], ["throbbing", 6.28]], [["music", 30.78], ["sidetone", 24.56], ["speech", 15.87]], [["music", 49.58], ["sidetone", 7.13], ["speech", 5.53]], [["music", 50.67], ["speech", 19.7], ["sidetone", 11.0]], [["music", 60.26], ["speech", 15.45], ["musical instrument", 3.12]], [["fart", 30.71], ["music", 23.07], ["throbbing", 10.24]], null, null, null, null, null], "duration": [2.49, 0.61, 0.01, 2.25, 1.85, 1.2, 25.66, 9.7, 9.28, 4.85, 2.08, 8.09, 3.25, 0.67, 1.22, 0.3, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/wb1HDnYPPoo_filtered.json b/annotations_filtered/wb1HDnYPPoo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a2bd69357e81267d128f9d6b8a66d484de86024 --- /dev/null +++ b/annotations_filtered/wb1HDnYPPoo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 127.03]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [115.03]} \ No newline at end of file diff --git a/annotations_filtered/wbMLxj0lKAU_filtered.json b/annotations_filtered/wbMLxj0lKAU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dbe12bef9554d662aa3453ce7fa5f692a734cef6 --- /dev/null +++ b/annotations_filtered/wbMLxj0lKAU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 15.94], [16.0, 27.68], [28.0, 90.76]], "keep_status": [false, false, false], "silence_prob": [96.42, 98.59, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [9.94, 11.68, 62.76]} \ No newline at end of file diff --git a/annotations_filtered/wbROoMNi8Ho_filtered.json b/annotations_filtered/wbROoMNi8Ho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e52ebfca14b49c482205bbde5ce76a751021905 --- /dev/null +++ b/annotations_filtered/wbROoMNi8Ho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.73], [5.0, 5.27], [6.0, 27.95], [30.0, 34.57], [35.0, 52.19], [53.0, 55.16], [56.0, 61.6], [62.0, 65.75], [66.0, 72.25], [75.0, 76.15], [76.0, 85.7], [86.0, 88.75], [90.0, 92.3], [94.0, 95.2], [96.0, 99.94], [100.0, 105.41], [107.0, 113.63], [115.0, 117.53], [119.0, 128.92], [134.0, 138.55], [140.0, 139.95], [140.0, 140.02], [141.0, 144.75], [148.0, 151.04], [155.0, 157.74], [158.0, 169.16], [171.0, 176.22], [177.0, 184.42]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 55.18, 54.5, 39.3, 100.0, 100.0, 99.4, 73.97, 0.0, 62.78, 99.8, 99.97, 0.0, 98.93, 49.64, 92.15, 53.04, 42.91, 88.83, 0.0, 0.0, 99.71, 88.1, 98.01, 42.04, 99.56, 99.96], "audiomae_on_audioset": [null, null, null, null, [["speech", 20.44], ["fly, housefly", 9.7], ["music", 9.57]], null, null, null, null, null, null, null, null, null, null, [["speech", 79.69], ["telephone", 10.38], ["radio", 4.71]], null, null, [["speech", 45.45], ["bouncing", 7.42], ["boing", 4.1]], null, null, null, null, null, null, [["speech", 45.23], ["music", 26.65], ["crack", 17.39]], null, null], "duration": [1.73, 0.27, 21.95, 4.57, 17.19, 2.16, 5.6, 3.75, 6.25, 1.15, 9.7, 2.75, 2.3, 1.2, 3.94, 5.41, 6.63, 2.53, 9.92, 4.55, -0.05, 0.02, 3.75, 3.04, 2.74, 11.16, 5.22, 7.42]} \ No newline at end of file diff --git a/annotations_filtered/wbVpwsKbFCU_filtered.json b/annotations_filtered/wbVpwsKbFCU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c56460d89cfb81f8fa7716356738a123da425b5e --- /dev/null +++ b/annotations_filtered/wbVpwsKbFCU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.09], [10.0, 11.06], [12.0, 23.11], [25.0, 28.36], [29.0, 34.4], [35.0, 35.41]], "keep_status": [false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 30.64, 30.43, 44.55, 0.0], "audiomae_on_audioset": [null, null, [["music", 80.77], ["electronic music", 3.46], ["techno", 3.0]], [["music", 73.39], ["electronic music", 7.23], ["throbbing", 2.26]], [["music", 27.62], ["foghorn", 23.11], ["speech", 19.07]], null], "duration": [1.09, 1.06, 11.11, 3.36, 5.4, 0.41]} \ No newline at end of file diff --git a/annotations_filtered/wbccgEaJudM_filtered.json b/annotations_filtered/wbccgEaJudM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e04885406037f44327566a24c935eba62479c741 --- /dev/null +++ b/annotations_filtered/wbccgEaJudM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 33.29], [37.0, 36.91], [37.0, 39.99], [44.0, 45.33], [46.0, 51.19], [53.0, 54.92], [56.0, 57.91], [60.0, 63.48], [64.0, 69.62], [71.0, 75.76], [76.0, 105.66], [112.0, 124.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [94.22, 0.0, 64.86, 0.0, 73.51, 0.0, 0.0, 94.22, 79.07, 83.16, 42.81, 32.68], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 49.63], ["speech", 8.2], ["didgeridoo", 5.94]], [["speech", 36.85], ["hum", 6.88], ["car", 6.33]]], "duration": [2.29, -0.09, 2.99, 1.33, 5.19, 1.92, 1.91, 3.48, 5.62, 4.76, 29.66, 12.5]} \ No newline at end of file diff --git a/annotations_filtered/wbt-sAOjnQQ_filtered.json b/annotations_filtered/wbt-sAOjnQQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8a92dcf235b79e07ff84e79e757df0f808dd712 --- /dev/null +++ b/annotations_filtered/wbt-sAOjnQQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.01], [5.0, 5.76], [8.0, 9.1], [13.0, 13.78], [14.0, 14.32], [19.0, 18.87], [20.0, 20.8], [22.0, 22.37], [24.0, 24.51], [33.0, 33.24], [35.0, 35.67], [42.0, 42.84], [52.0, 53.96], [64.0, 64.12], [65.0, 65.7], [71.0, 71.39], [79.0, 78.85], [88.0, 88.37], [97.0, 97.09], [105.0, 105.12], [107.0, 108.14], [108.0, 110.73], [115.0, 115.53], [117.0, 117.39], [140.0, 140.9], [141.0, 141.15], [144.0, 144.78], [151.0, 151.14], [152.0, 152.27], [159.0, 159.14], [161.0, 161.99], [164.0, 164.86], [166.0, 166.11], [170.0, 170.21], [178.0, 178.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [93.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.01, 0.76, 1.1, 0.78, 0.32, -0.13, 0.8, 0.37, 0.51, 0.24, 0.67, 0.84, 1.96, 0.12, 0.7, 0.39, -0.15, 0.37, 0.09, 0.12, 1.14, 2.73, 0.53, 0.39, 0.9, 0.15, 0.78, 0.14, 0.27, 0.14, 0.99, 0.86, 0.11, 0.21, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/wbwXHxqxDwc_filtered.json b/annotations_filtered/wbwXHxqxDwc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70c480f16eef32ec4f76da2b3b3f08fbbda21cc4 --- /dev/null +++ b/annotations_filtered/wbwXHxqxDwc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.82], [24.0, 23.75], [24.0, 25.86], [32.0, 42.74], [44.0, 45.71], [47.0, 47.06], [48.0, 48.37], [49.0, 51.22], [55.0, 55.53], [57.0, 57.92], [58.0, 59.22], [61.0, 63.56], [66.0, 66.24], [67.0, 68.22], [70.0, 70.36], [71.0, 71.32], [72.0, 72.94], [74.0, 77.21], [92.0, 101.04], [105.0, 106.79], [107.0, 111.3], [114.0, 114.56], [117.0, 118.4], [120.0, 120.88], [122.0, 129.19], [129.0, 133.73], [135.0, 135.65], [136.0, 136.53], [138.0, 138.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 57.4, 0.0, 0.0, 0.0, 94.81, 0.0, 0.0, 0.0, 84.07, 0.0, 0.0, 0.0, 0.0, 0.0, 80.29, 37.2, 0.0, 36.39, 0.0, 0.0, 0.0, 37.57, 48.1, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.15], ["hum", 13.36], ["radio", 8.54]], null, [["speech", 52.04], ["radio", 30.03], ["sidetone", 5.61]], null, null, null, [["noise", 40.09], ["sidetone", 25.25], ["speech", 7.17]], [["whale vocalization", 75.97], ["mains hum", 6.65], ["hum", 2.74]], null, null, null], "duration": [0.82, -0.25, 1.86, 10.74, 1.71, 0.06, 0.37, 2.22, 0.53, 0.92, 1.22, 2.56, 0.24, 1.22, 0.36, 0.32, 0.94, 3.21, 9.04, 1.79, 4.3, 0.56, 1.4, 0.88, 7.19, 4.73, 0.65, 0.53, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/wcenhpP37sg_filtered.json b/annotations_filtered/wcenhpP37sg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2001d17e31a61453d46f56f6e795c6c015f41579 --- /dev/null +++ b/annotations_filtered/wcenhpP37sg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.34], [2.0, 3.89], [5.0, 7.79], [10.0, 11.1], [13.0, 15.96], [17.0, 19.13], [20.0, 24.26], [27.0, 27.41], [29.0, 29.54], [31.0, 31.6], [34.0, 36.19], [38.0, 38.74], [42.0, 43.21], [44.0, 45.49], [46.0, 48.03], [53.0, 53.96], [54.0, 68.52], [70.0, 70.51], [72.0, 71.95], [73.0, 74.11], [77.0, 78.71], [80.0, 85.38], [86.0, 88.18], [91.0, 93.73], [95.0, 95.69], [98.0, 99.74], [102.0, 104.5], [106.0, 109.85], [111.0, 113.68], [114.0, 117.95], [119.0, 122.76], [124.0, 125.42], [129.0, 150.79], [161.0, 166.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 100.0, 0.0, 99.98, 100.0, 100.0, 0.0, 0.0, 0.0, 93.76, 0.0, 0.0, 0.0, 55.31, 0.0, 45.56, 0.0, 0.0, 0.0, 0.0, 95.23, 43.64, 78.55, 0.0, 0.0, 94.95, 82.97, 97.83, 52.98, 74.76, 0.0, 33.19, 29.15], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.7], ["applause", 5.01], ["musical instrument", 2.64]], null, null, null, null, null, [["music", 28.67], ["speech", 15.34], ["whale vocalization", 11.91]], null, null, null, null, null, null, null, null, null, [["music", 57.67], ["synthesizer", 11.69], ["theremin", 10.58]], [["music", 18.24], ["gunshot, gunfire", 13.19], ["speech", 8.93]]], "duration": [0.34, 1.89, 2.79, 1.1, 2.96, 2.13, 4.26, 0.41, 0.54, 0.6, 2.19, 0.74, 1.21, 1.49, 2.03, 0.96, 14.52, 0.51, -0.05, 1.11, 1.71, 5.38, 2.18, 2.73, 0.69, 1.74, 2.5, 3.85, 2.68, 3.95, 3.76, 1.42, 21.79, 5.55]} \ No newline at end of file diff --git a/annotations_filtered/wcjCEUeC8nk_filtered.json b/annotations_filtered/wcjCEUeC8nk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6492c5a32507fc43769ec4e4abf5bc8049dbe912 --- /dev/null +++ b/annotations_filtered/wcjCEUeC8nk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.46], [9.0, 15.94], [16.0, 23.26], [24.0, 24.49], [29.0, 29.4], [36.0, 36.83], [37.0, 39.04], [40.0, 45.33], [47.0, 51.29], [54.0, 69.75], [72.0, 73.87], [75.0, 76.81], [78.0, 78.54], [79.0, 79.32], [84.0, 136.73], [138.0, 139.4], [141.0, 157.28]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 71.0, 36.2, 0.0, 0.0, 0.0, 62.37, 99.05, 48.52, 33.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.52], "audiomae_on_audioset": [null, null, [["speech", 64.5], ["grunt", 6.28], ["beatboxing", 5.17]], null, null, null, null, null, [["speech", 37.37], ["music", 5.14], ["fart", 4.78]], [["music", 67.91], ["speech", 4.45], ["throbbing", 4.09]], null, null, null, null, null, null, [["music", 54.71], ["speech", 11.21], ["theremin", 7.14]]], "duration": [1.46, 6.94, 7.26, 0.49, 0.4, 0.83, 2.04, 5.33, 4.29, 15.75, 1.87, 1.81, 0.54, 0.32, 52.73, 1.4, 16.28]} \ No newline at end of file diff --git a/annotations_filtered/wcztDZ13TLI_filtered.json b/annotations_filtered/wcztDZ13TLI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f462e2b6afd48be334b1553e19de1f4f6cdaabcb --- /dev/null +++ b/annotations_filtered/wcztDZ13TLI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.71], [15.0, 15.6], [41.0, 42.99], [45.0, 45.2], [48.0, 48.09], [81.0, 81.68], [82.0, 82.95], [84.0, 84.6], [88.0, 88.57], [90.0, 90.75], [91.0, 92.15], [92.0, 94.31], [96.0, 96.94], [97.0, 97.63], [102.0, 103.17], [104.0, 105.44], [107.0, 107.89], [110.0, 111.37], [114.0, 114.56], [117.0, 117.37], [121.0, 123.03], [128.0, 128.66], [132.0, 133.76], [136.0, 136.76], [137.0, 137.49], [141.0, 140.75], [143.0, 143.48], [146.0, 146.31], [147.0, 149.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [41.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.31], "audiomae_on_audioset": [[["speech", 61.14], ["music", 11.25], ["theremin", 3.13]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.71, 0.6, 1.99, 0.2, 0.09, 0.68, 0.95, 0.6, 0.57, 0.75, 1.15, 2.31, 0.94, 0.63, 1.17, 1.44, 0.89, 1.37, 0.56, 0.37, 2.03, 0.66, 1.76, 0.76, 0.49, -0.25, 0.48, 0.31, 2.12]} \ No newline at end of file diff --git a/annotations_filtered/wdAXjMj6mfU_filtered.json b/annotations_filtered/wdAXjMj6mfU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..658563bb970f0fa4d06aa2d5abfa7da1455f624d --- /dev/null +++ b/annotations_filtered/wdAXjMj6mfU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.0], [4.0, 5.9], [7.0, 7.33], [9.0, 10.42], [12.0, 12.68], [18.0, 18.79], [21.0, 20.85], [23.0, 23.67], [25.0, 26.13], [32.0, 51.83], [55.0, 54.92], [56.0, 58.87], [59.0, 61.84], [62.0, 97.85], [99.0, 100.85], [102.0, 104.23], [105.0, 106.39], [108.0, 130.77]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.14, 0.0, 31.2, 30.11, 0.0, 0.0, 95.51, 0.0, 42.65], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 30.51], ["cowbell", 20.63], ["music", 13.68]], null, [["music", 67.12], ["speech", 2.55], ["throbbing", 2.38]], [["music", 48.62], ["speech", 16.76], ["whack, thwack", 4.53]], null, null, null, null, [["music", 62.49], ["clang", 5.09], ["inside, small room", 2.4]]], "duration": [0.0, 1.9, 0.33, 1.42, 0.68, 0.79, -0.15, 0.67, 1.13, 19.83, -0.08, 2.87, 2.84, 35.85, 1.85, 2.23, 1.39, 22.77]} \ No newline at end of file diff --git a/annotations_filtered/wdB2lzxIfGg_filtered.json b/annotations_filtered/wdB2lzxIfGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6c857ed006104e60f18a087f10aa7fb45683288 --- /dev/null +++ b/annotations_filtered/wdB2lzxIfGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.75], [13.0, 14.52], [18.0, 18.05], [21.0, 21.27], [23.0, 24.34], [27.0, 27.43], [28.0, 29.05], [31.0, 32.1], [34.0, 35.67], [37.0, 38.13], [40.0, 40.91], [42.0, 42.47], [44.0, 44.58], [48.0, 49.15], [53.0, 52.84], [57.0, 58.78], [61.0, 61.55], [63.0, 62.88], [67.0, 67.36], [69.0, 70.68], [73.0, 73.85], [79.0, 80.01], [81.0, 82.09], [84.0, 84.43], [85.0, 85.62], [86.0, 86.22], [89.0, 89.92], [91.0, 92.53], [93.0, 94.17], [96.0, 97.09], [98.0, 99.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.75, 1.52, 0.05, 0.27, 1.34, 0.43, 1.05, 1.1, 1.67, 1.13, 0.91, 0.47, 0.58, 1.15, -0.16, 1.78, 0.55, -0.12, 0.36, 1.68, 0.85, 1.01, 1.09, 0.43, 0.62, 0.22, 0.92, 1.53, 1.17, 1.09, 1.96]} \ No newline at end of file diff --git a/annotations_filtered/wdS1l__SWms_filtered.json b/annotations_filtered/wdS1l__SWms_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67cf93df51e32a873d79996f48079dd515e0b87f --- /dev/null +++ b/annotations_filtered/wdS1l__SWms_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 14.79], [19.0, 40.58], [42.0, 44.98], [48.0, 81.99], [83.0, 83.07], [84.0, 84.48], [85.0, 91.49], [100.0, 100.08], [100.0, 108.87], [114.0, 119.25], [120.0, 121.07], [123.0, 122.76], [125.0, 125.54], [126.0, 126.6], [128.0, 128.44], [130.0, 130.94], [136.0, 144.22], [146.0, 172.35]], "keep_status": [true, false, true, false, false, false, false, false, true, true, false, false, false, false, false, false, true, true], "silence_prob": [42.88, 31.19, 36.8, 0.0, 0.0, 0.0, 31.44, 0.0, 33.58, 42.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.05, 32.2], "audiomae_on_audioset": [[["music", 36.98], ["speech", 21.4], ["theremin", 5.32]], [["music", 85.67], ["musical instrument", 2.89], ["brass instrument", 2.02]], [["music", 42.69], ["musical instrument", 5.84], ["hum", 4.93]], null, null, null, [["speech", 32.7], ["fart", 22.02], ["music", 18.27]], null, [["speech", 20.83], ["didgeridoo", 18.68], ["music", 15.78]], [["music", 40.28], ["theremin", 9.54], ["whack, thwack", 6.79]], null, null, null, null, null, null, [["music", 45.94], ["speech", 14.4], ["foghorn", 7.23]], [["music", 61.58], ["musical instrument", 4.2], ["theremin", 3.63]]], "duration": [8.79, 21.58, 2.98, 33.99, 0.07, 0.48, 6.49, 0.08, 8.87, 5.25, 1.07, -0.24, 0.54, 0.6, 0.44, 0.94, 8.22, 26.35]} \ No newline at end of file diff --git a/annotations_filtered/wdVtcHMYAM4_filtered.json b/annotations_filtered/wdVtcHMYAM4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aed65552475803c2a090608290bb8e03958d297d --- /dev/null +++ b/annotations_filtered/wdVtcHMYAM4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.94], [3.0, 27.31], [28.0, 28.39], [30.0, 30.32], [32.0, 33.2], [35.0, 35.53], [36.0, 67.31], [71.0, 73.18], [74.0, 76.17], [78.0, 92.33], [101.0, 100.72], [101.0, 102.39]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 42.81, 0.0, 0.0, 0.0, 0.0, 0.0, 75.23, 48.23, 37.97, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 35.25], ["breaking", 26.7], ["thunk", 12.93]], null, null, null, null, null, null, [["frog", 27.76], ["music", 24.01], ["sidetone", 10.19]], [["music", 62.72], ["speech", 13.82], ["echo", 2.32]], null, null], "duration": [-0.06, 24.31, 0.39, 0.32, 1.2, 0.53, 31.31, 2.18, 2.17, 14.33, -0.28, 1.39]} \ No newline at end of file diff --git a/annotations_filtered/wdcRrpMHIGM_filtered.json b/annotations_filtered/wdcRrpMHIGM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4eeb61164c312f49cfca5c8be898d4d12370c9d7 --- /dev/null +++ b/annotations_filtered/wdcRrpMHIGM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.68], [6.0, 7.11], [8.0, 9.71], [11.0, 13.1], [15.0, 20.16], [21.0, 23.99], [25.0, 25.08], [27.0, 29.51], [34.0, 40.15], [42.0, 43.12], [44.0, 45.42], [46.0, 48.17], [50.0, 55.27], [57.0, 62.97], [63.0, 112.5], [114.0, 116.38], [120.0, 120.9], [122.0, 123.69], [125.0, 180.49], [183.0, 184.08], [185.0, 185.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.1, 0.0, 0.0, 35.88, 32.61, 37.37, 0.0, 29.84, 42.24, 0.0, 0.0, 34.6, 29.01, 30.38, 0.0, 76.53, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 30.98], ["mains hum", 27.74], ["speech", 16.46]], null, null, [["mains hum", 48.44], ["hum", 25.09], ["music", 8.9]], [["music", 40.74], ["mains hum", 20.32], ["hum", 20.07]], [["mains hum", 35.43], ["hum", 22.75], ["music", 15.08]], null, [["music", 71.94], ["didgeridoo", 7.28], ["theremin", 2.5]], [["music", 56.85], ["hum", 9.96], ["didgeridoo", 7.47]], null, null, [["speech", 26.72], ["mains hum", 26.59], ["hum", 17.16]], [["music", 71.58], ["reverberation", 4.69], ["scary music", 3.13]], [["music", 50.8], ["speech", 21.02], ["mains hum", 5.22]], null, null, null, null, null, null, null], "duration": [3.68, 1.11, 1.71, 2.1, 5.16, 2.99, 0.08, 2.51, 6.15, 1.12, 1.42, 2.17, 5.27, 5.97, 49.5, 2.38, 0.9, 1.69, 55.49, 1.08, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/wdrhl_I3-E8_filtered.json b/annotations_filtered/wdrhl_I3-E8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..adc99662db66730c8abe2165d705866965e7041f --- /dev/null +++ b/annotations_filtered/wdrhl_I3-E8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.14], [10.0, 9.86], [10.0, 11.26], [12.0, 11.99], [14.0, 14.99], [16.0, 16.75], [17.0, 18.23], [19.0, 20.22], [22.0, 23.21], [25.0, 41.84], [42.0, 43.66], [46.0, 46.74], [52.0, 52.0], [62.0, 62.78], [65.0, 66.11], [67.0, 68.44], [71.0, 71.51], [72.0, 72.47], [75.0, 76.23], [76.0, 76.37], [76.0, 76.47], [84.0, 83.81], [87.0, 87.79], [89.0, 90.66], [95.0, 95.91], [97.0, 98.14], [103.0, 104.19], [106.0, 106.12], [109.0, 109.7], [113.0, 113.56], [114.0, 114.51], [117.0, 117.17], [122.0, 121.86], [128.0, 128.46], [130.0, 137.13], [139.0, 142.74], [144.0, 146.79], [147.0, 147.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.5, 43.96, 85.54, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 87.53], ["telephone", 4.03], ["telephone dialing, dtmf", 1.3]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 69.3], ["music", 4.38], ["hum", 3.94]], [["music", 26.91], ["frog", 8.29], ["animal", 7.88]], null, null], "duration": [1.14, -0.14, 1.26, -0.01, 0.99, 0.75, 1.23, 1.22, 1.21, 16.84, 1.66, 0.74, 0.0, 0.78, 1.11, 1.44, 0.51, 0.47, 1.23, 0.37, 0.47, -0.19, 0.79, 1.66, 0.91, 1.14, 1.19, 0.12, 0.7, 0.56, 0.51, 0.17, -0.14, 0.46, 7.13, 3.74, 2.79, 0.8]} \ No newline at end of file diff --git a/annotations_filtered/weCxCxIIjHA_filtered.json b/annotations_filtered/weCxCxIIjHA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..93efbc55ebef78c5c56adb214d1e2cebd0ae6863 --- /dev/null +++ b/annotations_filtered/weCxCxIIjHA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.27], [5.0, 6.18], [16.0, 21.0]], "keep_status": [false, false, true], "silence_prob": [0.0, 0.0, 46.33], "audiomae_on_audioset": [null, null, [["music", 41.7], ["hum", 11.31], ["speech", 9.72]]], "duration": [1.27, 1.18, 5.0]} \ No newline at end of file diff --git a/annotations_filtered/weDm19eMl8Y_filtered.json b/annotations_filtered/weDm19eMl8Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09476a91355f5404abe037e5feb084f33dbe879c --- /dev/null +++ b/annotations_filtered/weDm19eMl8Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 17.32], [19.0, 31.82], [42.0, 43.01], [45.0, 45.39], [46.0, 53.62], [55.0, 56.49], [58.0, 59.05], [60.0, 60.94], [61.0, 63.09], [65.0, 69.74], [70.0, 70.85], [72.0, 74.56], [76.0, 76.59], [79.0, 80.2], [84.0, 90.02], [91.0, 91.5], [98.0, 98.73], [102.0, 106.61], [111.0, 112.01], [114.0, 116.19], [118.0, 118.25], [120.0, 121.66], [123.0, 125.42]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false, false, true, false, true, false, false, true], "silence_prob": [30.42, 30.26, 0.0, 0.0, 46.57, 0.0, 0.0, 0.0, 44.81, 40.92, 0.0, 54.63, 0.0, 0.0, 40.4, 0.0, 0.0, 36.72, 0.0, 38.84, 0.0, 0.0, 37.13], "audiomae_on_audioset": [[["music", 85.33], ["didgeridoo", 2.16], ["choir", 2.03]], [["music", 81.3], ["didgeridoo", 6.02], ["theremin", 1.3]], null, null, [["hum", 30.26], ["mains hum", 25.92], ["electric shaver, electric razor", 17.6]], null, null, null, [["speech", 15.71], ["music", 13.23], ["gears", 5.77]], [["speech", 30.66], ["hum", 13.3], ["music", 10.83]], null, null, null, null, [["music", 35.98], ["mains hum", 20.62], ["hum", 11.61]], null, null, [["siren", 18.53], ["fire engine, fire truck (siren)", 15.46], ["vehicle", 13.81]], null, [["mains hum", 23.26], ["hum", 22.13], ["whale vocalization", 21.8]], null, null, [["music", 57.71], ["singing", 5.66], ["musical instrument", 4.01]]], "duration": [14.32, 12.82, 1.01, 0.39, 7.62, 1.49, 1.05, 0.94, 2.09, 4.74, 0.85, 2.56, 0.59, 1.2, 6.02, 0.5, 0.73, 4.61, 1.01, 2.19, 0.25, 1.66, 2.42]} \ No newline at end of file diff --git a/annotations_filtered/weEay_Y4EeE_filtered.json b/annotations_filtered/weEay_Y4EeE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d94dab36a48dd25b413f0dfffb5509735eb2bf48 --- /dev/null +++ b/annotations_filtered/weEay_Y4EeE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 35.34], [36.0, 51.41], [52.0, 52.2]], "keep_status": [false, false, false], "silence_prob": [97.64, 83.7, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [8.34, 15.41, 0.2]} \ No newline at end of file diff --git a/annotations_filtered/weHHBdmI_Jw_filtered.json b/annotations_filtered/weHHBdmI_Jw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12547f2060e6831e9a982d4d76203fe8f8d4469b --- /dev/null +++ b/annotations_filtered/weHHBdmI_Jw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.75], [22.0, 26.57], [28.0, 27.94], [30.0, 39.75], [42.0, 49.91], [54.0, 71.05], [71.0, 81.45], [84.0, 97.09], [99.0, 100.75], [102.0, 110.42], [113.0, 115.84], [117.0, 117.49], [118.0, 119.06], [124.0, 127.2]], "keep_status": [false, true, false, true, true, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 32.99, 0.0, 31.12, 31.79, 31.84, 30.93, 36.41, 0.0, 71.14, 81.53, 0.0, 0.0, 41.42], "audiomae_on_audioset": [null, [["music", 50.64], ["boing", 13.72], ["throbbing", 3.89]], null, [["speech", 25.25], ["vehicle", 9.61], ["music", 8.57]], [["speech", 46.01], ["music", 8.56], ["hum", 8.38]], [["speech", 35.95], ["music", 27.11], ["fart", 8.11]], [["speech", 48.35], ["music", 29.61], ["explosion", 1.94]], [["music", 58.71], ["noise", 7.06], ["synthesizer", 5.2]], null, null, null, null, null, [["music", 31.03], ["speech", 11.22], ["theremin", 6.22]]], "duration": [1.75, 4.57, -0.06, 9.75, 7.91, 17.05, 10.45, 13.09, 1.75, 8.42, 2.84, 0.49, 1.06, 3.2]} \ No newline at end of file diff --git a/annotations_filtered/weTmdGoN_SQ_filtered.json b/annotations_filtered/weTmdGoN_SQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7c6e731ae03332a069594641676768f47a483c3 --- /dev/null +++ b/annotations_filtered/weTmdGoN_SQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 4.09], [5.0, 7.06], [10.0, 10.83], [14.0, 15.75], [21.0, 22.96], [24.0, 31.11], [37.0, 36.98], [40.0, 40.86], [43.0, 43.44], [46.0, 48.78], [52.0, 53.59], [56.0, 56.84], [59.0, 61.48], [63.0, 67.05], [68.0, 78.07], [84.0, 83.76], [86.0, 86.1], [93.0, 93.97]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [44.15, 99.9, 0.0, 0.0, 0.0, 39.02, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 45.98, 86.82, 71.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["thunk", 53.74], ["music", 6.05], ["hum", 3.73]], null, null, null, null, [["speech", 82.02], ["sidetone", 5.29], ["music", 3.48]], null, null, null, null, null, null, [["tuning fork", 49.73], ["synthesizer", 9.69], ["music", 8.36]], null, null, null, null, null], "duration": [4.09, 2.06, 0.83, 1.75, 1.96, 7.11, -0.02, 0.86, 0.44, 2.78, 1.59, 0.84, 2.48, 4.05, 10.07, -0.24, 0.1, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/wek_o4V_T00_filtered.json b/annotations_filtered/wek_o4V_T00_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..211b5cfcb0d84ae6cfa2b2ba0341ed2091920d68 --- /dev/null +++ b/annotations_filtered/wek_o4V_T00_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.4], [15.0, 25.12], [26.0, 25.93], [28.0, 47.6], [50.0, 64.94], [67.0, 75.2], [83.0, 86.85], [92.0, 93.28]], "keep_status": [false, false, false, false, false, false, true, false], "silence_prob": [54.97, 51.23, 0.0, 56.78, 60.23, 55.39, 29.59, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 58.73], ["musical instrument", 3.24], ["boing", 2.49]], null], "duration": [2.4, 10.12, -0.07, 19.6, 14.94, 8.2, 3.85, 1.28]} \ No newline at end of file diff --git a/annotations_filtered/wf-gIUYRCyk_filtered.json b/annotations_filtered/wf-gIUYRCyk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..178350336dfac772f153cfe3bf7e546f9d68192d --- /dev/null +++ b/annotations_filtered/wf-gIUYRCyk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.62], [6.0, 6.08], [7.0, 7.67], [8.0, 8.06], [12.0, 13.07], [17.0, 17.63], [18.0, 19.14], [23.0, 23.14], [30.0, 31.29], [35.0, 38.84], [40.0, 43.04], [45.0, 45.72], [47.0, 48.79], [61.0, 66.23], [68.0, 93.75], [95.0, 95.27], [97.0, 97.38], [101.0, 100.63], [103.0, 103.84], [105.0, 108.08], [109.0, 109.98], [115.0, 114.88], [117.0, 121.31], [121.0, 121.44], [124.0, 125.58], [130.0, 131.82], [135.0, 135.24], [141.0, 141.3], [142.0, 143.88], [148.0, 149.89], [153.0, 160.24], [162.0, 166.82], [168.0, 169.86], [170.0, 171.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.72, 88.1, 0.0, 0.0, 36.94, 59.77, 0.0, 0.0, 0.0, 0.0, 31.54, 0.0, 0.0, 33.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.42, 65.09, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.62], ["whack, thwack", 7.55], ["wood", 5.85]], null, null, null, null, null, [["speech", 43.9], ["grunt", 15.44], ["screaming", 8.77]], null, null, [["grunt", 41.69], ["burping, eructation", 18.34], ["speech", 12.26]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 0.08, 0.67, 0.06, 1.07, 0.63, 1.14, 0.14, 1.29, 3.84, 3.04, 0.72, 1.79, 5.23, 25.75, 0.27, 0.38, -0.37, 0.84, 3.08, 0.98, -0.12, 4.31, 0.44, 1.58, 1.82, 0.24, 0.3, 1.88, 1.89, 7.24, 4.82, 1.86, 1.68]} \ No newline at end of file diff --git a/annotations_filtered/wfAfwKUkfHU_filtered.json b/annotations_filtered/wfAfwKUkfHU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3d154451d52333e69f12b256f628b1811063561 --- /dev/null +++ b/annotations_filtered/wfAfwKUkfHU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.32], [16.0, 20.87], [22.0, 44.64], [46.0, 47.68], [49.0, 49.99], [51.0, 53.74], [56.0, 57.81], [59.0, 60.54], [65.0, 65.48], [67.0, 77.62], [78.0, 79.57], [82.0, 83.69], [85.0, 90.83], [94.0, 102.12], [103.0, 107.4], [109.0, 112.08], [116.0, 120.07], [122.0, 123.99], [125.0, 126.28], [130.0, 138.5], [140.0, 141.02], [142.0, 143.94], [147.0, 149.66], [151.0, 153.1], [154.0, 155.88], [158.0, 164.22], [166.0, 170.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 80.46, 59.77, 0.0, 0.0, 97.33, 0.0, 0.0, 0.0, 52.56, 0.0, 0.0, 58.72, 37.08, 53.04, 55.81, 53.4, 0.0, 0.0, 76.2, 0.0, 0.0, 97.33, 98.8, 0.0, 70.86, 45.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 71.26], ["soundtrack music", 6.37], ["scary music", 5.65]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.51], ["hum", 9.79], ["whale vocalization", 7.19]]], "duration": [1.32, 4.87, 22.64, 1.68, 0.99, 2.74, 1.81, 1.54, 0.48, 10.62, 1.57, 1.69, 5.83, 8.12, 4.4, 3.08, 4.07, 1.99, 1.28, 8.5, 1.02, 1.94, 2.66, 2.1, 1.88, 6.22, 4.36]} \ No newline at end of file diff --git a/annotations_filtered/wfbqJpn8fN8_filtered.json b/annotations_filtered/wfbqJpn8fN8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5f9ca4eb50a8997fe88ae2eab2199120fcbb9e5 --- /dev/null +++ b/annotations_filtered/wfbqJpn8fN8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 38.7], [39.0, 49.37], [51.0, 51.38], [52.0, 52.34], [55.0, 54.85], [56.0, 57.3], [60.0, 61.21], [62.0, 62.46], [63.0, 65.31], [68.0, 68.94], [74.0, 74.95], [75.0, 75.64], [78.0, 78.6], [79.0, 80.25], [86.0, 86.02], [90.0, 90.12], [91.0, 91.99], [93.0, 96.94], [108.0, 110.22], [112.0, 114.02], [116.0, 122.28], [124.0, 127.92]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, false, false, true], "silence_prob": [79.41, 54.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.02, 31.04, 37.77, 31.05, 41.32], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["hum", 21.88], ["heart sounds, heartbeat", 19.98], ["music", 8.34]], null, null, null, null, null, null, null, null, [["mains hum", 32.74], ["hum", 27.62], ["throbbing", 6.55]], [["speech", 24.47], ["noise", 19.11], ["sidetone", 12.21]], [["speech", 34.98], ["hum", 29.15], ["mains hum", 19.59]], [["boing", 35.02], ["breaking", 24.98], ["speech", 22.42]], [["noise", 45.35], ["hum", 6.65], ["fly, housefly", 5.4]]], "duration": [18.7, 10.37, 0.38, 0.34, -0.15, 1.3, 1.21, 0.46, 2.31, 0.94, 0.95, 0.64, 0.6, 1.25, 0.02, 0.12, 0.99, 3.94, 2.22, 2.02, 6.28, 3.92]} \ No newline at end of file diff --git a/annotations_filtered/wfq7O3AgXdE_filtered.json b/annotations_filtered/wfq7O3AgXdE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc9a5620bc8bfcbbd0e93498df651f931c7ff964 --- /dev/null +++ b/annotations_filtered/wfq7O3AgXdE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.12], [6.0, 7.48], [8.0, 10.02], [15.0, 16.43], [17.0, 17.61], [18.0, 18.99], [20.0, 19.8], [23.0, 24.16], [36.0, 36.73], [39.0, 39.58], [45.0, 45.89], [47.0, 47.22], [49.0, 49.13], [53.0, 53.15], [56.0, 56.62], [61.0, 61.32], [62.0, 69.08], [70.0, 70.51], [71.0, 71.69], [76.0, 76.54], [79.0, 79.89], [82.0, 82.07], [82.0, 84.03], [86.0, 87.22], [88.0, 88.84], [90.0, 90.41], [93.0, 94.14], [94.0, 98.12], [98.0, 101.28], [106.0, 106.78], [108.0, 107.82], [110.0, 126.49], [127.0, 127.62], [128.0, 132.04], [136.0, 136.49], [137.0, 137.81], [141.0, 142.79], [144.0, 144.19], [147.0, 148.2], [149.0, 150.82], [151.0, 152.36], [154.0, 161.27], [163.0, 169.82], [171.0, 174.46], [176.0, 176.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.16, 0.0, 95.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.68, 0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 0.0, 0.0, 0.0, 0.0, 99.05, 95.09, 0.0, 0.0, 63.53, 0.0, 85.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 86.27, 91.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.12, 1.48, 2.02, 1.43, 0.61, 0.99, -0.2, 1.16, 0.73, 0.58, 0.89, 0.22, 0.13, 0.15, 0.62, 0.32, 7.08, 0.51, 0.69, 0.54, 0.89, 0.07, 2.03, 1.22, 0.84, 0.41, 1.14, 4.12, 3.28, 0.78, -0.18, 16.49, 0.62, 4.04, 0.49, 0.81, 1.79, 0.19, 1.2, 1.82, 1.36, 7.27, 6.82, 3.46, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/wgHRj2-vvs8_filtered.json b/annotations_filtered/wgHRj2-vvs8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..056175986736400f4eb4e5479e7b30dac20aad7d --- /dev/null +++ b/annotations_filtered/wgHRj2-vvs8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 72.98], [76.0, 89.7], [90.0, 89.73], [90.0, 89.77], [90.0, 89.83], [91.0, 95.99]], "keep_status": [false, true, false, false, false, true], "silence_prob": [0.0, 34.84, 0.0, 0.0, 0.0, 32.9], "audiomae_on_audioset": [null, [["speech", 30.01], ["gunshot, gunfire", 20.1], ["machine gun", 14.58]], null, null, null, [["speech", 40.55], ["quack", 9.59], ["gunshot, gunfire", 6.08]]], "duration": [60.98, 13.7, -0.27, -0.23, -0.17, 4.99]} \ No newline at end of file diff --git a/annotations_filtered/wgkxKdTVrHo_filtered.json b/annotations_filtered/wgkxKdTVrHo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d179b4ca00dff06d94cf1f899c28f5cd90a5e87 --- /dev/null +++ b/annotations_filtered/wgkxKdTVrHo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.4], [3.0, 6.78], [7.0, 7.8], [9.0, 10.64], [14.0, 16.88], [19.0, 24.07], [26.0, 27.4], [28.0, 29.84], [32.0, 43.58], [44.0, 48.3], [50.0, 50.11], [56.0, 56.96], [63.0, 63.48], [64.0, 75.47], [77.0, 79.66], [84.0, 84.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.97, 0.0, 0.0, 99.05, 77.36, 0.0, 0.0, 34.73, 42.58, 0.0, 0.0, 0.0, 54.3, 53.97, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 71.15], ["musical instrument", 5.17], ["didgeridoo", 3.46]], [["music", 60.8], ["frog", 6.66], ["speech", 6.23]], null, null, null, null, null, null], "duration": [0.4, 3.78, 0.8, 1.64, 2.88, 5.07, 1.4, 1.84, 11.58, 4.3, 0.11, 0.96, 0.48, 11.47, 2.66, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/wgzxSr6l9Y4_filtered.json b/annotations_filtered/wgzxSr6l9Y4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e8b0b7813da31e6c4271cbc80d384aa4d629cd5 --- /dev/null +++ b/annotations_filtered/wgzxSr6l9Y4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.13], [14.0, 18.33], [22.0, 114.44], [115.0, 114.52]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 90.95, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.13, 4.33, 92.44, -0.48]} \ No newline at end of file diff --git a/annotations_filtered/whCKn6cV-0k_filtered.json b/annotations_filtered/whCKn6cV-0k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7bcb688af896e16bd194ff5b3fe05b4ff617a2a --- /dev/null +++ b/annotations_filtered/whCKn6cV-0k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.76], [5.0, 6.08], [6.0, 9.0], [10.0, 9.88], [15.0, 15.42], [18.0, 19.01], [21.0, 22.11], [23.0, 24.19], [25.0, 26.23], [28.0, 28.54], [29.0, 29.94], [30.0, 31.62], [42.0, 42.55], [43.0, 43.61], [47.0, 47.58], [49.0, 50.43], [54.0, 53.81], [55.0, 55.07], [67.0, 69.6], [70.0, 73.3], [76.0, 75.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 89.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.76, 1.08, 3.0, -0.12, 0.42, 1.01, 1.11, 1.19, 1.23, 0.54, 0.94, 1.62, 0.55, 0.61, 0.58, 1.43, -0.19, 0.07, 2.6, 3.3, -0.36]} \ No newline at end of file diff --git a/annotations_filtered/whFoAKQ10gY_filtered.json b/annotations_filtered/whFoAKQ10gY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca7cbcac144e86918c3d93bcb52e02fe5a714b01 --- /dev/null +++ b/annotations_filtered/whFoAKQ10gY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.71], [17.0, 19.01], [20.0, 22.1], [23.0, 23.18], [26.0, 34.21], [44.0, 44.76], [55.0, 55.09], [55.0, 56.54]], "keep_status": [false, false, true, false, false, false, false, false], "silence_prob": [0.0, 51.66, 43.71, 0.0, 58.47, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 26.45], ["musical instrument", 6.91], ["guitar", 6.72]], null, null, null, null, null], "duration": [0.71, 2.01, 2.1, 0.18, 8.21, 0.76, 0.09, 1.54]} \ No newline at end of file diff --git a/annotations_filtered/whUo8sI5OuY_filtered.json b/annotations_filtered/whUo8sI5OuY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8df21f0f379ab27f786493af960dd44a7bd37cc7 --- /dev/null +++ b/annotations_filtered/whUo8sI5OuY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.72], [10.0, 9.78], [14.0, 22.03], [25.0, 30.82], [35.0, 49.65], [57.0, 57.81], [59.0, 84.21], [88.0, 108.9]], "keep_status": [true, false, true, false, true, false, true, false], "silence_prob": [33.99, 0.0, 35.55, 30.76, 31.64, 0.0, 32.01, 32.34], "audiomae_on_audioset": [[["music", 46.55], ["mains hum", 7.66], ["hum", 6.17]], null, [["music", 39.64], ["theremin", 10.08], ["scary music", 8.84]], [["music", 52.84], ["cacophony", 16.91], ["throbbing", 3.94]], [["music", 54.43], ["electronic music", 7.45], ["hum", 4.53]], null, [["music", 33.5], ["noise", 23.54], ["theremin", 12.38]], [["music", 55.94], ["hum", 16.87], ["mains hum", 6.37]]], "duration": [2.72, -0.22, 8.03, 5.82, 14.65, 0.81, 25.21, 20.9]} \ No newline at end of file diff --git a/annotations_filtered/wiA6bjzz-CM_filtered.json b/annotations_filtered/wiA6bjzz-CM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d7b83f9a54c4671b7dec7c87be63d494bced268 --- /dev/null +++ b/annotations_filtered/wiA6bjzz-CM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 11.65], [15.0, 21.14], [22.0, 22.59], [24.0, 25.22], [27.0, 29.4], [31.0, 31.75], [33.0, 34.03], [41.0, 43.11], [44.0, 45.12], [48.0, 48.25], [49.0, 49.3], [51.0, 51.31], [54.0, 54.48], [55.0, 55.56], [59.0, 61.99], [62.0, 62.72], [66.0, 66.8], [69.0, 69.63], [71.0, 76.08], [78.0, 79.68], [81.0, 82.0], [83.0, 86.49], [88.0, 91.81], [94.0, 95.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [34.47, 36.88, 0.0, 0.0, 82.79, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.23, 0.0, 0.0, 0.0, 42.28, 0.0, 0.0, 100.0, 92.15, 0.0], "audiomae_on_audioset": [[["fart", 55.98], ["speech", 32.58], ["whack, thwack", 1.16]], [["speech", 44.83], ["sidetone", 34.22], ["radio", 2.98]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["heart sounds, heartbeat", 32.37], ["sidetone", 19.24], ["throbbing", 5.01]], null, null, null, null, null], "duration": [6.65, 6.14, 0.59, 1.22, 2.4, 0.75, 1.03, 2.11, 1.12, 0.25, 0.3, 0.31, 0.48, 0.56, 2.99, 0.72, 0.8, 0.63, 5.08, 1.68, 1.0, 3.49, 3.81, 1.5]} \ No newline at end of file diff --git a/annotations_filtered/wirXvuRATiE_filtered.json b/annotations_filtered/wirXvuRATiE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..590bef5be35f88817292c80e431bc5a09dd4bdb4 --- /dev/null +++ b/annotations_filtered/wirXvuRATiE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.96], [5.0, 6.05], [11.0, 11.97], [12.0, 12.93], [20.0, 22.23], [27.0, 27.23], [28.0, 29.42], [33.0, 32.93], [38.0, 38.82], [47.0, 47.98], [53.0, 53.6], [58.0, 58.7], [59.0, 60.25], [67.0, 67.22], [68.0, 68.01], [71.0, 71.15], [112.0, 113.12], [116.0, 116.38], [117.0, 118.45], [123.0, 123.09], [124.0, 127.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 64.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.96, 1.05, 0.97, 0.93, 2.23, 0.23, 1.42, -0.07, 0.82, 0.98, 0.6, 0.7, 1.25, 0.22, 0.01, 0.15, 1.12, 0.38, 1.45, 0.09, 3.68]} \ No newline at end of file diff --git a/annotations_filtered/wj0aH_PiAnI_filtered.json b/annotations_filtered/wj0aH_PiAnI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e7c18ec62fed6e3cc5a293df9cce96d2bc25de3 --- /dev/null +++ b/annotations_filtered/wj0aH_PiAnI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.87], [10.0, 10.17], [14.0, 13.85], [22.0, 23.41], [40.0, 40.44], [49.0, 49.5], [58.0, 58.35], [59.0, 59.58], [61.0, 61.32], [62.0, 62.55], [63.0, 63.81], [64.0, 65.25], [66.0, 67.0], [69.0, 80.25], [83.0, 85.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.28, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["noise", 49.09], ["effects unit", 6.09], ["music", 3.64]], null], "duration": [0.87, 0.17, -0.15, 1.41, 0.44, 0.5, 0.35, 0.58, 0.32, 0.55, 0.81, 1.25, 1.0, 11.25, 2.38]} \ No newline at end of file diff --git a/annotations_filtered/wjVPv5aO_no_filtered.json b/annotations_filtered/wjVPv5aO_no_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0098d186b32b27fa18784cb206261cee23472c4c --- /dev/null +++ b/annotations_filtered/wjVPv5aO_no_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.95], [7.0, 8.02], [10.0, 10.66], [13.0, 12.85], [16.0, 32.83], [36.0, 78.41], [81.0, 93.14], [95.0, 99.67], [102.0, 102.59], [114.0, 114.29], [115.0, 115.62], [127.0, 127.33]], "keep_status": [false, false, false, false, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.32, 0.0, 30.16, 32.37, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 22.65], ["screaming", 9.38], ["whack, thwack", 6.76]], null, [["vehicle", 29.18], ["car", 19.56], ["speech", 8.34]], [["speech", 23.7], ["music", 17.85], ["noise", 6.61]], null, null, null, null], "duration": [0.95, 1.02, 0.66, -0.15, 16.83, 42.41, 12.14, 4.67, 0.59, 0.29, 0.62, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/wjkdynBFHuQ_filtered.json b/annotations_filtered/wjkdynBFHuQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4102ada0539c960f6db6c1d13f02f1feb8a1c621 --- /dev/null +++ b/annotations_filtered/wjkdynBFHuQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 28.81], [31.0, 33.51], [39.0, 39.41], [42.0, 43.87], [45.0, 46.41], [49.0, 50.23], [51.0, 50.85], [51.0, 56.78], [57.0, 57.81], [66.0, 66.8], [70.0, 72.0], [78.0, 79.34], [80.0, 81.26], [90.0, 90.53], [94.0, 94.31]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [83.52, 38.31, 0.0, 0.0, 0.0, 0.0, 0.0, 30.7, 0.0, 0.0, 80.29, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["electric shaver, electric razor", 12.49], ["music", 10.11], ["mains hum", 9.37]], null, null, null, null, null, [["speech", 27.59], ["frog", 17.39], ["fly, housefly", 12.18]], null, null, null, null, null, null, null], "duration": [2.81, 2.51, 0.41, 1.87, 1.41, 1.23, -0.15, 5.78, 0.81, 0.8, 2.0, 1.34, 1.26, 0.53, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/wk-P07PoFAk_filtered.json b/annotations_filtered/wk-P07PoFAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23854eeeb648ed591a108d3bf5c0a80d696aa5f8 --- /dev/null +++ b/annotations_filtered/wk-P07PoFAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.28], [14.0, 20.66], [23.0, 26.35], [32.0, 33.29], [34.0, 34.75], [36.0, 45.32], [46.0, 46.72], [48.0, 48.24], [50.0, 68.44], [69.0, 73.55], [74.0, 73.67], [74.0, 76.38], [80.0, 95.81], [103.0, 156.69]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [31.07, 30.29, 29.28, 0.0, 0.0, 29.43, 0.0, 0.0, 29.66, 29.98, 0.0, 31.85, 28.56, 0.0], "audiomae_on_audioset": [[["music", 39.4], ["grunt", 22.76], ["throat clearing", 7.5]], [["mosquito", 68.46], ["fly, housefly", 22.53], ["insect", 5.51]], [["speech", 38.46], ["vehicle", 20.54], ["car", 12.62]], null, null, [["speech", 57.68], ["music", 11.14], ["vehicle", 5.14]], null, null, [["music", 70.95], ["explosion", 3.71], ["musical instrument", 3.1]], [["speech", 40.35], ["whale vocalization", 13.23], ["music", 5.64]], null, [["cattle, bovinae", 12.95], ["whale vocalization", 12.77], ["moo", 10.61]], [["music", 76.02], ["throbbing", 4.53], ["cacophony", 2.58]], null], "duration": [2.28, 6.66, 3.35, 1.29, 0.75, 9.32, 0.72, 0.24, 18.44, 4.55, -0.33, 2.38, 15.81, 53.69]} \ No newline at end of file diff --git a/annotations_filtered/wkH0WdBYT4E_filtered.json b/annotations_filtered/wkH0WdBYT4E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99b7049b19ec65670a34deb35bce4887ef53899d --- /dev/null +++ b/annotations_filtered/wkH0WdBYT4E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 21.39], [22.0, 24.06], [24.0, 26.76], [27.0, 28.14], [29.0, 32.22], [33.0, 34.82], [36.0, 38.75], [39.0, 40.46], [41.0, 74.87], [75.0, 116.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.21, 72.6, 61.97, 0.0, 69.74, 0.0, 87.92, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 46.81], ["music", 28.92], ["hum", 4.28]], null, null, null, null, null, null, null, null, null], "duration": [20.39, 2.06, 2.76, 1.14, 3.22, 1.82, 2.75, 1.46, 33.87, 41.67]} \ No newline at end of file diff --git a/annotations_filtered/wknywxfcE5M_filtered.json b/annotations_filtered/wknywxfcE5M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f098187003a61fc8b710743e33ca1d8e45052079 --- /dev/null +++ b/annotations_filtered/wknywxfcE5M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 5.1], [5.0, 5.41], [13.0, 12.99], [16.0, 17.37], [22.0, 22.42], [24.0, 23.95], [26.0, 26.76], [34.0, 35.23], [38.0, 38.37], [41.0, 41.37], [47.0, 46.87], [52.0, 54.95], [56.0, 56.62], [57.0, 58.02], [61.0, 61.86], [68.0, 68.3], [71.0, 72.89], [74.0, 74.38], [77.0, 76.76]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [30.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 45.53], ["didgeridoo", 16.4], ["theremin", 6.37]], null, null, null, null, null, null, null, null, null, null, [["croak", 18.79], ["frog", 17.56], ["music", 15.67]], null, null, null, null, null, null, null], "duration": [5.1, 0.41, -0.01, 1.37, 0.42, -0.05, 0.76, 1.23, 0.37, 0.37, -0.13, 2.95, 0.62, 1.02, 0.86, 0.3, 1.89, 0.38, -0.24]} \ No newline at end of file diff --git a/annotations_filtered/wkoHQdbhfOc_filtered.json b/annotations_filtered/wkoHQdbhfOc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6db43a29fa10ba798bb9e4d64a1b082898415d1 --- /dev/null +++ b/annotations_filtered/wkoHQdbhfOc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 25.62], [26.0, 53.08], [54.0, 59.63], [62.0, 66.16], [68.0, 70.12], [73.0, 75.63], [88.0, 88.82], [90.0, 90.71], [91.0, 96.31], [98.0, 111.18], [112.0, 115.26], [116.0, 132.26], [133.0, 137.61], [138.0, 145.45], [147.0, 149.52], [152.0, 158.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [79.59, 58.72, 82.25, 98.99, 99.59, 84.98, 0.0, 0.0, 56.55, 73.97, 99.56, 99.48, 87.74, 56.1, 97.33, 98.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [13.62, 27.08, 5.63, 4.16, 2.12, 2.63, 0.82, 0.71, 5.31, 13.18, 3.26, 16.26, 4.61, 7.45, 2.52, 6.9]} \ No newline at end of file diff --git a/annotations_filtered/wkyZ8pJD0Uo_filtered.json b/annotations_filtered/wkyZ8pJD0Uo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..117085d833f5e095d5be97cdf94815e1687b1004 --- /dev/null +++ b/annotations_filtered/wkyZ8pJD0Uo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.65], [6.0, 6.98], [8.0, 9.22], [11.0, 11.6], [14.0, 14.59], [17.0, 17.19], [19.0, 19.09], [20.0, 20.95], [23.0, 24.34], [26.0, 27.7], [37.0, 37.03], [37.0, 38.25], [45.0, 45.82], [46.0, 47.7], [55.0, 54.73], [57.0, 58.56], [60.0, 61.75], [62.0, 63.9], [64.0, 65.64], [67.0, 67.81], [73.0, 74.22], [75.0, 95.15], [100.0, 102.3], [104.0, 106.19], [120.0, 120.39], [123.0, 123.53], [124.0, 125.12], [130.0, 131.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.01, 34.82, 55.04, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["groan", 44.6], ["grunt", 18.71], ["speech", 5.14]], null, null, null, null, null], "duration": [0.65, 0.98, 1.22, 0.6, 0.59, 0.19, 0.09, 0.95, 1.34, 1.7, 0.03, 1.25, 0.82, 1.7, -0.27, 1.56, 1.75, 1.9, 1.64, 0.81, 1.22, 20.15, 2.3, 2.19, 0.39, 0.53, 1.12, 1.45]} \ No newline at end of file diff --git a/annotations_filtered/wlFo4ydbP7c_filtered.json b/annotations_filtered/wlFo4ydbP7c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..899b3a9d747d0a1f8a93e4dcd44facc70d9aad78 --- /dev/null +++ b/annotations_filtered/wlFo4ydbP7c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.21], [2.0, 2.39], [3.0, 3.3], [14.0, 15.11], [37.0, 38.23], [56.0, 59.46], [71.0, 71.22], [79.0, 80.81], [89.0, 89.01], [114.0, 114.59], [116.0, 118.89], [119.0, 120.77], [127.0, 128.31], [140.0, 141.66], [142.0, 144.56], [146.0, 174.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.98, 0.0, 0.0, 0.0, 0.0, 99.56, 0.0, 0.0, 0.0, 31.26, 31.13], "audiomae_on_audioset": [null, null, null, null, null, [["moo", 42.92], ["cattle, bovinae", 34.61], ["livestock, farm animals, working animals", 21.25]], null, null, null, null, null, null, null, null, [["speech", 22.51], ["radio", 8.3], ["whale vocalization", 7.75]], [["music", 80.05], ["synthetic singing", 4.68], ["male singing", 2.01]]], "duration": [0.21, 0.39, 0.3, 1.11, 1.23, 3.46, 0.22, 1.81, 0.01, 0.59, 2.89, 1.77, 1.31, 1.66, 2.56, 28.16]} \ No newline at end of file diff --git a/annotations_filtered/wlwh5x9eHBM_filtered.json b/annotations_filtered/wlwh5x9eHBM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3467fd30acb131f487ed5c99a26075a717280080 --- /dev/null +++ b/annotations_filtered/wlwh5x9eHBM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.09], [2.0, 1.78], [3.0, 2.84], [6.0, 6.0], [15.0, 19.72], [20.0, 21.03], [23.0, 23.18], [27.0, 27.01], [29.0, 29.0], [32.0, 32.64], [34.0, 33.64], [34.0, 33.83], [36.0, 36.46], [40.0, 39.93], [45.0, 45.47], [47.0, 47.68], [50.0, 51.41], [60.0, 64.59], [67.0, 66.97], [68.0, 67.9], [68.0, 68.03], [68.0, 68.69], [73.0, 73.18], [75.0, 76.37], [79.0, 79.84], [80.0, 80.89], [82.0, 82.44], [91.0, 91.37], [93.0, 93.56], [101.0, 101.71], [103.0, 103.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 63.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 72.44], ["boing", 2.8], ["dog", 2.08]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.09, -0.22, -0.16, 0.0, 4.72, 1.03, 0.18, 0.01, 0.0, 0.64, -0.36, -0.17, 0.46, -0.07, 0.47, 0.68, 1.41, 4.59, -0.03, -0.1, 0.03, 0.69, 0.18, 1.37, 0.84, 0.89, 0.44, 0.37, 0.56, 0.71, 0.96]} \ No newline at end of file diff --git a/annotations_filtered/wmFhHU38IhE_filtered.json b/annotations_filtered/wmFhHU38IhE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..606a8d8ecc48694103a54f73ed1b361c7cbb477a --- /dev/null +++ b/annotations_filtered/wmFhHU38IhE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.67], [3.0, 2.71], [11.0, 15.28], [17.0, 21.54], [23.0, 24.33], [25.0, 26.23], [27.0, 27.08], [29.0, 28.73], [29.0, 29.0], [30.0, 30.91], [32.0, 33.47], [34.0, 34.5], [37.0, 39.36], [48.0, 49.35], [58.0, 60.71]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 33.37, 32.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.31, 0.0, 45.33], "audiomae_on_audioset": [null, null, [["speech", 25.16], ["music", 14.11], ["hum", 10.26]], [["fly, housefly", 41.54], ["insect", 26.88], ["bee, wasp, etc.", 26.57]], null, null, null, null, null, null, null, null, [["fly, housefly", 42.09], ["insect", 14.23], ["bee, wasp, etc.", 9.79]], null, [["whale vocalization", 45.06], ["hum", 18.26], ["throbbing", 6.01]]], "duration": [0.67, -0.29, 4.28, 4.54, 1.33, 1.23, 0.08, -0.27, 0.0, 0.91, 1.47, 0.5, 2.36, 1.35, 2.71]} \ No newline at end of file diff --git a/annotations_filtered/wmG3O9RvEaU_filtered.json b/annotations_filtered/wmG3O9RvEaU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ffb5d94b5735c696c53ca68ae3441983e435e494 --- /dev/null +++ b/annotations_filtered/wmG3O9RvEaU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 29.37], [31.0, 30.96], [32.0, 32.88], [36.0, 37.49], [38.0, 39.09], [40.0, 43.48], [46.0, 48.15], [49.0, 51.26], [52.0, 52.24], [55.0, 63.81], [65.0, 65.42], [66.0, 66.99], [68.0, 68.3], [69.0, 70.38], [73.0, 75.32], [77.0, 77.7], [79.0, 83.37], [84.0, 86.44], [87.0, 98.36], [99.0, 101.51], [103.0, 102.86], [104.0, 105.43], [106.0, 107.28], [108.0, 114.24], [117.0, 117.86], [118.0, 119.31], [121.0, 121.56]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false], "silence_prob": [37.5, 0.0, 0.0, 0.0, 0.0, 38.67, 50.61, 51.12, 0.0, 39.52, 0.0, 0.0, 0.0, 0.0, 61.97, 0.0, 48.78, 81.53, 75.23, 81.53, 0.0, 0.0, 0.0, 34.27, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["rowboat, canoe, kayak", 13.93], ["radio", 12.53], ["boat, water vehicle", 10.91]], null, null, null, null, [["speech", 61.68], ["rowboat, canoe, kayak", 8.47], ["boat, water vehicle", 3.78]], null, null, null, [["animal", 24.08], ["rodents, rats, mice", 11.26], ["mouse", 6.84]], null, null, null, null, null, null, [["speech", 56.53], ["bee, wasp, etc.", 3.43], ["animal", 2.77]], null, null, null, null, null, null, [["firecracker", 24.09], ["burst, pop", 22.71], ["speech", 19.37]], null, null, null], "duration": [14.37, -0.04, 0.88, 1.49, 1.09, 3.48, 2.15, 2.26, 0.24, 8.81, 0.42, 0.99, 0.3, 1.38, 2.32, 0.7, 4.37, 2.44, 11.36, 2.51, -0.14, 1.43, 1.28, 6.24, 0.86, 1.31, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/wmXFSQdF3PM_filtered.json b/annotations_filtered/wmXFSQdF3PM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2acc59a8607edf2879b812683ff209d854e19ae6 --- /dev/null +++ b/annotations_filtered/wmXFSQdF3PM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.1], [8.0, 7.55], [11.0, 12.88], [15.0, 15.01], [17.0, 18.13], [21.0, 21.91], [24.0, 81.95], [83.0, 82.98], [84.0, 102.17], [104.0, 122.86], [123.0, 124.44], [126.0, 140.76], [142.0, 142.75], [146.0, 146.92], [148.0, 148.14], [150.0, 150.96], [152.0, 152.58], [153.0, 155.29], [157.0, 156.76], [158.0, 164.88], [167.0, 167.39]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [30.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.43, 30.33, 0.0, 30.73, 0.0, 0.0, 0.0, 0.0, 0.0, 33.5, 0.0, 35.28, 0.0], "audiomae_on_audioset": [[["fire", 21.1], ["speech", 15.95], ["eruption", 5.63]], null, null, null, null, null, null, null, [["music", 73.07], ["hum", 6.16], ["scary music", 3.01]], [["music", 35.4], ["hum", 13.75], ["speech", 11.42]], null, [["music", 47.58], ["hum", 19.92], ["throbbing", 14.27]], null, null, null, null, null, [["music", 41.17], ["speech", 25.49], ["didgeridoo", 6.32]], null, [["hum", 39.5], ["sidetone", 12.72], ["speech", 9.75]], null], "duration": [2.1, -0.45, 1.88, 0.01, 1.13, 0.91, 57.95, -0.02, 18.17, 18.86, 1.44, 14.76, 0.75, 0.92, 0.14, 0.96, 0.58, 2.29, -0.24, 6.88, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/wmbN_BXQaho_filtered.json b/annotations_filtered/wmbN_BXQaho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67c8c95d471065e9a5164eb90736e296fd18a509 --- /dev/null +++ b/annotations_filtered/wmbN_BXQaho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.34], [6.0, 7.47], [8.0, 8.19], [11.0, 13.78], [16.0, 16.46], [17.0, 16.8], [18.0, 19.18], [19.0, 21.69], [23.0, 24.34], [25.0, 26.59], [28.0, 28.11], [29.0, 29.1], [30.0, 33.3], [35.0, 50.65], [51.0, 50.7], [51.0, 73.67], [77.0, 81.33], [82.0, 113.97], [119.0, 137.52], [140.0, 140.9], [143.0, 145.79], [147.0, 149.39], [154.0, 154.6], [156.0, 156.61], [158.0, 158.23], [159.0, 160.1], [163.0, 164.08], [166.0, 167.59], [169.0, 175.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [67.76, 0.0, 0.0, 70.58, 0.0, 0.0, 0.0, 62.89, 0.0, 0.0, 0.0, 0.0, 73.21, 33.62, 0.0, 33.63, 34.73, 0.0, 37.08, 0.0, 61.97, 70.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.02], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 33.86], ["speech", 17.1], ["fart", 12.38]], null, [["hum", 25.31], ["speech", 15.24], ["sidetone", 8.41]], [["music", 45.13], ["didgeridoo", 7.73], ["musical instrument", 4.52]], null, [["noise", 27.12], ["hum", 17.77], ["mains hum", 11.19]], null, null, null, null, null, null, null, null, null, null], "duration": [3.34, 1.47, 0.19, 2.78, 0.46, -0.2, 1.18, 2.69, 1.34, 1.59, 0.11, 0.1, 3.3, 15.65, -0.3, 22.67, 4.33, 31.97, 18.52, 0.9, 2.79, 2.39, 0.6, 0.61, 0.23, 1.1, 1.08, 1.59, 6.63]} \ No newline at end of file diff --git a/annotations_filtered/wmbt1RjPn4M_filtered.json b/annotations_filtered/wmbt1RjPn4M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/wmbt1RjPn4M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/wmu9xg12xuc_filtered.json b/annotations_filtered/wmu9xg12xuc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..433b38f187b6c8612ddadf117aa03c68e31533af --- /dev/null +++ b/annotations_filtered/wmu9xg12xuc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.77], [18.0, 26.67], [28.0, 38.57], [41.0, 43.71], [45.0, 48.98], [51.0, 51.63], [56.0, 55.83], [56.0, 58.63], [62.0, 61.59], [64.0, 74.12], [76.0, 81.41], [83.0, 87.81], [91.0, 92.42], [94.0, 96.26], [96.0, 101.95], [106.0, 110.46]], "keep_status": [true, false, true, false, false, false, false, true, false, false, false, true, false, true, false, true], "silence_prob": [37.58, 32.81, 29.12, 29.84, 30.18, 0.0, 0.0, 30.73, 0.0, 29.83, 29.58, 28.95, 0.0, 29.8, 30.27, 28.78], "audiomae_on_audioset": [[["music", 34.14], ["hum", 9.88], ["mains hum", 5.39]], [["speech", 26.07], ["throbbing", 25.78], ["music", 25.3]], [["music", 39.19], ["speech", 22.09], ["vehicle", 4.68]], [["speech", 48.97], ["music", 22.7], ["hum", 4.2]], [["hum", 47.99], ["mains hum", 20.78], ["music", 11.5]], null, null, [["music", 19.49], ["throbbing", 14.93], ["hum", 10.54]], null, [["throbbing", 44.44], ["music", 44.25], ["hum", 5.07]], [["music", 44.19], ["speech", 30.03], ["throbbing", 11.1]], [["music", 40.14], ["speech", 10.37], ["noise", 6.13]], null, [["music", 30.94], ["angry music", 9.29], ["brass instrument", 4.82]], [["throbbing", 66.38], ["music", 13.09], ["hum", 11.29]], [["music", 32.43], ["smash, crash", 17.5], ["throbbing", 15.52]]], "duration": [2.77, 8.67, 10.57, 2.71, 3.98, 0.63, -0.17, 2.63, -0.41, 10.12, 5.41, 4.81, 1.42, 2.26, 5.95, 4.46]} \ No newline at end of file diff --git a/annotations_filtered/wn-e7FlYRJU_filtered.json b/annotations_filtered/wn-e7FlYRJU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6d5e8c61c01e9b6b7b64d8091a867ad1943ca2d --- /dev/null +++ b/annotations_filtered/wn-e7FlYRJU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 26.13], [27.0, 27.65], [50.0, 52.05], [54.0, 53.87], [55.0, 55.85], [62.0, 63.04], [65.0, 65.47], [80.0, 81.58], [84.0, 85.11], [98.0, 98.34], [103.0, 103.62], [106.0, 107.16], [117.0, 116.92], [119.0, 119.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 98.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.13, 0.65, 2.05, -0.13, 0.85, 1.04, 0.47, 1.58, 1.11, 0.34, 0.62, 1.16, -0.08, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/wn_8YBvVugo_filtered.json b/annotations_filtered/wn_8YBvVugo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1e0a726fc4fc4fd7ff9a0223447c2a53b0c47c2 --- /dev/null +++ b/annotations_filtered/wn_8YBvVugo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 32.95], [34.0, 34.89], [37.0, 78.16], [80.0, 80.25], [83.0, 83.15], [85.0, 84.86], [95.0, 99.57], [100.0, 100.55], [102.0, 105.04]], "keep_status": [true, false, false, false, false, false, false, false, true], "silence_prob": [31.26, 0.0, 0.0, 0.0, 0.0, 0.0, 34.03, 0.0, 36.46], "audiomae_on_audioset": [[["music", 27.25], ["speech", 16.15], ["throbbing", 7.84]], null, null, null, null, null, [["music", 59.79], ["throbbing", 19.47], ["hum", 12.09]], null, [["music", 37.23], ["speech", 10.74], ["synthesizer", 9.96]]], "duration": [11.95, 0.89, 41.16, 0.25, 0.15, -0.14, 4.57, 0.55, 3.04]} \ No newline at end of file diff --git a/annotations_filtered/wnfHqnaM0yI_filtered.json b/annotations_filtered/wnfHqnaM0yI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1b8a3bb85eccedbae69f7a191a96c4d6978b91a --- /dev/null +++ b/annotations_filtered/wnfHqnaM0yI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.72], [25.0, 25.66], [28.0, 28.83], [35.0, 35.07], [37.0, 38.21], [39.0, 49.57], [52.0, 52.47], [54.0, 56.32], [58.0, 59.22], [72.0, 76.54]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.85, 0.0, 30.65, 0.0, 37.74], "audiomae_on_audioset": [null, null, null, null, null, [["livestock, farm animals, working animals", 38.86], ["cattle, bovinae", 16.81], ["music", 15.72]], null, [["music", 30.71], ["whack, thwack", 29.46], ["thunk", 14.42]], null, [["music", 35.95], ["musical instrument", 11.59], ["guitar", 10.87]]], "duration": [0.72, 0.66, 0.83, 0.07, 1.21, 10.57, 0.47, 2.32, 1.22, 4.54]} \ No newline at end of file diff --git a/annotations_filtered/wnrdetFAo1o_filtered.json b/annotations_filtered/wnrdetFAo1o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db9e5385bd15b7a35bd5b0ef3ab0d6872feeeb7d --- /dev/null +++ b/annotations_filtered/wnrdetFAo1o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.71], [8.0, 9.56], [10.0, 11.89], [15.0, 15.33], [17.0, 17.88], [33.0, 33.35], [38.0, 39.06], [51.0, 50.85], [52.0, 53.82], [57.0, 58.46], [59.0, 60.44], [61.0, 64.44], [65.0, 64.93], [66.0, 68.18], [69.0, 69.99], [71.0, 73.43], [74.0, 76.37], [78.0, 78.9], [80.0, 82.0], [83.0, 84.69], [86.0, 87.56], [89.0, 89.45], [90.0, 92.62], [96.0, 97.61], [98.0, 99.49], [101.0, 102.27], [104.0, 112.24], [114.0, 118.59], [119.0, 120.88], [122.0, 127.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.41, 0.0, 69.47, 0.0, 87.74, 34.46, 0.0, 71.0, 0.0, 0.0, 0.0, 34.11, 0.0, 0.0, 0.0, 47.86, 92.15, 0.0, 90.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 51.14], ["inside, small room", 3.39], ["fart", 2.78]], null, null, null, null, null, [["dog", 15.91], ["speech", 11.49], ["domestic animals, pets", 8.28]], null, null, null, [["hum", 28.83], ["speech", 11.94], ["mains hum", 5.81]], null, null, null], "duration": [1.71, 1.56, 1.89, 0.33, 0.88, 0.35, 1.06, -0.15, 1.82, 1.46, 1.44, 3.44, -0.07, 2.18, 0.99, 2.43, 2.37, 0.9, 2.0, 1.69, 1.56, 0.45, 2.62, 1.61, 1.49, 1.27, 8.24, 4.59, 1.88, 5.33]} \ No newline at end of file diff --git a/annotations_filtered/wnvRIdndQdk_filtered.json b/annotations_filtered/wnvRIdndQdk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71ff9719eb06cada80dce99f9313826cf2e96317 --- /dev/null +++ b/annotations_filtered/wnvRIdndQdk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.75], [9.0, 17.42], [19.0, 23.57], [24.0, 49.72], [50.0, 49.94], [50.0, 50.52], [53.0, 72.87], [75.0, 97.39], [102.0, 116.67]], "keep_status": [false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 39.46, 52.98, 30.6, 0.0, 0.0, 29.67, 30.32, 29.07], "audiomae_on_audioset": [null, [["didgeridoo", 53.44], ["music", 26.74], ["whale vocalization", 4.51]], null, [["whale vocalization", 16.24], ["hum", 15.0], ["throbbing", 11.43]], null, null, [["music", 55.1], ["throbbing", 10.18], ["outside, rural or natural", 2.88]], [["music", 43.45], ["hum", 22.09], ["mains hum", 9.97]], [["hum", 31.59], ["music", 29.5], ["throbbing", 17.4]]], "duration": [1.75, 8.42, 4.57, 25.72, -0.06, 0.52, 19.87, 22.39, 14.67]} \ No newline at end of file diff --git a/annotations_filtered/wnwsSOrmEKI_filtered.json b/annotations_filtered/wnwsSOrmEKI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..995c37ded454e1ff0fce3a1885833944bcf464da --- /dev/null +++ b/annotations_filtered/wnwsSOrmEKI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 27.48], [28.0, 39.39], [43.0, 44.61], [45.0, 45.35], [45.0, 48.51], [51.0, 53.7], [55.0, 59.7], [66.0, 66.38], [73.0, 73.7], [77.0, 78.76], [79.0, 82.65], [83.0, 84.96], [89.0, 89.92], [90.0, 90.56], [92.0, 91.64], [93.0, 93.21], [99.0, 99.05], [105.0, 105.46], [108.0, 111.37], [114.0, 114.86], [117.0, 126.87], [128.0, 133.27], [136.0, 154.48]], "keep_status": [false, false, false, false, true, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.48, 36.71, 0.0, 0.0, 44.78, 49.82, 64.41, 0.0, 0.0, 0.0, 45.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.61, 0.0, 45.78, 100.0, 85.9], "audiomae_on_audioset": [null, [["speech", 56.65], ["sidetone", 34.42], ["dial tone", 1.41]], null, null, [["speech", 16.93], ["hum", 11.9], ["whale vocalization", 10.14]], [["burping, eructation", 22.88], ["hum", 14.7], ["speech", 8.13]], null, null, null, null, [["fart", 23.22], ["grunt", 13.89], ["growling", 6.55]], null, null, null, null, null, null, null, null, null, [["speech", 83.42], ["grunt", 10.12], ["male speech, man speaking", 2.4]], null, null], "duration": [21.48, 11.39, 1.61, 0.35, 3.51, 2.7, 4.7, 0.38, 0.7, 1.76, 3.65, 1.96, 0.92, 0.56, -0.36, 0.21, 0.05, 0.46, 3.37, 0.86, 9.87, 5.27, 18.48]} \ No newline at end of file diff --git a/annotations_filtered/woLbaFLoJI8_filtered.json b/annotations_filtered/woLbaFLoJI8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e85ce63c46d49c1b3239ca1964932ce6af20650 --- /dev/null +++ b/annotations_filtered/woLbaFLoJI8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.92], [3.0, 5.14], [6.0, 7.08], [10.0, 11.8], [14.0, 15.03], [16.0, 17.56], [19.0, 19.2], [20.0, 21.41], [23.0, 24.61], [30.0, 30.11], [41.0, 59.41], [63.0, 64.18], [67.0, 68.64], [82.0, 91.94], [93.0, 94.53], [95.0, 95.47], [100.0, 102.64], [113.0, 114.49], [116.0, 119.25], [120.0, 120.48], [121.0, 126.66], [127.0, 129.14], [130.0, 136.61], [138.0, 139.04], [140.0, 140.09], [142.0, 143.13], [145.0, 146.21], [147.0, 147.61], [151.0, 152.04]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 44.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.24, 0.0, 0.0, 48.95, 0.0, 0.0, 60.05, 0.0, 72.01, 0.0, 83.16, 99.26, 99.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["theremin", 31.33], ["speech", 14.69], ["music", 14.21]], null, null, null, null, null, null, null, null, [["music", 48.62], ["speech", 17.93], ["hum", 11.06]], null, null, [["speech", 43.62], ["music", 20.59], ["insect", 3.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.92, 2.14, 1.08, 1.8, 1.03, 1.56, 0.2, 1.41, 1.61, 0.11, 18.41, 1.18, 1.64, 9.94, 1.53, 0.47, 2.64, 1.49, 3.25, 0.48, 5.66, 2.14, 6.61, 1.04, 0.09, 1.13, 1.21, 0.61, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/woSj0M9Decw_filtered.json b/annotations_filtered/woSj0M9Decw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1934d05aa37088690737fb047b33095834ebffb --- /dev/null +++ b/annotations_filtered/woSj0M9Decw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.67], [15.0, 17.74], [20.0, 30.69], [32.0, 40.59], [42.0, 42.01], [42.0, 48.42], [54.0, 55.53], [57.0, 57.72], [59.0, 59.22], [64.0, 64.5], [69.0, 69.01], [71.0, 89.38], [91.0, 101.83], [104.0, 106.2]], "keep_status": [false, true, true, true, false, true, false, false, false, false, false, false, false, true], "silence_prob": [29.61, 32.32, 30.27, 30.65, 0.0, 29.66, 0.0, 0.0, 0.0, 0.0, 0.0, 30.14, 30.65, 30.07], "audiomae_on_audioset": [[["music", 47.41], ["didgeridoo", 24.42], ["whale vocalization", 7.24]], [["music", 25.11], ["throbbing", 17.58], ["livestock, farm animals, working animals", 13.55]], [["music", 54.81], ["musical instrument", 5.52], ["speech", 4.62]], [["livestock, farm animals, working animals", 31.93], ["cattle, bovinae", 19.66], ["music", 15.58]], null, [["moo", 19.11], ["cattle, bovinae", 19.09], ["speech", 15.94]], null, null, null, null, null, [["theremin", 38.39], ["music", 38.17], ["synthesizer", 4.33]], [["music", 63.87], ["synthesizer", 16.02], ["theremin", 3.6]], [["speech", 29.15], ["sidetone", 10.17], ["music", 10.07]]], "duration": [7.67, 2.74, 10.69, 8.59, 0.01, 6.42, 1.53, 0.72, 0.22, 0.5, 0.01, 18.38, 10.83, 2.2]} \ No newline at end of file diff --git a/annotations_filtered/worFlbNJG_w_filtered.json b/annotations_filtered/worFlbNJG_w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d5a5e6880d31cc7b067bc2003464fe8153652bc --- /dev/null +++ b/annotations_filtered/worFlbNJG_w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 18.35], [19.0, 22.23], [24.0, 25.0], [26.0, 27.46], [30.0, 31.63], [35.0, 39.28], [40.0, 43.07], [44.0, 44.02], [46.0, 46.18], [50.0, 50.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 88.83, 0.0, 0.0, 0.0, 100.0, 36.88, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 71.19], ["busy signal", 6.52], ["dial tone", 3.62]], null, null, null], "duration": [3.35, 3.23, 1.0, 1.46, 1.63, 4.28, 3.07, 0.02, 0.18, 0.03]} \ No newline at end of file diff --git a/annotations_filtered/wosztGGnWt4_filtered.json b/annotations_filtered/wosztGGnWt4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bd0a109322293ee73cd481c21c76eff2cc6dda5 --- /dev/null +++ b/annotations_filtered/wosztGGnWt4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.13], [9.0, 10.64], [12.0, 12.29], [14.0, 17.59], [20.0, 20.6], [22.0, 21.95], [30.0, 31.28], [33.0, 33.13], [36.0, 36.44], [37.0, 38.52], [43.0, 44.1], [47.0, 48.15], [49.0, 49.42], [58.0, 62.46], [65.0, 66.16], [69.0, 70.71], [73.0, 73.53], [74.0, 74.75], [77.0, 77.6], [79.0, 84.1], [93.0, 94.63], [99.0, 99.99], [103.0, 104.97], [108.0, 109.46], [112.0, 113.68], [117.0, 122.5], [124.0, 125.51], [128.0, 131.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.11, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.13, 1.64, 0.29, 3.59, 0.6, -0.05, 1.28, 0.13, 0.44, 1.52, 1.1, 1.15, 0.42, 4.46, 1.16, 1.71, 0.53, 0.75, 0.6, 5.1, 1.63, 0.99, 1.97, 1.46, 1.68, 5.5, 1.51, 3.04]} \ No newline at end of file diff --git a/annotations_filtered/wowXQ9ZrN1w_filtered.json b/annotations_filtered/wowXQ9ZrN1w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aba92f49f42fe2e180d0280f28b455f69926b2a2 --- /dev/null +++ b/annotations_filtered/wowXQ9ZrN1w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 34.96], [39.0, 39.77], [41.0, 44.58], [45.0, 60.83], [62.0, 66.14], [68.0, 69.65], [71.0, 70.68], [71.0, 72.72], [73.0, 72.94], [73.0, 76.72], [84.0, 89.41], [96.0, 96.92], [102.0, 105.78], [108.0, 108.23], [110.0, 110.44]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 76.04, 44.23, 57.72, 0.0, 0.0, 0.0, 0.0, 41.07, 33.96, 0.0, 34.67, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 57.97], ["speech", 8.99], ["musical instrument", 1.64]], null, null, null, null, null, [["music", 55.97], ["electric shaver, electric razor", 9.86], ["mains hum", 5.41]], [["noise", 23.44], ["mains hum", 13.59], ["music", 12.79]], null, [["music", 29.0], ["mains hum", 25.68], ["hum", 10.45]], null, null], "duration": [1.96, 0.77, 3.58, 15.83, 4.14, 1.65, -0.32, 1.72, -0.06, 3.72, 5.41, 0.92, 3.78, 0.23, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/wp4tgWYqjyw_filtered.json b/annotations_filtered/wp4tgWYqjyw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..128d4257b7e32927d2d8787e50e351da699bb198 --- /dev/null +++ b/annotations_filtered/wp4tgWYqjyw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.4], [26.0, 26.7], [39.0, 38.99]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.4, 0.7, -0.01]} \ No newline at end of file diff --git a/annotations_filtered/wpQ4R1jlFHs_filtered.json b/annotations_filtered/wpQ4R1jlFHs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1bc67522bfbf640a6e092ea1557875b73191b07c --- /dev/null +++ b/annotations_filtered/wpQ4R1jlFHs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.09], [21.0, 21.91], [23.0, 23.6], [26.0, 31.75], [33.0, 33.56], [35.0, 38.2], [39.0, 41.28], [43.0, 43.09], [44.0, 46.25], [47.0, 49.69], [52.0, 53.59], [59.0, 59.39], [65.0, 67.31], [68.0, 68.62], [72.0, 72.05], [80.0, 80.05], [82.0, 81.87], [84.0, 87.25], [94.0, 94.69], [102.0, 102.3], [104.0, 104.4], [106.0, 106.79], [110.0, 110.54], [111.0, 112.24], [114.0, 116.09], [120.0, 120.5], [122.0, 122.79], [123.0, 123.85], [133.0, 134.33], [137.0, 137.3], [140.0, 141.18], [144.0, 144.34], [146.0, 146.74], [148.0, 148.05]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.82, 0.0, 99.52, 65.79, 0.0, 40.68, 30.11, 0.0, 0.0, 51.5, 0.0, 0.0, 0.0, 0.0, 43.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 74.49], ["telephone", 8.42], ["dial tone", 8.3]], null, null, null, null, [["speech", 52.59], ["sidetone", 23.0], ["busy signal", 5.5]], [["speech", 36.98], ["music", 14.06], ["smash, crash", 6.22]], null, null, null, null, null, null, null, [["speech", 40.01], ["fart", 5.35], ["bee, wasp, etc.", 2.98]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.09, 0.91, 0.6, 5.75, 0.56, 3.2, 2.28, 0.09, 2.25, 2.69, 1.59, 0.39, 2.31, 0.62, 0.05, 0.05, -0.13, 3.25, 0.69, 0.3, 0.4, 0.79, 0.54, 1.24, 2.09, 0.5, 0.79, 0.85, 1.33, 0.3, 1.18, 0.34, 0.74, 0.05]} \ No newline at end of file diff --git a/annotations_filtered/wpci2WuWy4E_filtered.json b/annotations_filtered/wpci2WuWy4E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22eee6e6d91c2de7d61c17ca85d08faaad3389f4 --- /dev/null +++ b/annotations_filtered/wpci2WuWy4E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.27], [12.0, 14.52], [17.0, 17.24], [18.0, 19.35], [23.0, 24.68], [26.0, 26.72], [30.0, 29.66], [31.0, 31.73], [32.0, 33.44], [34.0, 64.29], [64.0, 78.87], [81.0, 81.68], [82.0, 105.29], [111.0, 115.52], [116.0, 121.56], [123.0, 127.58], [128.0, 128.85], [131.0, 136.8], [141.0, 141.51], [142.0, 143.7], [144.0, 153.05], [154.0, 155.46], [159.0, 159.29], [161.0, 161.33], [164.0, 163.95], [165.0, 168.15], [172.0, 173.33], [175.0, 175.88], [176.0, 190.51], [193.0, 195.86], [199.0, 220.35], [223.0, 224.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, true, false, false, true, true, false, false], "silence_prob": [34.52, 62.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.11, 0.0, 30.9, 30.25, 31.33, 30.72, 0.0, 29.8, 0.0, 0.0, 29.35, 0.0, 0.0, 0.0, 0.0, 30.43, 0.0, 0.0, 29.98, 39.37, 63.64, 0.0], "audiomae_on_audioset": [[["mains hum", 34.62], ["hum", 34.53], ["sidetone", 6.51]], null, null, null, null, null, null, null, null, null, [["music", 85.86], ["hum", 4.32], ["throbbing", 2.03]], null, [["music", 63.02], ["throbbing", 4.1], ["hum", 3.68]], [["music", 71.04], ["didgeridoo", 13.53], ["musical instrument", 2.67]], [["music", 75.94], ["synthesizer", 5.02], ["musical instrument", 2.99]], [["music", 51.16], ["didgeridoo", 14.48], ["speech", 9.1]], null, [["music", 24.89], ["noise", 24.51], ["mains hum", 7.17]], null, null, [["music", 47.24], ["hum", 9.69], ["throbbing", 7.97]], null, null, null, null, [["music", 30.14], ["hum", 12.07], ["throbbing", 8.22]], null, null, [["speech", 28.97], ["music", 9.69], ["hum", 7.84]], [["frog", 9.48], ["whale vocalization", 5.62], ["music", 4.88]], null, null], "duration": [7.27, 2.52, 0.24, 1.35, 1.68, 0.72, -0.34, 0.73, 1.44, 30.29, 14.87, 0.68, 23.29, 4.52, 5.56, 4.58, 0.85, 5.8, 0.51, 1.7, 9.05, 1.46, 0.29, 0.33, -0.05, 3.15, 1.33, 0.88, 14.51, 2.86, 21.35, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/wpxS1xSxUDY_filtered.json b/annotations_filtered/wpxS1xSxUDY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0aaa3ceaa206839d422716c4dffda5d03c6ba728 --- /dev/null +++ b/annotations_filtered/wpxS1xSxUDY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.73], [3.0, 3.75], [8.0, 11.23], [13.0, 14.5], [16.0, 17.2], [18.0, 18.87], [21.0, 21.98], [24.0, 24.93], [26.0, 26.42], [30.0, 29.74], [31.0, 32.36], [34.0, 83.49], [86.0, 86.34], [93.0, 94.64], [96.0, 97.9], [98.0, 99.96], [102.0, 102.88], [106.0, 106.84], [109.0, 109.19], [113.0, 114.0], [119.0, 120.8], [123.0, 124.17], [126.0, 127.2], [128.0, 129.25], [131.0, 132.04], [134.0, 154.57], [161.0, 161.15], [161.0, 164.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.73, 0.0, 41.01], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 39.62], ["mains hum", 21.05], ["throbbing", 10.62]], null, [["music", 60.93], ["electronic music", 3.26], ["synthesizer", 3.05]]], "duration": [0.73, 0.75, 3.23, 1.5, 1.2, 0.87, 0.98, 0.93, 0.42, -0.26, 1.36, 49.49, 0.34, 1.64, 1.9, 1.96, 0.88, 0.84, 0.19, 1.0, 1.8, 1.17, 1.2, 1.25, 1.04, 20.57, 0.15, 3.94]} \ No newline at end of file diff --git a/annotations_filtered/wq26A_QK4So_filtered.json b/annotations_filtered/wq26A_QK4So_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78f23df616a13f900562dd447f114ea3a25a3167 --- /dev/null +++ b/annotations_filtered/wq26A_QK4So_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.44], [4.0, 5.17], [6.0, 6.29], [7.0, 9.07], [12.0, 13.46], [16.0, 19.72], [24.0, 25.37], [28.0, 30.23], [33.0, 33.98], [36.0, 37.66], [40.0, 41.01], [43.0, 43.28], [45.0, 45.39], [46.0, 46.41], [47.0, 47.49], [49.0, 49.17], [51.0, 53.16], [54.0, 56.37], [59.0, 59.22], [60.0, 60.35], [61.0, 61.86], [62.0, 67.37], [70.0, 71.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 53.59, 0.0, 83.34, 0.0, 66.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.27, 63.21, 0.0, 0.0, 0.0, 67.13, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.44, 1.17, 0.29, 2.07, 1.46, 3.72, 1.37, 2.23, 0.98, 1.66, 1.01, 0.28, 0.39, 0.41, 0.49, 0.17, 2.16, 2.37, 0.22, 0.35, 0.86, 5.37, 1.86]} \ No newline at end of file diff --git a/annotations_filtered/wq3EAVEnW8Q_filtered.json b/annotations_filtered/wq3EAVEnW8Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d20703c3422ab13b6026f143e22987962c803c79 --- /dev/null +++ b/annotations_filtered/wq3EAVEnW8Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.31], [16.0, 19.82], [31.0, 31.62], [33.0, 33.81], [42.0, 42.6], [44.0, 46.26], [47.0, 46.82], [48.0, 49.13]], "keep_status": [false, true, false, false, false, false, false, false], "silence_prob": [0.0, 29.34, 0.0, 0.0, 0.0, 58.05, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 14.9], ["sound effect", 8.21], ["buzz", 6.36]], null, null, null, null, null, null], "duration": [0.31, 3.82, 0.62, 0.81, 0.6, 2.26, -0.18, 1.13]} \ No newline at end of file diff --git a/annotations_filtered/wqMPRiWvJEs_filtered.json b/annotations_filtered/wqMPRiWvJEs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af821e0ba17cb781acaa238af099ea8848f22184 --- /dev/null +++ b/annotations_filtered/wqMPRiWvJEs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 17.96], [18.0, 19.04], [22.0, 26.06], [30.0, 44.31], [47.0, 47.33], [51.0, 54.51], [58.0, 58.53], [65.0, 65.25], [72.0, 74.87], [79.0, 79.39], [87.0, 87.88], [94.0, 94.78], [95.0, 96.01], [96.0, 105.17], [110.0, 111.38], [113.0, 114.03], [115.0, 124.44], [126.0, 130.6], [134.0, 139.94], [145.0, 145.61], [147.0, 152.88], [156.0, 157.65], [158.0, 159.14], [162.0, 167.1]], "keep_status": [true, false, true, true, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [29.87, 0.0, 32.47, 32.69, 0.0, 31.25, 0.0, 0.0, 42.06, 0.0, 0.0, 0.0, 0.0, 31.44, 0.0, 0.0, 30.78, 30.72, 36.06, 0.0, 33.55, 0.0, 0.0, 34.79], "audiomae_on_audioset": [[["music", 59.43], ["didgeridoo", 3.23], ["explosion", 3.13]], null, [["music", 41.44], ["speech", 21.78], ["throbbing", 4.85]], [["music", 32.12], ["throbbing", 25.08], ["hum", 12.59]], null, [["mains hum", 28.37], ["hum", 22.97], ["music", 13.04]], null, null, [["music", 37.61], ["theremin", 21.27], ["whale vocalization", 3.99]], null, null, null, null, [["music", 41.99], ["speech", 29.99], ["animal", 3.31]], null, null, [["music", 55.71], ["speech", 13.36], ["didgeridoo", 2.77]], [["cattle, bovinae", 44.33], ["moo", 27.49], ["livestock, farm animals, working animals", 15.58]], [["throbbing", 30.73], ["hum", 29.91], ["mains hum", 13.43]], null, [["boing", 23.67], ["music", 22.42], ["speech", 18.51]], null, null, [["speech", 35.33], ["music", 16.29], ["hum", 13.53]]], "duration": [14.96, 1.04, 4.06, 14.31, 0.33, 3.51, 0.53, 0.25, 2.87, 0.39, 0.88, 0.78, 1.01, 9.17, 1.38, 1.03, 9.44, 4.6, 5.94, 0.61, 5.88, 1.65, 1.14, 5.1]} \ No newline at end of file diff --git a/annotations_filtered/wqj7Q2jOTc4_filtered.json b/annotations_filtered/wqj7Q2jOTc4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c536efbbdaed0ec1d13b48dbfe37788750920c21 --- /dev/null +++ b/annotations_filtered/wqj7Q2jOTc4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.93], [17.0, 18.17], [19.0, 23.19], [27.0, 27.85], [29.0, 30.84], [32.0, 33.49], [34.0, 35.7], [37.0, 40.59], [42.0, 42.89], [44.0, 46.85]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [52.39, 0.0, 60.7, 0.0, 0.0, 0.0, 0.0, 51.23, 0.0, 37.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 36.94], ["sine wave", 8.48], ["whale vocalization", 7.25]]], "duration": [2.93, 1.17, 4.19, 0.85, 1.84, 1.49, 1.7, 3.59, 0.89, 2.85]} \ No newline at end of file diff --git a/annotations_filtered/wqwUdp5-2D8_filtered.json b/annotations_filtered/wqwUdp5-2D8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce96859d2864c31834c2513ef3692c6258d1109f --- /dev/null +++ b/annotations_filtered/wqwUdp5-2D8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.84], [23.0, 23.06], [26.0, 27.48], [29.0, 29.27], [34.0, 37.39], [55.0, 55.43], [72.0, 72.79], [80.0, 81.5], [103.0, 103.08]], "keep_status": [false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 36.72, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 46.92], ["music", 9.45], ["sidetone", 9.0]], null, null, null, null], "duration": [1.84, 0.06, 1.48, 0.27, 3.39, 0.43, 0.79, 1.5, 0.08]} \ No newline at end of file diff --git a/annotations_filtered/wr4rZEPQ09Y_filtered.json b/annotations_filtered/wr4rZEPQ09Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e368f1b2c0103aa222b369e12050e7fe7a82441 --- /dev/null +++ b/annotations_filtered/wr4rZEPQ09Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 19.08], [20.0, 35.72], [37.0, 39.48], [40.0, 43.41], [45.0, 54.57], [55.0, 58.5], [60.0, 108.24], [109.0, 109.88]], "keep_status": [false, false, false, false, true, true, false, false], "silence_prob": [36.22, 31.25, 51.5, 51.07, 36.05, 44.75, 0.0, 0.0], "audiomae_on_audioset": [[["music", 56.0], ["throbbing", 15.55], ["speech", 3.37]], [["music", 34.77], ["hum", 31.22], ["mains hum", 10.95]], null, null, [["music", 44.29], ["speech", 15.31], ["hum", 5.21]], [["music", 40.33], ["speech", 13.73], ["theremin", 4.79]], null, null], "duration": [16.08, 15.72, 2.48, 3.41, 9.57, 3.5, 48.24, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/wr5-v7rYg70_filtered.json b/annotations_filtered/wr5-v7rYg70_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c691428761c724f3eabdeaed7776db6fa85193ba --- /dev/null +++ b/annotations_filtered/wr5-v7rYg70_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.99], [12.0, 13.22], [29.0, 30.0], [32.0, 32.54], [41.0, 41.54], [58.0, 58.36], [60.0, 70.5], [97.0, 97.73], [102.0, 104.28], [116.0, 116.26], [117.0, 119.45], [120.0, 121.39], [122.0, 126.0], [127.0, 130.42], [131.0, 132.14], [133.0, 134.01]], "keep_status": [true, false, false, false, false, false, true, false, false, false, true, false, false, true, false, false], "silence_prob": [42.67, 0.0, 0.0, 0.0, 0.0, 0.0, 32.29, 0.0, 31.24, 0.0, 40.62, 0.0, 100.0, 38.23, 0.0, 0.0], "audiomae_on_audioset": [[["music", 35.73], ["guitar", 14.82], ["musical instrument", 12.39]], null, null, null, null, null, [["music", 40.22], ["wind instrument, woodwind instrument", 13.27], ["musical instrument", 6.13]], null, [["music", 71.65], ["speech", 9.41], ["boing", 1.91]], null, [["speech", 38.55], ["knock", 9.26], ["whack, thwack", 7.25]], null, null, [["speech", 23.27], ["moo", 18.18], ["cattle, bovinae", 15.99]], null, null], "duration": [2.99, 1.22, 1.0, 0.54, 0.54, 0.36, 10.5, 0.73, 2.28, 0.26, 2.45, 1.39, 4.0, 3.42, 1.14, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/wrO6W6vTjV0_filtered.json b/annotations_filtered/wrO6W6vTjV0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..822d487bf9d1b5db26d65b548d919d915fd8284c --- /dev/null +++ b/annotations_filtered/wrO6W6vTjV0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 85.78], [89.0, 132.95], [134.0, 144.93]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 96.66], "audiomae_on_audioset": [null, null, null], "duration": [44.78, 43.95, 10.93]} \ No newline at end of file diff --git a/annotations_filtered/wrYcEEv737c_filtered.json b/annotations_filtered/wrYcEEv737c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af838e708a61f637315e24cd5b32eb9196a4cb83 --- /dev/null +++ b/annotations_filtered/wrYcEEv737c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.85], [3.0, 3.69], [5.0, 5.83], [16.0, 20.49], [22.0, 22.76], [24.0, 24.78], [34.0, 61.11], [64.0, 82.34], [85.0, 90.81], [91.0, 91.69], [104.0, 106.71], [109.0, 111.96], [113.0, 113.95], [115.0, 115.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 56.93, 0.0, 0.0, 59.07, 33.87, 63.21, 0.0, 34.01, 39.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 70.47], ["theremin", 4.67], ["synthesizer", 3.08]], null, null, [["theremin", 46.86], ["music", 33.53], ["musical instrument", 2.01]], [["music", 55.95], ["ambient music", 15.15], ["theremin", 7.59]], null, null], "duration": [0.85, 0.69, 0.83, 4.49, 0.76, 0.78, 27.11, 18.34, 5.81, 0.69, 2.71, 2.96, 0.95, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/wrkeOayCv6E_filtered.json b/annotations_filtered/wrkeOayCv6E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8787aa1204d4c3acdab9eaae67d90fe0dc7e63e6 --- /dev/null +++ b/annotations_filtered/wrkeOayCv6E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 27.62], [33.0, 42.62], [44.0, 45.18], [48.0, 67.85], [71.0, 73.47], [74.0, 74.61], [76.0, 80.47], [81.0, 82.21], [83.0, 94.88], [97.0, 98.41], [99.0, 103.13], [105.0, 115.94], [117.0, 118.67], [119.0, 119.4], [120.0, 120.73], [124.0, 125.24], [132.0, 135.13], [137.0, 138.6], [140.0, 140.27], [142.0, 149.99], [153.0, 153.15]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.37, 33.0, 0.0, 31.51, 53.78, 0.0, 47.98, 0.0, 36.94, 0.0, 33.73, 36.74, 0.0, 0.0, 0.0, 0.0, 54.23, 0.0, 0.0, 36.11, 0.0], "audiomae_on_audioset": [[["music", 63.75], ["mains hum", 6.4], ["hum", 5.58]], [["buzz", 26.11], ["music", 21.62], ["speech", 18.31]], null, [["music", 23.82], ["hum", 14.83], ["throbbing", 8.07]], null, null, [["speech", 65.37], ["eruption", 4.16], ["gurgling", 2.66]], null, [["moo", 39.6], ["cattle, bovinae", 38.78], ["livestock, farm animals, working animals", 10.69]], null, [["shofar", 42.83], ["wind instrument, woodwind instrument", 28.64], ["music", 6.66]], [["quack", 44.43], ["duck", 22.18], ["music", 19.92]], null, null, null, null, null, null, null, [["quack", 44.08], ["duck", 16.59], ["music", 15.13]], null], "duration": [17.62, 9.62, 1.18, 19.85, 2.47, 0.61, 4.47, 1.21, 11.88, 1.41, 4.13, 10.94, 1.67, 0.4, 0.73, 1.24, 3.13, 1.6, 0.27, 7.99, 0.15]} \ No newline at end of file diff --git a/annotations_filtered/wrmwJx6kYKc_filtered.json b/annotations_filtered/wrmwJx6kYKc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d1143cccab09d551e31336e4f7cab75e2e08eff --- /dev/null +++ b/annotations_filtered/wrmwJx6kYKc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 165.69]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [146.69]} \ No newline at end of file diff --git a/annotations_filtered/wsFQrTAEs7A_filtered.json b/annotations_filtered/wsFQrTAEs7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3dbad93da0efb0214529c3bb09aec8a9d0419245 --- /dev/null +++ b/annotations_filtered/wsFQrTAEs7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.88], [19.0, 20.01], [21.0, 22.57], [23.0, 24.06], [25.0, 28.88], [35.0, 35.33], [51.0, 54.35], [71.0, 75.1], [85.0, 89.99], [93.0, 101.8], [109.0, 108.89], [114.0, 114.83], [117.0, 117.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.82, 0.0, 0.0, 0.0, 41.05, 0.0, 33.3, 32.0, 32.33, 33.12, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 61.54], ["musical instrument", 11.42], ["brass instrument", 5.5]], null, null, null, [["music", 54.73], ["musical instrument", 14.65], ["speech", 5.08]], null, [["music", 59.21], ["speech", 9.53], ["didgeridoo", 3.3]], [["music", 53.02], ["theremin", 13.48], ["didgeridoo", 8.98]], [["music", 79.74], ["musical instrument", 5.21], ["synthesizer", 2.4]], [["theremin", 53.78], ["music", 41.66], ["musical instrument", 1.0]], null, null, null], "duration": [2.88, 1.01, 1.57, 1.06, 3.88, 0.33, 3.35, 4.1, 4.99, 8.8, -0.11, 0.83, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/wsIybRQaDE4_filtered.json b/annotations_filtered/wsIybRQaDE4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59cd325c64deaba7cdfff997ef1604f03d6a25fa --- /dev/null +++ b/annotations_filtered/wsIybRQaDE4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.79], [8.0, 38.03], [40.0, 40.69], [41.0, 52.69], [56.0, 60.03], [64.0, 66.77], [69.0, 69.28], [70.0, 77.23], [78.0, 81.95], [84.0, 90.34], [92.0, 91.88], [93.0, 95.22], [97.0, 107.38]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.62, 33.5, 39.5, 0.0, 58.89, 50.02, 44.93, 0.0, 57.97, 52.1], "audiomae_on_audioset": [null, null, null, [["music", 75.63], ["orchestra", 2.2], ["musical instrument", 2.04]], [["music", 58.15], ["theremin", 10.23], ["choir", 4.43]], [["music", 73.94], ["theremin", 5.45], ["ambient music", 4.29]], null, null, null, [["music", 39.67], ["whale vocalization", 10.45], ["gong", 8.55]], null, null, null], "duration": [0.79, 30.03, 0.69, 11.69, 4.03, 2.77, 0.28, 7.23, 3.95, 6.34, -0.12, 2.22, 10.38]} \ No newline at end of file diff --git a/annotations_filtered/wsQJVAzezrc_filtered.json b/annotations_filtered/wsQJVAzezrc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e5566b043a0a9b3f2eca3123492c2ef26a6b356 --- /dev/null +++ b/annotations_filtered/wsQJVAzezrc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.78], [7.0, 12.11], [12.0, 12.68], [13.0, 19.79], [28.0, 28.41], [30.0, 30.87], [40.0, 39.87]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 50.06, 0.0, 42.13, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 60.25], ["vehicle", 5.73], ["radio", 4.72]], null, null, null], "duration": [-0.22, 5.11, 0.68, 6.79, 0.41, 0.87, -0.13]} \ No newline at end of file diff --git a/annotations_filtered/wsSlB31dwiE_filtered.json b/annotations_filtered/wsSlB31dwiE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..847d2a4d9bad483355b571c3f374129ef1c58a72 --- /dev/null +++ b/annotations_filtered/wsSlB31dwiE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.84], [15.0, 15.63], [20.0, 22.22], [24.0, 25.19], [28.0, 29.37], [41.0, 43.28], [44.0, 83.69], [88.0, 105.39]], "keep_status": [false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 81.53, 0.0, 0.0, 37.36, 0.0, 31.44], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 10.75], ["speech", 8.45], ["mains hum", 7.73]], null, [["speech", 81.84], ["fart", 4.21], ["explosion", 3.18]]], "duration": [0.84, 0.63, 2.22, 1.19, 1.37, 2.28, 39.69, 17.39]} \ No newline at end of file diff --git a/annotations_filtered/wsYNpHaKJIc_filtered.json b/annotations_filtered/wsYNpHaKJIc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ee82d04f008f464444f3fd57efc001ba2c9cff1 --- /dev/null +++ b/annotations_filtered/wsYNpHaKJIc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.13], [15.0, 16.39], [17.0, 23.48], [28.0, 40.71], [41.0, 42.28], [44.0, 44.32], [46.0, 46.95], [50.0, 51.71], [52.0, 52.41], [53.0, 57.28], [59.0, 61.21], [64.0, 74.66], [78.0, 77.84], [81.0, 81.9], [87.0, 91.08], [93.0, 93.65], [95.0, 96.25], [98.0, 102.07], [103.0, 103.94], [106.0, 108.53], [112.0, 112.38], [114.0, 114.71], [116.0, 117.91], [121.0, 122.82], [125.0, 131.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 64.07, 81.53, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 99.93, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.13, 1.39, 6.48, 12.71, 1.28, 0.32, 0.95, 1.71, 0.41, 4.28, 2.21, 10.66, -0.16, 0.9, 4.08, 0.65, 1.25, 4.07, 0.94, 2.53, 0.38, 0.71, 1.91, 1.82, 6.23]} \ No newline at end of file diff --git a/annotations_filtered/wsl5fS7KGZc_filtered.json b/annotations_filtered/wsl5fS7KGZc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/wsl5fS7KGZc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/wsooQlbj934_filtered.json b/annotations_filtered/wsooQlbj934_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fb0bed956a3c5065ad665cd849f1911dbdb769f --- /dev/null +++ b/annotations_filtered/wsooQlbj934_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 18.28], [19.0, 33.88], [41.0, 63.07], [64.0, 76.03], [78.0, 79.73], [82.0, 91.86], [94.0, 94.47], [96.0, 96.7], [99.0, 100.18], [101.0, 102.25], [104.0, 105.66], [109.0, 113.68], [118.0, 127.94], [129.0, 131.4], [134.0, 142.6], [144.0, 144.64], [145.0, 155.14], [156.0, 157.37], [160.0, 162.18], [163.0, 163.76], [165.0, 170.41], [171.0, 174.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, true, false, true, false, true, true], "silence_prob": [29.84, 58.72, 40.04, 34.49, 0.0, 34.22, 0.0, 0.0, 0.0, 0.0, 0.0, 41.24, 31.79, 33.8, 37.28, 0.0, 36.9, 0.0, 41.32, 0.0, 39.33, 44.75], "audiomae_on_audioset": [[["hum", 33.68], ["music", 30.13], ["mains hum", 11.54]], null, [["hum", 50.93], ["mains hum", 24.82], ["throbbing", 8.56]], [["speech", 48.87], ["noise", 13.31], ["whack, thwack", 8.59]], null, [["hum", 50.05], ["mains hum", 23.39], ["buzz", 6.36]], null, null, null, null, null, [["speech", 37.21], ["whale vocalization", 31.2], ["sidetone", 6.48]], [["explosion", 22.2], ["speech", 15.55], ["burst, pop", 10.9]], [["whale vocalization", 44.81], ["livestock, farm animals, working animals", 9.23], ["cattle, bovinae", 6.5]], [["quack", 13.25], ["rumble", 13.08], ["duck", 11.7]], null, [["sidetone", 32.01], ["speech", 29.59], ["throbbing", 4.99]], null, [["whale vocalization", 11.87], ["hum", 11.1], ["rumble", 9.45]], null, [["speech", 30.73], ["hum", 17.59], ["music", 11.31]], [["gong", 26.56], ["music", 15.01], ["sonar", 7.22]]], "duration": [13.28, 14.88, 22.07, 12.03, 1.73, 9.86, 0.47, 0.7, 1.18, 1.25, 1.66, 4.68, 9.94, 2.4, 8.6, 0.64, 10.14, 1.37, 2.18, 0.76, 5.41, 3.88]} \ No newline at end of file diff --git a/annotations_filtered/wt0_m5mUsbo_filtered.json b/annotations_filtered/wt0_m5mUsbo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..136220d321d35fa147eed554aea1f88d644638df --- /dev/null +++ b/annotations_filtered/wt0_m5mUsbo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.1], [5.0, 6.08], [9.0, 11.08], [17.0, 16.8], [26.0, 27.85], [34.0, 35.24], [42.0, 43.39], [62.0, 64.07], [68.0, 68.79], [69.0, 70.02], [71.0, 71.93], [74.0, 73.68], [75.0, 75.73], [79.0, 80.77], [82.0, 82.53], [89.0, 94.47]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 43.56, 0.0, 0.0, 0.0, 0.0, 33.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.39], "audiomae_on_audioset": [null, null, [["mosquito", 28.19], ["fly, housefly", 19.38], ["moo", 10.5]], null, null, null, null, [["speech", 78.37], ["radio", 5.89], ["scratching (performance technique)", 3.57]], null, null, null, null, null, null, null, null], "duration": [1.1, 1.08, 2.08, -0.2, 1.85, 1.24, 1.39, 2.07, 0.79, 1.02, 0.93, -0.32, 0.73, 1.77, 0.53, 5.47]} \ No newline at end of file diff --git a/annotations_filtered/wt0klpk3tBA_filtered.json b/annotations_filtered/wt0klpk3tBA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0477a58b77df3b653185dcf6707ab1b18a8b2ff --- /dev/null +++ b/annotations_filtered/wt0klpk3tBA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.01], [10.0, 10.25], [14.0, 14.88], [16.0, 16.98], [23.0, 24.38], [27.0, 29.84], [31.0, 43.61], [44.0, 43.7], [48.0, 60.47], [62.0, 64.05], [66.0, 66.68], [73.0, 73.35], [76.0, 76.35], [78.0, 78.8], [81.0, 83.29], [84.0, 84.7], [85.0, 89.06], [100.0, 104.62], [106.0, 113.32], [114.0, 125.79], [128.0, 128.63], [130.0, 130.5], [132.0, 134.47], [141.0, 143.78], [145.0, 148.27], [149.0, 148.95], [149.0, 156.81], [162.0, 162.95], [164.0, 165.32], [166.0, 168.15], [170.0, 170.34], [171.0, 175.86], [177.0, 178.51], [181.0, 181.89], [183.0, 183.83], [187.0, 193.83], [194.0, 199.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.14, 38.19, 0.0, 91.47, 78.21, 0.0, 0.0, 0.0, 0.0, 96.04, 0.0, 93.91, 40.07, 32.44, 30.97, 0.0, 0.0, 61.97, 66.03, 90.6, 0.0, 93.91, 0.0, 0.0, 96.42, 0.0, 99.26, 0.0, 0.0, 0.0, 95.78, 94.22], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 44.0], ["throbbing", 19.18], ["mains hum", 17.4]], [["music", 39.52], ["speech", 27.65], ["electronic music", 4.93]], null, null, null, null, null, null, null, null, null, null, [["speech", 17.93], ["hum", 13.42], ["music", 7.53]], [["hum", 59.3], ["mains hum", 16.16], ["throbbing", 15.83]], [["speech", 26.34], ["livestock, farm animals, working animals", 19.22], ["cattle, bovinae", 8.76]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.01, 0.25, 0.88, 0.98, 1.38, 2.84, 12.61, -0.3, 12.47, 2.05, 0.68, 0.35, 0.35, 0.8, 2.29, 0.7, 4.06, 4.62, 7.32, 11.79, 0.63, 0.5, 2.47, 2.78, 3.27, -0.05, 7.81, 0.95, 1.32, 2.15, 0.34, 4.86, 1.51, 0.89, 0.83, 6.83, 5.61]} \ No newline at end of file diff --git a/annotations_filtered/wtMDZyMGKe0_filtered.json b/annotations_filtered/wtMDZyMGKe0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ade1e7acb3b6f159161eea13ae21f731fc7c47bd --- /dev/null +++ b/annotations_filtered/wtMDZyMGKe0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 30.91], [32.0, 33.52], [34.0, 33.71], [34.0, 40.73], [48.0, 48.22], [49.0, 49.59], [51.0, 56.12], [60.0, 84.45], [92.0, 92.33], [92.0, 121.44], [125.0, 125.96]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [30.54, 0.0, 0.0, 56.55, 0.0, 0.0, 31.89, 31.02, 0.0, 30.3, 0.0], "audiomae_on_audioset": [[["music", 46.81], ["swing music", 20.06], ["trombone", 5.27]], null, null, null, null, null, [["music", 37.14], ["drum", 10.48], ["drum kit", 8.08]], [["music", 64.62], ["trombone", 11.07], ["swing music", 7.0]], null, [["music", 56.12], ["swing music", 16.62], ["speech", 9.19]], null], "duration": [14.91, 1.52, -0.29, 6.73, 0.22, 0.59, 5.12, 24.45, 0.33, 29.44, 0.96]} \ No newline at end of file diff --git a/annotations_filtered/wu-RfHKCK7Y_filtered.json b/annotations_filtered/wu-RfHKCK7Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/wu-RfHKCK7Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/wuZwdLfxTQ8_filtered.json b/annotations_filtered/wuZwdLfxTQ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7174e0adacc55a2ddaa395eb77503e6445a590a7 --- /dev/null +++ b/annotations_filtered/wuZwdLfxTQ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.59], [3.0, 5.19], [6.0, 7.13], [10.0, 10.32], [12.0, 13.42], [21.0, 21.19], [23.0, 23.08], [23.0, 23.94], [32.0, 36.32], [37.0, 40.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.59, 82.79], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.59, 2.19, 1.13, 0.32, 1.42, 0.19, 0.08, 0.94, 4.32, 3.91]} \ No newline at end of file diff --git a/annotations_filtered/wufYHJkbl7k_filtered.json b/annotations_filtered/wufYHJkbl7k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..415bda5d8821b8f416b9128c4035bbf98d2ff7f6 --- /dev/null +++ b/annotations_filtered/wufYHJkbl7k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.55], [15.0, 14.84], [20.0, 23.89], [41.0, 42.53], [43.0, 44.0], [46.0, 46.36], [47.0, 48.42], [50.0, 51.36], [55.0, 55.66], [57.0, 56.98], [58.0, 57.96], [65.0, 64.81], [67.0, 67.39], [80.0, 80.76], [84.0, 84.99], [92.0, 93.24], [96.0, 95.67], [97.0, 98.69], [100.0, 100.25], [102.0, 102.76], [104.0, 104.45], [108.0, 109.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.55, -0.16, 3.89, 1.53, 1.0, 0.36, 1.42, 1.36, 0.66, -0.02, -0.04, -0.19, 0.39, 0.76, 0.99, 1.24, -0.33, 1.69, 0.25, 0.76, 0.45, 1.81]} \ No newline at end of file diff --git a/annotations_filtered/wur5ljnTCzQ_filtered.json b/annotations_filtered/wur5ljnTCzQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd12ab6f5d609871aefafc03f2bd72e8a735180c --- /dev/null +++ b/annotations_filtered/wur5ljnTCzQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [1.0, 2.93], [9.0, 30.7], [33.0, 37.2], [39.0, 52.08], [58.0, 58.82], [61.0, 68.88], [71.0, 72.37], [77.0, 81.01], [84.0, 84.21], [85.0, 90.66], [96.0, 106.29], [113.0, 114.27], [121.0, 124.56]], "keep_status": [false, false, true, false, true, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 31.08, 32.41, 30.98, 0.0, 31.38, 0.0, 31.34, 0.0, 30.37, 30.63, 0.0, 31.96], "audiomae_on_audioset": [null, null, [["music", 34.61], ["speech", 18.01], ["foghorn", 6.44]], [["music", 55.45], ["theremin", 8.67], ["speech", 7.52]], [["music", 37.31], ["speech", 25.03], ["didgeridoo", 5.11]], null, [["music", 47.15], ["fart", 6.78], ["speech", 5.48]], null, [["music", 83.08], ["theremin", 2.77], ["musical instrument", 2.64]], null, [["music", 72.06], ["theremin", 4.24], ["musical instrument", 3.86]], [["quack", 46.4], ["music", 16.84], ["speech", 10.68]], null, [["speech", 47.64], ["run", 7.54], ["cattle, bovinae", 5.18]]], "duration": [0.5, 1.93, 21.7, 4.2, 13.08, 0.82, 7.88, 1.37, 4.01, 0.21, 5.66, 10.29, 1.27, 3.56]} \ No newline at end of file diff --git a/annotations_filtered/wuzbUsy6snc_filtered.json b/annotations_filtered/wuzbUsy6snc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f616fc37e443f9f67bde32d0872f62ee48c306e8 --- /dev/null +++ b/annotations_filtered/wuzbUsy6snc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.69], [16.0, 16.12], [18.0, 19.99], [21.0, 22.3], [23.0, 23.16], [25.0, 25.69], [27.0, 28.16], [29.0, 31.95], [38.0, 39.09], [42.0, 43.73], [50.0, 56.84], [61.0, 61.6], [65.0, 86.27], [92.0, 94.88], [96.0, 96.11], [96.0, 105.98]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.48, 0.0, 0.0, 29.75, 0.0, 31.89, 30.17, 0.0, 30.48], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 55.14], ["musical instrument", 6.73], ["guitar", 5.26]], null, null, [["music", 71.85], ["yodeling", 3.43], ["swing music", 2.13]], null, [["music", 53.34], ["synthesizer", 8.18], ["siren", 6.27]], [["music", 60.8], ["synthetic singing", 5.53], ["saxophone", 4.35]], null, [["music", 60.38], ["swing music", 8.76], ["harmonica", 3.17]]], "duration": [0.69, 0.12, 1.99, 1.3, 0.16, 0.69, 1.16, 2.95, 1.09, 1.73, 6.84, 0.6, 21.27, 2.88, 0.11, 9.98]} \ No newline at end of file diff --git a/annotations_filtered/wvPmP4xTruI_filtered.json b/annotations_filtered/wvPmP4xTruI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..894be2d6e35ea14c74aa2051b5f46688efa81e22 --- /dev/null +++ b/annotations_filtered/wvPmP4xTruI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [3.0, 4.04], [5.0, 5.9], [7.0, 7.13], [11.0, 11.84], [15.0, 16.5], [23.0, 23.41], [30.0, 31.38], [34.0, 34.77], [35.0, 35.21], [35.0, 35.46], [35.0, 35.55], [36.0, 37.62], [41.0, 41.37], [47.0, 48.51], [50.0, 50.77], [51.0, 52.1], [55.0, 55.78], [63.0, 68.86], [71.0, 71.73], [72.0, 76.64], [79.0, 80.05], [94.0, 94.98], [97.0, 97.02], [102.0, 102.76], [104.0, 105.33], [106.0, 106.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.25, 0.0, 75.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 1.04, 0.9, 0.13, 0.84, 1.5, 0.41, 1.38, 0.77, 0.21, 0.46, 0.55, 1.62, 0.37, 1.51, 0.77, 1.1, 0.78, 5.86, 0.73, 4.64, 1.05, 0.98, 0.02, 0.76, 1.33, 0.93]} \ No newline at end of file diff --git a/annotations_filtered/wvVrDGmqHjI_filtered.json b/annotations_filtered/wvVrDGmqHjI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3652e0fe23f53a6227185cb3827b1e68c0eb30fd --- /dev/null +++ b/annotations_filtered/wvVrDGmqHjI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.22], [8.0, 9.17], [11.0, 17.93], [19.0, 19.8], [23.0, 25.03], [27.0, 28.86], [32.0, 61.13], [66.0, 66.39], [67.0, 67.14], [72.0, 72.42], [73.0, 73.4], [75.0, 75.63], [78.0, 78.76], [82.0, 82.95], [84.0, 84.0], [87.0, 87.47], [89.0, 94.39], [100.0, 101.78], [106.0, 107.45], [109.0, 110.93], [111.0, 110.96], [111.0, 112.67], [115.0, 121.98]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 43.28, 0.0, 65.44, 0.0, 31.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.02, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48], "audiomae_on_audioset": [null, null, [["speech", 12.22], ["music", 10.77], ["fart", 5.59]], null, null, null, [["speech", 30.86], ["fly, housefly", 11.96], ["insect", 10.2]], null, null, null, null, null, null, null, null, null, [["whack, thwack", 30.58], ["thunk", 21.77], ["speech", 9.88]], null, null, null, null, null, null], "duration": [1.22, 1.17, 6.93, 0.8, 2.03, 1.86, 29.13, 0.39, 0.14, 0.42, 0.4, 0.63, 0.76, 0.95, 0.0, 0.47, 5.39, 1.78, 1.45, 1.93, -0.04, 1.67, 6.98]} \ No newline at end of file diff --git a/annotations_filtered/wwDCSzZx37I_filtered.json b/annotations_filtered/wwDCSzZx37I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a65a03616df5798d493e21140cfb6f83698dea01 --- /dev/null +++ b/annotations_filtered/wwDCSzZx37I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.14], [11.0, 13.61], [16.0, 16.75], [17.0, 19.65], [40.0, 40.09], [43.0, 43.63], [47.0, 47.88], [56.0, 56.0], [58.0, 58.78], [68.0, 68.37], [85.0, 85.14], [86.0, 86.26], [87.0, 87.69], [91.0, 91.77], [92.0, 99.1]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.52, 0.0, 34.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.36], "audiomae_on_audioset": [null, [["speech", 21.11], ["beatboxing", 19.58], ["music", 11.17]], null, [["music", 29.42], ["electric shaver, electric razor", 8.66], ["speech", 7.68]], null, null, null, null, null, null, null, null, null, null, [["speech", 57.49], ["music", 8.05], ["hum", 6.01]]], "duration": [0.14, 2.61, 0.75, 2.65, 0.09, 0.63, 0.88, 0.0, 0.78, 0.37, 0.14, 0.26, 0.69, 0.77, 7.1]} \ No newline at end of file diff --git a/annotations_filtered/wwLnrdD4l3U_filtered.json b/annotations_filtered/wwLnrdD4l3U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae2e3dbe130add2c8530be5acc88523794bf99ea --- /dev/null +++ b/annotations_filtered/wwLnrdD4l3U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.4], [5.0, 6.61], [8.0, 8.6], [19.0, 18.82], [24.0, 28.12], [30.0, 30.89], [31.0, 40.59], [45.0, 45.39], [49.0, 90.27], [91.0, 95.17], [97.0, 97.12], [100.0, 100.35], [108.0, 108.62], [113.0, 112.89], [113.0, 115.15], [115.0, 117.15], [119.0, 119.47], [130.0, 132.17]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 50.11, 0.0, 37.76, 0.0, 0.0, 32.45, 0.0, 0.0, 0.0, 0.0, 33.81, 32.57, 0.0, 45.36], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 90.43], ["pig", 1.62], ["animal", 1.08]], null, null, [["speech", 54.91], ["inside, small room", 5.73], ["whack, thwack", 4.3]], null, null, null, null, [["speech", 65.84], ["inside, small room", 2.81], ["music", 2.51]], [["speech", 27.56], ["thunk", 13.04], ["gunshot, gunfire", 7.48]], null, [["speech", 27.52], ["whale vocalization", 14.45], ["cattle, bovinae", 7.42]]], "duration": [0.4, 1.61, 0.6, -0.18, 4.12, 0.89, 9.59, 0.39, 41.27, 4.17, 0.12, 0.35, 0.62, -0.11, 2.15, 2.15, 0.47, 2.17]} \ No newline at end of file diff --git a/annotations_filtered/ww_lUn3jUoA_filtered.json b/annotations_filtered/ww_lUn3jUoA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4116a245bb0d9a7e1a7982faeff5067b88e0d332 --- /dev/null +++ b/annotations_filtered/ww_lUn3jUoA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.86], [9.0, 9.31], [10.0, 10.03], [10.0, 10.88], [17.0, 17.2], [18.0, 19.9], [21.0, 21.84], [23.0, 23.55], [26.0, 26.91], [39.0, 40.32], [41.0, 42.3], [44.0, 45.79], [48.0, 48.27], [49.0, 49.62], [50.0, 54.23], [55.0, 57.05], [58.0, 58.65], [60.0, 60.35], [63.0, 63.59], [65.0, 65.99], [72.0, 72.62], [73.0, 75.09], [76.0, 80.77], [82.0, 83.1], [84.0, 86.9], [89.0, 91.86], [94.0, 94.51], [95.0, 100.9], [102.0, 103.13], [103.0, 105.02], [106.0, 106.93], [109.0, 110.88], [118.0, 119.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.76, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.0, 98.86, 0.0, 99.94, 76.53, 0.0, 62.37, 0.0, 81.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.86, 0.31, 0.03, 0.88, 0.2, 1.9, 0.84, 0.55, 0.91, 1.32, 1.3, 1.79, 0.27, 0.62, 4.23, 2.05, 0.65, 0.35, 0.59, 0.99, 0.62, 2.09, 4.77, 1.1, 2.9, 2.86, 0.51, 5.9, 1.13, 2.02, 0.93, 1.88, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/wwnqJH8OF-I_filtered.json b/annotations_filtered/wwnqJH8OF-I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcd83984d9216201420f21800fd76d6c5b69ade1 --- /dev/null +++ b/annotations_filtered/wwnqJH8OF-I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.33], [12.0, 11.87], [12.0, 11.99], [18.0, 18.39], [19.0, 20.39], [28.0, 30.37], [47.0, 47.76], [53.0, 53.27], [56.0, 57.05], [60.0, 60.05], [61.0, 61.47], [66.0, 70.07], [72.0, 81.85], [83.0, 87.59], [92.0, 92.77], [96.0, 98.12], [102.0, 102.73], [107.0, 107.67], [108.0, 108.51], [116.0, 115.6], [119.0, 122.23], [123.0, 123.42], [130.0, 132.53], [145.0, 145.07], [147.0, 150.62], [157.0, 157.84], [158.0, 158.87]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 30.8, 0.0, 0.0, 0.0, 0.0, 0.0, 58.13, 87.55, 41.6, 0.0, 66.03, 0.0, 0.0, 0.0, 0.0, 48.56, 0.0, 40.28, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 58.64], ["groan", 5.8], ["music", 4.3]], null, null, null, null, null, null, null, [["music", 40.04], ["whack, thwack", 6.12], ["fart", 5.92]], null, null, null, null, null, null, [["speech", 48.63], ["ding-dong", 22.55], ["music", 11.79]], null, [["moo", 32.69], ["cattle, bovinae", 30.33], ["livestock, farm animals, working animals", 7.91]], null, null, null, null], "duration": [0.33, -0.13, -0.01, 0.39, 1.39, 2.37, 0.76, 0.27, 1.05, 0.05, 0.47, 4.07, 9.85, 4.59, 0.77, 2.12, 0.73, 0.67, 0.51, -0.4, 3.23, 0.42, 2.53, 0.07, 3.62, 0.84, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/wwoxXiyWf7A_filtered.json b/annotations_filtered/wwoxXiyWf7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b3aec4ef212860d980e412c2e0b729df034d890 --- /dev/null +++ b/annotations_filtered/wwoxXiyWf7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.3], [17.0, 26.72], [27.0, 30.38], [34.0, 34.3], [39.0, 39.34], [42.0, 43.5], [46.0, 46.74], [49.0, 49.54], [50.0, 50.21], [51.0, 53.47], [54.0, 57.1], [59.0, 59.68], [60.0, 60.98], [62.0, 67.22], [67.0, 67.37], [67.0, 71.05], [72.0, 74.11], [75.0, 77.21], [78.0, 81.23], [83.0, 83.35], [84.0, 84.35], [91.0, 91.13], [98.0, 98.42], [100.0, 100.21], [102.0, 102.19], [104.0, 107.16], [113.0, 113.1], [116.0, 116.24], [119.0, 118.81], [133.0, 132.93]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, true, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 30.47, 34.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.35, 41.56, 0.0, 0.0, 41.85, 0.0, 35.95, 32.36, 77.03, 45.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.76, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 71.81], ["music", 5.21], ["buzz", 5.18]], [["speech", 82.82], ["music", 4.67], ["dial tone", 1.41]], null, null, null, null, null, null, [["mosquito", 25.4], ["music", 16.92], ["fly, housefly", 9.0]], [["moo", 39.64], ["cattle, bovinae", 27.7], ["livestock, farm animals, working animals", 11.87]], null, null, [["music", 22.03], ["theremin", 14.38], ["speech", 13.21]], null, [["animal", 22.5], ["domestic animals, pets", 13.44], ["dog", 11.8]], [["whale vocalization", 9.42], ["whoosh, swoosh, swish", 6.9], ["scrape", 6.22]], null, [["speech", 39.27], ["sidetone", 30.19], ["telephone", 6.43]], null, null, null, null, null, null, [["music", 58.75], ["electronic music", 6.9], ["throbbing", 4.27]], null, null, null, null], "duration": [1.3, 9.72, 3.38, 0.3, 0.34, 1.5, 0.74, 0.54, 0.21, 2.47, 3.1, 0.68, 0.98, 5.22, 0.37, 4.05, 2.11, 2.21, 3.23, 0.35, 0.35, 0.13, 0.42, 0.21, 0.19, 3.16, 0.1, 0.24, -0.19, -0.07]} \ No newline at end of file diff --git a/annotations_filtered/wwwhtUdGOVM_filtered.json b/annotations_filtered/wwwhtUdGOVM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e711fd6333db3f83484455371ff9eda0d0344d0c --- /dev/null +++ b/annotations_filtered/wwwhtUdGOVM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.17], [21.0, 22.15], [23.0, 23.99], [25.0, 25.41], [28.0, 27.94], [29.0, 30.2], [32.0, 33.18], [34.0, 35.78], [37.0, 39.06], [40.0, 41.59], [42.0, 94.74], [96.0, 97.56], [99.0, 99.01], [100.0, 102.34], [106.0, 109.09], [111.0, 112.02], [113.0, 116.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.09, 0.0, 0.0, 0.0, 0.0, 100.0, 94.81, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.17, 1.15, 0.99, 0.41, -0.06, 1.2, 1.18, 1.78, 2.06, 1.59, 52.74, 1.56, 0.01, 2.34, 3.09, 1.02, 3.5]} \ No newline at end of file diff --git a/annotations_filtered/wwxjFuoLYzQ_filtered.json b/annotations_filtered/wwxjFuoLYzQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f72b31d560931e77f8b5279c82645dee9daf09d5 --- /dev/null +++ b/annotations_filtered/wwxjFuoLYzQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.16], [9.0, 9.49], [17.0, 26.05], [26.0, 28.61], [41.0, 41.42], [42.0, 51.48], [52.0, 66.97], [71.0, 83.29], [84.0, 99.72], [102.0, 109.98], [111.0, 112.4], [114.0, 114.84], [119.0, 123.4], [124.0, 127.21], [128.0, 136.22], [147.0, 151.51], [155.0, 155.76], [158.0, 164.44], [167.0, 169.37]], "keep_status": [false, false, false, false, false, true, true, true, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 29.33, 30.31, 0.0, 29.02, 29.27, 28.81, 29.11, 29.2, 0.0, 0.0, 29.42, 29.81, 29.96, 30.56, 0.0, 29.23, 29.95], "audiomae_on_audioset": [null, null, [["music", 56.24], ["speech", 14.53], ["throbbing", 5.96]], [["music", 37.04], ["hum", 18.57], ["throbbing", 18.12]], null, [["music", 41.46], ["vehicle", 12.07], ["speech", 7.77]], [["vehicle", 35.89], ["car", 20.99], ["race car, auto racing", 12.06]], [["buzz", 34.79], ["music", 11.52], ["vehicle", 10.16]], [["music", 57.25], ["dubstep", 12.31], ["electronic music", 12.18]], [["music", 38.33], ["hum", 18.36], ["mains hum", 17.13]], null, null, [["music", 32.54], ["throbbing", 17.45], ["electronic music", 5.38]], [["music", 78.22], ["speech", 8.38], ["throbbing", 1.1]], [["music", 61.45], ["throbbing", 6.44], ["speech", 4.51]], [["throbbing", 40.37], ["music", 31.76], ["hum", 15.57]], null, [["music", 61.37], ["vehicle", 8.32], ["car", 7.56]], [["explosion", 17.29], ["music", 14.54], ["fireworks", 13.01]]], "duration": [1.16, 0.49, 9.05, 2.61, 0.42, 9.48, 14.97, 12.29, 15.72, 7.98, 1.4, 0.84, 4.4, 3.21, 8.22, 4.51, 0.76, 6.44, 2.37]} \ No newline at end of file diff --git a/annotations_filtered/wwzyveUAS80_filtered.json b/annotations_filtered/wwzyveUAS80_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc101d8aff2ab8c71a68beb07da9490b642653cf --- /dev/null +++ b/annotations_filtered/wwzyveUAS80_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 35.95], [38.0, 41.15], [46.0, 46.14], [46.0, 55.44], [56.0, 70.01], [72.0, 73.48], [75.0, 76.4], [79.0, 87.3], [90.0, 92.82], [95.0, 99.81]], "keep_status": [false, true, false, false, false, false, false, false, true, false], "silence_prob": [31.19, 37.97, 0.0, 33.15, 33.0, 0.0, 0.0, 31.34, 32.34, 35.34], "audiomae_on_audioset": [[["music", 72.81], ["ding", 2.7], ["synthesizer", 2.46]], [["music", 28.73], ["speech", 7.12], ["didgeridoo", 4.28]], null, [["music", 39.23], ["foghorn", 21.47], ["speech", 13.05]], [["music", 58.72], ["throbbing", 15.73], ["synthesizer", 4.06]], null, null, [["music", 64.57], ["didgeridoo", 6.11], ["synthesizer", 4.43]], [["music", 36.75], ["synthesizer", 7.5], ["hum", 7.26]], [["music", 69.59], ["musical instrument", 4.49], ["synthesizer", 3.54]]], "duration": [14.95, 3.15, 0.14, 9.44, 14.01, 1.48, 1.4, 8.3, 2.82, 4.81]} \ No newline at end of file diff --git a/annotations_filtered/wx-HWqbwssg_filtered.json b/annotations_filtered/wx-HWqbwssg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..efaeedb0ec42b7a3480a591a752c815ec958c332 --- /dev/null +++ b/annotations_filtered/wx-HWqbwssg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.83], [5.0, 6.64], [9.0, 10.59], [11.0, 11.84], [13.0, 14.32], [16.0, 17.22], [20.0, 20.55], [27.0, 31.09], [40.0, 42.47], [46.0, 47.9], [49.0, 50.97], [56.0, 56.42], [60.0, 60.03], [62.0, 62.23], [64.0, 65.65], [68.0, 69.69], [71.0, 71.68], [76.0, 76.42], [77.0, 77.68], [79.0, 80.1], [83.0, 84.72], [85.0, 87.98], [91.0, 91.62], [93.0, 93.95], [97.0, 97.02], [98.0, 99.33], [106.0, 107.1], [108.0, 111.37], [123.0, 126.59], [133.0, 133.34], [134.0, 134.3]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.29, 47.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.25, 0.0, 0.0, 0.0, 0.0, 0.0, 33.65, 33.78, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 27.8], ["speech", 14.58], ["hum", 12.68]], [["hum", 31.8], ["mains hum", 11.63], ["dial tone", 9.8]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 27.9], ["mains hum", 11.18], ["hum", 7.91]], null, null, null, null, null, [["music", 47.0], ["hum", 11.61], ["sine wave", 7.32]], [["speech", 23.01], ["chirp tone", 18.7], ["sine wave", 15.09]], null, null], "duration": [1.83, 1.64, 1.59, 0.84, 1.32, 1.22, 0.55, 4.09, 2.47, 1.9, 1.97, 0.42, 0.03, 0.23, 1.65, 1.69, 0.68, 0.42, 0.68, 1.1, 1.72, 2.98, 0.62, 0.95, 0.02, 1.33, 1.1, 3.37, 3.59, 0.34, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/wxV84RoUr_U_filtered.json b/annotations_filtered/wxV84RoUr_U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23bf4178cc091200984672566f2acd2529bce478 --- /dev/null +++ b/annotations_filtered/wxV84RoUr_U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 8.21], [8.0, 8.24], [8.0, 16.23], [22.0, 22.67], [28.0, 29.12], [29.0, 37.42], [39.0, 39.16], [40.0, 45.45], [47.0, 47.14], [51.0, 51.76], [56.0, 56.62], [59.0, 60.3], [62.0, 63.78], [67.0, 68.05], [74.0, 75.22], [77.0, 77.75], [80.0, 80.37], [83.0, 84.2]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.08, 0.0, 30.02, 0.0, 0.0, 32.83, 0.0, 32.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 55.29], ["hum", 15.34], ["didgeridoo", 7.46]], null, [["music", 53.51], ["didgeridoo", 14.61], ["hum", 8.72]], null, null, [["music", 68.8], ["hum", 8.39], ["throbbing", 7.77]], null, [["music", 38.71], ["throbbing", 14.15], ["speech", 13.07]], null, null, null, null, null, null, null, null, null, null], "duration": [6.21, 0.24, 8.23, 0.67, 1.12, 8.42, 0.16, 5.45, 0.14, 0.76, 0.62, 1.3, 1.78, 1.05, 1.22, 0.75, 0.37, 1.2]} \ No newline at end of file diff --git a/annotations_filtered/wxb_X12HZWQ_filtered.json b/annotations_filtered/wxb_X12HZWQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c42001993950a7de5abd0c5cf7337f4b2e992d1 --- /dev/null +++ b/annotations_filtered/wxb_X12HZWQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.19], [20.0, 20.17], [21.0, 21.41], [26.0, 25.88], [27.0, 27.26], [37.0, 37.37], [45.0, 44.88], [49.0, 49.54], [72.0, 72.98], [99.0, 99.49], [100.0, 100.95], [102.0, 103.28], [104.0, 104.99], [107.0, 109.7], [112.0, 113.91], [125.0, 125.93], [128.0, 128.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.6, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.19, 0.17, 0.41, -0.12, 0.26, 0.37, -0.12, 0.54, 0.98, 0.49, 0.95, 1.28, 0.99, 2.7, 1.91, 0.93, 0.06]} \ No newline at end of file diff --git a/annotations_filtered/wxhUTK7xbz8_filtered.json b/annotations_filtered/wxhUTK7xbz8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1a0037de620226e9a99d7d1bab9d07706049422 --- /dev/null +++ b/annotations_filtered/wxhUTK7xbz8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 23.77], [24.0, 25.14], [26.0, 26.18], [28.0, 29.05], [30.0, 31.41], [32.0, 33.42], [34.0, 35.48], [37.0, 37.79], [42.0, 42.84], [44.0, 44.46], [47.0, 47.76], [49.0, 50.41], [52.0, 54.53], [56.0, 59.41], [61.0, 63.27], [65.0, 66.28], [67.0, 69.08], [70.0, 71.19], [73.0, 74.51], [75.0, 76.99], [77.0, 78.75], [80.0, 82.34], [83.0, 87.13], [89.0, 90.81], [92.0, 92.58], [94.0, 93.82], [97.0, 98.34], [104.0, 108.33], [109.0, 111.05], [112.0, 112.45], [114.0, 114.54], [119.0, 121.09], [124.0, 124.77], [126.0, 127.99], [132.0, 136.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.8, 100.0, 87.37, 0.0, 74.13, 0.0, 0.0, 0.0, 0.0, 99.21, 95.91, 0.0, 0.0, 0.0, 0.0, 96.89, 79.24, 0.0, 0.0, 83.52, 0.0, 0.0, 97.43], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.77, 1.14, 0.18, 1.05, 1.41, 1.42, 1.48, 0.79, 0.84, 0.46, 0.76, 1.41, 2.53, 3.41, 2.27, 1.28, 2.08, 1.19, 1.51, 1.99, 1.75, 2.34, 4.13, 1.81, 0.58, -0.18, 1.34, 4.33, 2.05, 0.45, 0.54, 2.09, 0.77, 1.99, 4.7]} \ No newline at end of file diff --git a/annotations_filtered/wxlD2wwIgVk_filtered.json b/annotations_filtered/wxlD2wwIgVk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/wxlD2wwIgVk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/wxrmK9esHpc_filtered.json b/annotations_filtered/wxrmK9esHpc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..15d8d882aa94bd8636a267e9bc9de15fd8aa4c19 --- /dev/null +++ b/annotations_filtered/wxrmK9esHpc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 59.81], [60.0, 70.56], [81.0, 128.63]], "keep_status": [false, true, false], "silence_prob": [0.0, 32.77, 0.0], "audiomae_on_audioset": [null, [["boing", 26.61], ["music", 22.29], ["speech", 18.72]], null], "duration": [30.81, 10.56, 47.63]} \ No newline at end of file diff --git a/annotations_filtered/wy1eWsC2sL8_filtered.json b/annotations_filtered/wy1eWsC2sL8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73109e5ada4553da2fa0cd5c7e3c60d58b83903d --- /dev/null +++ b/annotations_filtered/wy1eWsC2sL8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.14], [9.0, 9.26], [11.0, 11.38], [16.0, 19.35], [20.0, 33.47], [37.0, 38.89], [40.0, 54.14], [54.0, 64.67], [66.0, 113.88], [117.0, 131.45], [134.0, 141.78], [143.0, 144.78]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 65.91, 47.39, 0.0, 50.51, 46.43, 0.0, 48.95, 37.08, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 51.38], ["mains hum", 10.09], ["speech", 8.38]], null, null, [["hum", 42.92], ["mains hum", 41.64], ["telephone bell ringing", 3.79]], null, [["music", 78.66], ["synthesizer", 2.88], ["telephone bell ringing", 2.73]], [["music", 31.71], ["telephone bell ringing", 25.76], ["thunk", 8.78]], null], "duration": [0.14, 0.26, 0.38, 3.35, 13.47, 1.89, 14.14, 10.67, 47.88, 14.45, 7.78, 1.78]} \ No newline at end of file diff --git a/annotations_filtered/wyHOKleZzFM_filtered.json b/annotations_filtered/wyHOKleZzFM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28ffa8d45f08a613b5beef5b353011f3342254c2 --- /dev/null +++ b/annotations_filtered/wyHOKleZzFM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 12.75], [13.0, 33.49], [34.0, 34.3], [34.0, 44.86], [47.0, 48.83], [54.0, 56.19], [57.0, 56.74], [57.0, 56.86], [57.0, 56.89], [57.0, 58.95], [62.0, 67.46], [68.0, 73.79], [75.0, 75.46], [76.0, 76.94], [78.0, 89.68], [108.0, 114.83], [118.0, 119.28], [120.0, 129.46], [130.0, 133.14]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, false, true, true, false, true, false], "silence_prob": [0.0, 42.98, 0.0, 45.36, 0.0, 39.3, 0.0, 0.0, 0.0, 0.0, 42.08, 29.42, 0.0, 0.0, 33.24, 36.52, 0.0, 28.63, 28.76], "audiomae_on_audioset": [null, [["sidetone", 53.03], ["speech", 25.88], ["noise", 5.88]], null, [["speech", 45.22], ["rumble", 4.9], ["whale vocalization", 4.03]], null, [["speech", 34.12], ["cattle, bovinae", 10.63], ["moo", 6.33]], null, null, null, null, [["throbbing", 31.64], ["speech", 26.77], ["hum", 18.5]], [["speech", 45.2], ["explosion", 17.27], ["vehicle", 7.94]], null, null, [["speech", 44.55], ["sidetone", 7.51], ["fly, housefly", 5.25]], [["speech", 40.57], ["fart", 13.61], ["animal", 6.8]], null, [["speech", 17.79], ["outside, rural or natural", 11.66], ["groan", 7.27]], [["whale vocalization", 93.8], ["cattle, bovinae", 1.55], ["livestock, farm animals, working animals", 0.73]]], "duration": [-0.25, 20.49, 0.3, 10.86, 1.83, 2.19, -0.26, -0.14, -0.11, 1.95, 5.46, 5.79, 0.46, 0.94, 11.68, 6.83, 1.28, 9.46, 3.14]} \ No newline at end of file diff --git a/annotations_filtered/wyKfuDzbbOI_filtered.json b/annotations_filtered/wyKfuDzbbOI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..783a77d85715c72b7dfe6ecda0ae1248757be1f6 --- /dev/null +++ b/annotations_filtered/wyKfuDzbbOI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.51], [5.0, 7.3], [9.0, 10.5], [13.0, 13.41], [23.0, 23.82], [29.0, 28.78], [33.0, 34.75], [37.0, 37.94], [40.0, 40.95], [45.0, 46.52], [53.0, 77.67], [97.0, 101.12], [117.0, 117.05], [120.0, 120.88]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 31.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.09, 29.71, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 31.58], ["synthesizer", 10.64], ["electronic music", 8.35]], null, null, null, null, null, null, null, null, [["music", 77.97], ["musical instrument", 4.85], ["effects unit", 3.59]], [["music", 26.0], ["didgeridoo", 10.71], ["cattle, bovinae", 10.45]], null, null], "duration": [0.51, 2.3, 1.5, 0.41, 0.82, -0.22, 1.75, 0.94, 0.95, 1.52, 24.67, 4.12, 0.05, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/wyMDViXXXXU_filtered.json b/annotations_filtered/wyMDViXXXXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ecaef0c24f3351042e139374afbc6e106c78bf83 --- /dev/null +++ b/annotations_filtered/wyMDViXXXXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.99], [1.0, 1.02], [2.0, 1.66], [2.0, 1.7], [2.0, 1.8], [2.0, 1.86], [2.0, 2.0], [2.0, 2.07], [2.0, 2.1], [2.0, 2.13], [2.0, 2.17], [2.0, 2.2], [2.0, 2.24], [2.0, 2.27], [3.0, 7.1], [13.0, 15.79], [19.0, 144.63], [146.0, 146.28], [147.0, 148.19], [150.0, 152.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.02, 41.01, 0.0, 0.0, 0.0, 52.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 44.58], ["music", 17.73], ["whack, thwack", 8.22]], [["hum", 37.72], ["throbbing", 21.97], ["mains hum", 14.0]], null, null, null, null], "duration": [0.99, 0.02, -0.34, -0.3, -0.2, -0.14, 0.0, 0.07, 0.1, 0.13, 0.17, 0.2, 0.24, 0.27, 4.1, 2.79, 125.63, 0.28, 1.19, 2.64]} \ No newline at end of file diff --git a/annotations_filtered/wyQmO-LFF4M_filtered.json b/annotations_filtered/wyQmO-LFF4M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ca157425898c347b1b5cae4f33eec8b47d2c24f --- /dev/null +++ b/annotations_filtered/wyQmO-LFF4M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.86], [6.0, 7.57], [9.0, 10.25], [13.0, 14.03], [15.0, 24.56], [28.0, 29.37], [31.0, 33.49], [35.0, 36.76], [37.0, 38.28], [41.0, 47.36], [48.0, 50.9], [51.0, 54.04], [55.0, 58.51], [60.0, 68.82], [69.0, 71.34], [72.0, 75.76], [78.0, 81.09], [82.0, 83.93], [85.0, 86.43], [89.0, 92.97], [96.0, 121.76], [122.0, 128.48], [132.0, 156.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 97.11, 0.0, 100.0, 0.0, 0.0, 98.66, 100.0, 71.43, 100.0, 99.98, 99.21, 100.0, 99.93, 0.0, 0.0, 52.33, 100.0, 86.27, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.86, 1.57, 1.25, 1.03, 9.56, 1.37, 2.49, 1.76, 1.28, 6.36, 2.9, 3.04, 3.51, 8.82, 2.34, 3.76, 3.09, 1.93, 1.43, 3.97, 25.76, 6.48, 24.78]} \ No newline at end of file diff --git a/annotations_filtered/wyRq2S8BTVM_filtered.json b/annotations_filtered/wyRq2S8BTVM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e12f692e010e6bf36e1b1bd521e5a741cff2ef6 --- /dev/null +++ b/annotations_filtered/wyRq2S8BTVM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 15.15], [16.0, 16.7], [17.0, 17.37], [18.0, 19.01], [23.0, 28.26], [30.0, 30.15], [30.0, 33.59], [34.0, 49.81]], "keep_status": [false, false, false, false, true, false, false, false], "silence_prob": [88.1, 0.0, 0.0, 0.0, 43.3, 0.0, 91.3, 67.38], "audiomae_on_audioset": [null, null, null, null, [["noise", 21.38], ["hum", 11.81], ["sidetone", 10.62]], null, null, null], "duration": [6.15, 0.7, 0.37, 1.01, 5.26, 0.15, 3.59, 15.81]} \ No newline at end of file diff --git a/annotations_filtered/wySz6ysIDhs_filtered.json b/annotations_filtered/wySz6ysIDhs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..524401c4a0c00238a0b5f3469d05e45352202cc1 --- /dev/null +++ b/annotations_filtered/wySz6ysIDhs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.0], [4.0, 4.75], [6.0, 6.72], [8.0, 9.31], [13.0, 13.54], [14.0, 14.47], [16.0, 15.84], [17.0, 17.41], [19.0, 19.06], [20.0, 20.76], [21.0, 21.56], [23.0, 23.85], [26.0, 26.01], [26.0, 26.69], [30.0, 30.74], [37.0, 37.05], [42.0, 42.3], [45.0, 44.73], [47.0, 47.6], [49.0, 50.13], [52.0, 52.34], [54.0, 54.35], [55.0, 55.7], [57.0, 63.59], [65.0, 66.39], [67.0, 73.74], [74.0, 74.83], [76.0, 76.59], [78.0, 78.6], [79.0, 81.33], [82.0, 82.49], [84.0, 84.32], [85.0, 88.53], [89.0, 89.72], [90.0, 90.9], [92.0, 92.33], [95.0, 95.28], [96.0, 97.8], [98.0, 98.78], [101.0, 101.34], [102.0, 101.85], [102.0, 103.22], [105.0, 106.1], [108.0, 108.23], [109.0, 110.0], [112.0, 112.7], [113.0, 113.98], [115.0, 115.11], [118.0, 118.67], [120.0, 120.45], [121.0, 122.32], [123.0, 124.07], [126.0, 126.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0, 37.0, 0.0, 0.0, 0.0, 65.44, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 71.64], ["music", 4.14], ["thunk", 3.51]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.0, 0.75, 0.72, 1.31, 0.54, 0.47, -0.16, 0.41, 0.06, 0.76, 0.56, 0.85, 0.01, 0.69, 0.74, 0.05, 0.3, -0.27, 0.6, 1.13, 0.34, 0.35, 0.7, 6.59, 1.39, 6.74, 0.83, 0.59, 0.6, 2.33, 0.49, 0.32, 3.53, 0.72, 0.9, 0.33, 0.28, 1.8, 0.78, 0.34, -0.15, 1.22, 1.1, 0.23, 1.0, 0.7, 0.98, 0.11, 0.67, 0.45, 1.32, 1.07, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/wyifbBO6sAY_filtered.json b/annotations_filtered/wyifbBO6sAY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21088980a63ad2831985483d9aa25204be3da01d --- /dev/null +++ b/annotations_filtered/wyifbBO6sAY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.37], [11.0, 12.29], [17.0, 35.78], [38.0, 67.44], [69.0, 68.94], [69.0, 72.4], [80.0, 91.64], [94.0, 96.9], [97.0, 107.4], [109.0, 117.68], [119.0, 125.54], [131.0, 131.62], [136.0, 136.61], [140.0, 140.85], [142.0, 149.39], [151.0, 152.9], [155.0, 156.17], [157.0, 157.35], [158.0, 164.03], [168.0, 169.74], [170.0, 176.64]], "keep_status": [false, false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [85.9, 0.0, 74.6, 36.84, 0.0, 34.04, 37.58, 37.69, 40.47, 33.55, 34.29, 0.0, 0.0, 0.0, 53.97, 0.0, 0.0, 0.0, 71.72, 0.0, 50.97], "audiomae_on_audioset": [null, null, null, [["music", 47.2], ["musical instrument", 11.42], ["guitar", 6.4]], null, [["aircraft", 7.86], ["hum", 7.76], ["mains hum", 6.58]], [["speech", 40.26], ["music", 19.12], ["hum", 8.41]], [["music", 70.22], ["ambient music", 6.89], ["throbbing", 2.83]], [["speech", 42.11], ["music", 17.51], ["hum", 10.64]], [["speech", 46.06], ["music", 19.56], ["musical instrument", 5.5]], [["music", 57.57], ["speech", 21.42], ["hum", 6.18]], null, null, null, null, null, null, null, null, null, null], "duration": [2.37, 1.29, 18.78, 29.44, -0.06, 3.4, 11.64, 2.9, 10.4, 8.68, 6.54, 0.62, 0.61, 0.85, 7.39, 1.9, 1.17, 0.35, 6.03, 1.74, 6.64]} \ No newline at end of file diff --git a/annotations_filtered/wytpJXfw86w_filtered.json b/annotations_filtered/wytpJXfw86w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..acc13140513018046d1dace69e81e8276462ff06 --- /dev/null +++ b/annotations_filtered/wytpJXfw86w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.29], [8.0, 20.02], [24.0, 58.73], [66.0, 65.94], [67.0, 83.13], [84.0, 105.49], [107.0, 118.89], [119.0, 120.33], [121.0, 125.0], [125.0, 145.44], [147.0, 150.47], [152.0, 162.85], [163.0, 165.23], [167.0, 168.89], [169.0, 175.15]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 29.37, 0.0, 0.0, 46.05, 65.79, 59.42, 0.0, 47.86, 60.79, 73.21, 64.75, 50.21, 0.0, 44.49], "audiomae_on_audioset": [null, [["music", 49.58], ["thump, thud", 5.84], ["hum", 5.38]], null, null, [["hum", 37.45], ["mains hum", 22.54], ["throbbing", 11.75]], null, null, null, [["music", 27.8], ["speech", 17.55], ["hum", 7.3]], null, null, null, null, null, [["music", 20.21], ["speech", 12.52], ["cattle, bovinae", 8.45]]], "duration": [0.29, 12.02, 34.73, -0.06, 16.13, 21.49, 11.89, 1.33, 4.0, 20.44, 3.47, 10.85, 2.23, 1.89, 6.15]} \ No newline at end of file diff --git a/annotations_filtered/wytwlFfk5dY_filtered.json b/annotations_filtered/wytwlFfk5dY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65df449e9cfd7a53330f500fedfdb56777c70282 --- /dev/null +++ b/annotations_filtered/wytwlFfk5dY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.75], [5.0, 7.06], [9.0, 9.98], [10.0, 11.96], [14.0, 15.58], [16.0, 16.95], [18.0, 19.13], [21.0, 21.34], [23.0, 24.93], [26.0, 27.41], [30.0, 30.82], [32.0, 33.22], [40.0, 42.38], [44.0, 45.1], [49.0, 49.2], [53.0, 54.65], [55.0, 57.18], [58.0, 60.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 81.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.22, 0.0, 0.0, 0.0, 34.82, 77.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 24.15], ["music", 21.05], ["singing bowl", 10.72]], null, null, null, [["music", 51.56], ["speech", 17.97], ["musical instrument", 4.5]], null], "duration": [0.75, 2.06, 0.98, 1.96, 1.58, 0.95, 1.13, 0.34, 1.93, 1.41, 0.82, 1.22, 2.38, 1.1, 0.2, 1.65, 2.18, 2.64]} \ No newline at end of file diff --git a/annotations_filtered/wyuPoWs79fo_filtered.json b/annotations_filtered/wyuPoWs79fo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4db63291aa8abaf8336cf977d919cc1483de6d71 --- /dev/null +++ b/annotations_filtered/wyuPoWs79fo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.13], [10.0, 13.05], [15.0, 16.53], [17.0, 103.76], [106.0, 109.98], [112.0, 114.22], [115.0, 116.97], [118.0, 119.48], [120.0, 128.02], [129.0, 140.91]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [92.48, 52.62, 0.0, 0.0, 81.17, 89.54, 0.0, 0.0, 83.7, 40.4], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["sonar", 21.11], ["hum", 15.91], ["music", 13.79]]], "duration": [5.13, 3.05, 1.53, 86.76, 3.98, 2.22, 1.97, 1.48, 8.02, 11.91]} \ No newline at end of file diff --git a/annotations_filtered/wz29yiGSrB0_filtered.json b/annotations_filtered/wz29yiGSrB0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e91b5ace111ce7a3c4a4201292a07fc027f06a1b --- /dev/null +++ b/annotations_filtered/wz29yiGSrB0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.77], [16.0, 29.51], [30.0, 33.88]], "keep_status": [false, false, true], "silence_prob": [0.0, 43.69, 36.37], "audiomae_on_audioset": [null, [["music", 53.16], ["theremin", 15.33], ["effects unit", 6.32]], [["music", 26.1], ["siren", 20.04], ["theremin", 8.11]]], "duration": [0.77, 13.51, 3.88]} \ No newline at end of file diff --git a/annotations_filtered/wz4HLeURVOQ_filtered.json b/annotations_filtered/wz4HLeURVOQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db8352aac5a96700900e710c88cbe1e78fb28a01 --- /dev/null +++ b/annotations_filtered/wz4HLeURVOQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 15.36], [38.0, 46.95], [52.0, 64.07], [70.0, 70.53], [71.0, 71.41], [77.0, 77.41], [78.0, 78.81], [81.0, 81.99], [84.0, 84.18], [84.0, 85.33], [86.0, 86.34], [87.0, 89.97], [92.0, 106.0], [114.0, 115.38], [119.0, 119.43]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.58, 40.5, 37.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.25, 37.88, 0.0, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 44.17], ["moo", 23.42], ["livestock, farm animals, working animals", 22.83]], [["music", 37.19], ["theremin", 19.05], ["hum", 11.02]], [["music", 67.7], ["synthesizer", 6.17], ["musical instrument", 3.98]], null, null, null, null, null, null, null, null, null, [["music", 38.24], ["fart", 31.34], ["speech", 13.34]], null, null], "duration": [7.36, 8.95, 12.07, 0.53, 0.41, 0.41, 0.81, 0.99, 0.18, 1.33, 0.34, 2.97, 14.0, 1.38, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/wzIwPkZkSTk_filtered.json b/annotations_filtered/wzIwPkZkSTk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64f7b1cc505d3a538445a14164ba8ae24ddf63e8 --- /dev/null +++ b/annotations_filtered/wzIwPkZkSTk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.99], [9.0, 20.92], [22.0, 23.68], [26.0, 30.18], [33.0, 35.38], [40.0, 40.85], [43.0, 45.0], [48.0, 49.84], [52.0, 54.62], [56.0, 57.84], [59.0, 63.05]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [36.92, 65.91, 0.0, 72.46, 43.35, 0.0, 86.64, 0.0, 85.54, 0.0, 84.43], "audiomae_on_audioset": [[["whale vocalization", 68.47], ["speech", 19.07], ["hum", 4.19]], null, null, null, [["cattle, bovinae", 12.84], ["moo", 12.33], ["frog", 9.15]], null, null, null, null, null, null], "duration": [4.99, 11.92, 1.68, 4.18, 2.38, 0.85, 2.0, 1.84, 2.62, 1.84, 4.05]} \ No newline at end of file diff --git a/annotations_filtered/wzJObNk-flo_filtered.json b/annotations_filtered/wzJObNk-flo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae5e4dda666ae6848d6d07f0a2698f65bfffe412 --- /dev/null +++ b/annotations_filtered/wzJObNk-flo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 59.81], [61.0, 71.96]], "keep_status": [false, false], "silence_prob": [0.0, 29.47], "audiomae_on_audioset": [null, [["music", 71.94], ["quack", 3.7], ["reggae", 3.07]]], "duration": [43.81, 10.96]} \ No newline at end of file diff --git a/annotations_filtered/wzSYH0nT6Qk_filtered.json b/annotations_filtered/wzSYH0nT6Qk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0dc40143158192342462edec5c28f77bd18c136d --- /dev/null +++ b/annotations_filtered/wzSYH0nT6Qk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 55.36], [56.0, 56.67], [57.0, 68.22], [83.0, 90.71], [92.0, 94.12], [100.0, 100.2], [102.0, 102.52]], "keep_status": [false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 31.56, 35.33, 48.87, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["sidetone", 89.11], ["music", 3.96], ["speech", 3.29]], [["speech", 37.32], ["didgeridoo", 8.19], ["cattle, bovinae", 6.14]], [["speech", 27.81], ["didgeridoo", 12.52], ["music", 6.86]], null, null], "duration": [52.36, 0.67, 11.22, 7.71, 2.12, 0.2, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/wzYht_EEf0U_filtered.json b/annotations_filtered/wzYht_EEf0U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13ab4443386c96f761082d197bab1b268c41f83b --- /dev/null +++ b/annotations_filtered/wzYht_EEf0U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[98.0, 98.91], [100.0, 99.82], [101.0, 104.53], [107.0, 112.45]], "keep_status": [false, false, false, true], "silence_prob": [0.0, 0.0, 33.63, 32.28], "audiomae_on_audioset": [null, null, [["music", 54.15], ["didgeridoo", 20.18], ["speech", 4.82]], [["music", 56.44], ["musical instrument", 7.44], ["synthesizer", 5.18]]], "duration": [0.91, -0.18, 3.53, 5.45]} \ No newline at end of file diff --git a/annotations_filtered/wzZ3S0ZC1Is_filtered.json b/annotations_filtered/wzZ3S0ZC1Is_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78ca59ae3ab8cdaa4fdb75593ad561360dc221b3 --- /dev/null +++ b/annotations_filtered/wzZ3S0ZC1Is_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.13], [3.0, 11.42], [12.0, 12.83], [14.0, 17.34], [20.0, 20.93], [29.0, 34.48], [36.0, 37.44], [39.0, 44.42], [46.0, 47.21], [48.0, 49.49], [50.0, 51.0], [51.0, 51.65], [52.0, 53.42], [56.0, 60.0], [64.0, 64.32], [64.0, 64.35], [67.0, 76.42], [83.0, 88.5], [91.0, 94.42], [100.0, 100.48], [101.0, 101.17], [103.0, 109.41], [110.0, 110.67], [113.0, 113.85], [116.0, 121.66], [122.0, 122.98], [124.0, 124.21], [125.0, 125.2], [127.0, 131.57], [133.0, 138.38], [140.0, 144.83], [153.0, 154.28], [157.0, 156.91], [158.0, 159.81], [161.0, 161.45]], "keep_status": [false, false, false, true, false, true, false, true, false, false, false, false, false, true, false, false, false, true, true, false, false, true, false, false, true, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 33.17, 0.0, 34.67, 0.0, 33.67, 0.0, 32.62, 0.0, 0.0, 0.0, 0.0, 0.0, 34.51, 0.0, 0.0, 32.63, 32.41, 32.79, 0.0, 0.0, 32.84, 0.0, 0.0, 32.98, 0.0, 0.0, 0.0, 31.76, 32.45, 33.21, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 55.31], ["musical instrument", 13.76], ["theremin", 3.01]], null, [["music", 29.17], ["trombone", 19.81], ["brass instrument", 16.52]], null, [["music", 43.74], ["musical instrument", 8.97], ["echo", 5.53]], null, [["music", 48.8], ["didgeridoo", 5.26], ["musical instrument", 4.69]], null, null, null, null, null, [["speech", 31.4], ["music", 23.18], ["trombone", 7.96]], null, null, [["music", 64.78], ["musical instrument", 6.2], ["trombone", 4.66]], [["music", 21.83], ["didgeridoo", 12.95], ["theremin", 11.51]], [["music", 44.22], ["musical instrument", 7.35], ["saxophone", 6.36]], null, null, [["music", 43.77], ["brass instrument", 15.83], ["musical instrument", 9.88]], null, null, [["music", 39.88], ["brass instrument", 9.77], ["trombone", 8.56]], null, null, null, [["music", 66.16], ["musical instrument", 6.85], ["brass instrument", 3.07]], [["music", 31.21], ["brass instrument", 14.45], ["trombone", 11.84]], [["music", 36.49], ["brass instrument", 18.68], ["musical instrument", 13.08]], null, null, null, null], "duration": [1.13, 8.42, 0.83, 3.34, 0.93, 5.48, 1.44, 5.42, 1.21, 1.49, 1.0, 0.65, 1.42, 4.0, 0.32, 0.35, 9.42, 5.5, 3.42, 0.48, 0.17, 6.41, 0.67, 0.85, 5.66, 0.98, 0.21, 0.2, 4.57, 5.38, 4.83, 1.28, -0.09, 1.81, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/wz_y0fibuQE_filtered.json b/annotations_filtered/wz_y0fibuQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8bf36662ab1c03f96938bcf66c4713a45ef92533 --- /dev/null +++ b/annotations_filtered/wz_y0fibuQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.37], [13.0, 62.28], [63.0, 64.25], [65.0, 66.73], [69.0, 74.11], [77.0, 77.45], [84.0, 86.81]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 50.41, 0.0, 99.44], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.37, 49.28, 1.25, 1.73, 5.11, 0.45, 2.81]} \ No newline at end of file