diff --git a/annotations_filtered/e-5SVm2NUe8_filtered.json b/annotations_filtered/e-5SVm2NUe8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8992e4046421d2acb624d0a3d9fbdfb7a2a9c42e --- /dev/null +++ b/annotations_filtered/e-5SVm2NUe8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.34], [14.0, 16.06], [19.0, 19.68], [31.0, 32.22], [37.0, 37.44], [39.0, 39.55], [42.0, 46.14], [48.0, 49.1], [54.0, 54.75], [71.0, 72.67], [75.0, 75.47], [76.0, 78.31], [82.0, 94.93], [96.0, 96.96], [98.0, 98.79], [100.0, 100.65], [103.0, 103.91], [110.0, 110.98], [112.0, 112.56], [117.0, 117.95], [120.0, 119.84], [122.0, 123.06], [124.0, 124.83]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 45.27, 0.0, 0.0, 0.0, 0.0, 85.9, 0.0, 0.0, 0.0, 0.0, 36.18, 54.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["sidetone", 40.92], ["speech", 15.39], ["radio", 6.02]], null, null, null, null, null, null, null, null, null, [["speech", 57.64], ["sidetone", 8.31], ["radio", 4.27]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.34, 2.06, 0.68, 1.22, 0.44, 0.55, 4.14, 1.1, 0.75, 1.67, 0.47, 2.31, 12.93, 0.96, 0.79, 0.65, 0.91, 0.98, 0.56, 0.95, -0.16, 1.06, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/e-6fZ7wiPQk_filtered.json b/annotations_filtered/e-6fZ7wiPQk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..68219c682b276fd00f5ac072eca19a8dc329b6ee --- /dev/null +++ b/annotations_filtered/e-6fZ7wiPQk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 38.55], [41.0, 99.42], [100.0, 103.05], [104.0, 108.03], [109.0, 110.69], [112.0, 115.11], [118.0, 129.64], [131.0, 138.43]], "keep_status": [false, false, false, false, false, false, false, true], "silence_prob": [34.46, 0.0, 96.29, 98.8, 0.0, 87.55, 32.29, 32.31], "audiomae_on_audioset": [[["hum", 47.98], ["mains hum", 22.12], ["music", 14.06]], null, null, null, null, null, [["hum", 38.82], ["mains hum", 34.86], ["throbbing", 8.39]], [["noise", 14.56], ["speech", 9.28], ["hum", 6.82]]], "duration": [7.55, 58.42, 3.05, 4.03, 1.69, 3.11, 11.64, 7.43]} \ No newline at end of file diff --git a/annotations_filtered/e-NMI6o5ynk_filtered.json b/annotations_filtered/e-NMI6o5ynk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2bb5390e82e0d15dd6ba2d9fcbc565ce242aad8 --- /dev/null +++ b/annotations_filtered/e-NMI6o5ynk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.82], [12.0, 13.2], [14.0, 15.67], [16.0, 27.33], [31.0, 32.07], [33.0, 51.56]], "keep_status": [false, false, false, false, false, false], "silence_prob": [35.1, 0.0, 0.0, 33.47, 0.0, 32.65], "audiomae_on_audioset": [[["music", 80.14], ["synthesizer", 1.36], ["sampler", 1.24]], null, null, [["music", 79.07], ["throbbing", 1.48], ["sampler", 1.31]], null, [["music", 71.27], ["singing", 3.02], ["didgeridoo", 2.96]]], "duration": [2.82, 1.2, 1.67, 11.33, 1.07, 18.56]} \ No newline at end of file diff --git a/annotations_filtered/e-oTHFL5_ec_filtered.json b/annotations_filtered/e-oTHFL5_ec_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e471e7626000d896d2ab6b83479bc8adfa04fdcb --- /dev/null +++ b/annotations_filtered/e-oTHFL5_ec_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.59], [12.0, 12.97], [15.0, 15.36], [17.0, 17.34], [19.0, 19.26], [27.0, 27.6], [35.0, 35.95], [37.0, 37.91], [39.0, 39.45], [41.0, 42.47], [46.0, 46.36], [50.0, 50.6], [72.0, 73.77], [74.0, 77.52], [78.0, 78.31], [82.0, 85.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 33.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 41.31], ["moo", 26.89], ["cattle, bovinae", 16.38]]], "duration": [0.59, 0.97, 0.36, 0.34, 0.26, 0.6, 0.95, 0.91, 0.45, 1.47, 0.36, 0.6, 1.77, 3.52, 0.31, 3.21]} \ No newline at end of file diff --git a/annotations_filtered/e0HzBST_794_filtered.json b/annotations_filtered/e0HzBST_794_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..779a2e2191018a8b0206d12dd87a89ceb49791c1 --- /dev/null +++ b/annotations_filtered/e0HzBST_794_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.86], [6.0, 15.9], [18.0, 19.84], [27.0, 34.37], [35.0, 49.94], [66.0, 66.11], [68.0, 69.35], [90.0, 90.17], [94.0, 99.76], [105.0, 112.06], [124.0, 157.06], [157.0, 157.1], [157.0, 157.13], [157.0, 157.17]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 31.34, 0.0, 30.99, 32.63, 0.0, 0.0, 0.0, 35.36, 32.15, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 46.24], ["cattle, bovinae", 21.08], ["moo", 11.12]], null, [["moo", 35.5], ["cattle, bovinae", 33.52], ["livestock, farm animals, working animals", 25.6]], [["animal", 63.47], ["grunt", 17.72], ["livestock, farm animals, working animals", 3.93]], null, null, null, [["music", 22.85], ["whack, thwack", 14.08], ["speech", 13.15]], [["boing", 24.17], ["speech", 15.59], ["music", 14.44]], null, null, null, null], "duration": [-0.14, 9.9, 1.84, 7.37, 14.94, 0.11, 1.35, 0.17, 5.76, 7.06, 33.06, 0.1, 0.13, 0.17]} \ No newline at end of file diff --git a/annotations_filtered/e0UZ0rc0KH4_filtered.json b/annotations_filtered/e0UZ0rc0KH4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3b51e72f765c63077da9ce45390b815fc3b5662 --- /dev/null +++ b/annotations_filtered/e0UZ0rc0KH4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.88], [10.0, 10.5], [11.0, 11.67], [13.0, 13.1], [13.0, 14.88], [16.0, 23.33], [24.0, 34.57], [37.0, 36.98], [37.0, 37.66], [44.0, 50.04], [52.0, 51.83], [52.0, 56.54], [57.0, 59.61], [61.0, 61.75], [63.0, 63.42], [64.0, 65.31], [66.0, 75.52], [78.0, 80.69], [82.0, 82.73], [86.0, 86.12], [87.0, 87.02], [90.0, 92.18], [93.0, 98.05], [99.0, 99.44], [100.0, 100.84], [104.0, 105.29], [106.0, 115.64], [119.0, 119.65], [120.0, 125.27], [126.0, 130.0], [131.0, 133.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 52.56, 57.32, 0.0, 0.0, 58.89, 0.0, 52.45, 60.14, 0.0, 0.0, 0.0, 46.43, 58.89, 0.0, 0.0, 0.0, 77.7, 64.07, 0.0, 0.0, 0.0, 78.89, 0.0, 71.43, 69.2, 63.42], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.08], ["hum", 20.56], ["throbbing", 8.19]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.88, 0.5, 0.67, 0.1, 1.88, 7.33, 10.57, -0.02, 0.66, 6.04, -0.17, 4.54, 2.61, 0.75, 0.42, 1.31, 9.52, 2.69, 0.73, 0.12, 0.02, 2.18, 5.05, 0.44, 0.84, 1.29, 9.64, 0.65, 5.27, 4.0, 2.02]} \ No newline at end of file diff --git a/annotations_filtered/e0cR6R3SccI_filtered.json b/annotations_filtered/e0cR6R3SccI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc4fcad7ab4cff6274d87b136a1470a1ad0deae --- /dev/null +++ b/annotations_filtered/e0cR6R3SccI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 28.07], [31.0, 50.21]], "keep_status": [false, false], "silence_prob": [0.0, 66.15], "audiomae_on_audioset": [null, null], "duration": [1.07, 19.21]} \ No newline at end of file diff --git a/annotations_filtered/e0d5svC0xQU_filtered.json b/annotations_filtered/e0d5svC0xQU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6aa197f253ae53efcab764032fad7360c65c7896 --- /dev/null +++ b/annotations_filtered/e0d5svC0xQU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.44], [20.0, 20.78], [21.0, 23.23], [26.0, 30.45], [31.0, 31.41], [34.0, 34.05], [44.0, 48.0], [48.0, 48.61], [52.0, 53.92], [55.0, 56.86], [59.0, 58.89], [61.0, 61.74], [64.0, 64.18], [66.0, 67.15]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.77, 0.0, 59.15, 52.39, 0.0, 0.0, 64.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 38.53], ["throbbing", 10.18], ["hum", 8.84]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.44, 0.78, 2.23, 4.45, 0.41, 0.05, 4.0, 0.61, 1.92, 1.86, -0.11, 0.74, 0.18, 1.15]} \ No newline at end of file diff --git a/annotations_filtered/e0fFbNV1ySY_filtered.json b/annotations_filtered/e0fFbNV1ySY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..15bc2ca4077a26c29fbc34a24803da5a9dbaceac --- /dev/null +++ b/annotations_filtered/e0fFbNV1ySY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 18.67], [19.0, 20.76], [25.0, 25.88], [27.0, 28.38], [29.0, 43.44], [45.0, 45.49], [49.0, 50.53], [52.0, 53.28], [54.0, 54.82], [58.0, 58.4], [60.0, 70.92], [72.0, 75.15], [76.0, 77.95], [80.0, 92.99], [93.0, 96.69]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [60.98, 0.0, 0.0, 0.0, 30.33, 0.0, 0.0, 0.0, 0.0, 0.0, 55.74, 71.43, 0.0, 69.07, 80.64], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 48.61], ["gong", 9.73], ["music", 9.58]], null, null, null, null, null, null, null, null, null, null], "duration": [11.67, 1.76, 0.88, 1.38, 14.44, 0.49, 1.53, 1.28, 0.82, 0.4, 10.92, 3.15, 1.95, 12.99, 3.69]} \ No newline at end of file diff --git a/annotations_filtered/e0qpJCNLViQ_filtered.json b/annotations_filtered/e0qpJCNLViQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5edcf903ac93a46200f9fa4449fde9bd810220c --- /dev/null +++ b/annotations_filtered/e0qpJCNLViQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.86], [8.0, 8.24], [30.0, 30.42], [31.0, 33.52], [36.0, 37.34], [41.0, 42.11], [45.0, 53.86], [61.0, 70.02], [70.0, 71.69], [74.0, 74.7], [76.0, 78.09], [79.0, 80.15], [82.0, 84.5], [85.0, 86.41], [90.0, 90.71], [91.0, 101.02], [101.0, 102.54], [105.0, 106.51], [108.0, 108.48], [109.0, 110.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 96.54, 0.0, 0.0, 41.12, 41.54, 0.0, 0.0, 100.0, 0.0, 99.96, 0.0, 0.0, 84.07, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 38.23], ["speech", 28.7], ["hip hop music", 5.37]], [["sidetone", 47.08], ["music", 30.24], ["speech", 6.44]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.86, 0.24, 0.42, 2.52, 1.34, 1.11, 8.86, 9.02, 1.69, 0.7, 2.09, 1.15, 2.5, 1.41, 0.71, 10.02, 1.54, 1.51, 0.48, 1.59]} \ No newline at end of file diff --git a/annotations_filtered/e198XToyAkk_filtered.json b/annotations_filtered/e198XToyAkk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f3f3a094afcbbba59d2555e3da78de62b17ab4f --- /dev/null +++ b/annotations_filtered/e198XToyAkk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.1], [35.0, 35.58], [41.0, 41.47], [49.0, 49.72], [52.0, 51.75], [64.0, 65.48], [67.0, 66.93], [68.0, 74.49], [76.0, 75.96], [78.0, 77.95], [95.0, 97.78], [103.0, 103.84], [115.0, 115.52], [136.0, 136.81], [138.0, 138.43], [146.0, 148.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.07, 0.0, 0.0, 35.91, 0.0, 0.0, 0.0, 0.0, 35.71], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 72.9], ["speech", 11.73], ["wail, moan", 3.73]], null, null, [["music", 77.4], ["musical instrument", 5.51], ["synthesizer", 3.79]], null, null, null, null, [["boing", 36.42], ["speech", 18.1], ["ding", 6.88]]], "duration": [0.1, 0.58, 0.47, 0.72, -0.25, 1.48, -0.07, 6.49, -0.04, -0.05, 2.78, 0.84, 0.52, 0.81, 0.43, 2.22]} \ No newline at end of file diff --git a/annotations_filtered/e1DnltskkWk_filtered.json b/annotations_filtered/e1DnltskkWk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d68ac68dc8ce5a42dd9e333ec984f964f4777891 --- /dev/null +++ b/annotations_filtered/e1DnltskkWk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.67], [45.0, 46.68], [57.0, 58.06], [59.0, 59.64], [62.0, 62.36], [63.0, 63.34], [66.0, 66.55], [68.0, 68.93], [74.0, 75.12], [78.0, 79.96], [86.0, 86.66], [87.0, 87.24], [88.0, 89.06], [96.0, 97.31], [99.0, 99.84], [104.0, 105.33], [106.0, 106.66], [108.0, 109.56], [113.0, 114.2], [117.0, 117.27], [127.0, 127.13], [128.0, 130.45], [131.0, 130.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.67, 1.68, 1.06, 0.64, 0.36, 0.34, 0.55, 0.93, 1.12, 1.96, 0.66, 0.24, 1.06, 1.31, 0.84, 1.33, 0.66, 1.56, 1.2, 0.27, 0.13, 2.45, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/e1FWoMLjAU0_filtered.json b/annotations_filtered/e1FWoMLjAU0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..536c72b9ab7c550cdaf7649ed71db5e75e50b3dc --- /dev/null +++ b/annotations_filtered/e1FWoMLjAU0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[60.0, 61.79], [63.0, 63.86], [65.0, 65.97], [71.0, 72.82], [73.0, 74.76], [76.0, 77.41], [79.0, 81.35], [83.0, 84.21], [86.0, 86.54], [88.0, 90.14], [90.0, 93.43], [94.0, 95.3], [97.0, 97.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52, 0.0, 0.0, 77.03, 50.61, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.79, 0.86, 0.97, 1.82, 1.76, 1.41, 2.35, 1.21, 0.54, 2.14, 3.43, 1.3, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/e1bMBM_rgwQ_filtered.json b/annotations_filtered/e1bMBM_rgwQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f7f4ee98e0bf704609326268e83c80669f6f257 --- /dev/null +++ b/annotations_filtered/e1bMBM_rgwQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.32], [14.0, 15.79], [18.0, 19.4], [20.0, 21.63], [26.0, 26.33], [31.0, 31.68], [36.0, 36.34], [42.0, 46.47], [52.0, 53.08], [54.0, 54.65], [57.0, 57.69], [58.0, 59.0], [60.0, 62.26], [67.0, 69.62], [71.0, 71.85]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.16, 0.0, 0.0, 0.0, 0.0, 45.92, 46.83, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 18.86], ["radio", 10.34], ["noise", 9.59]], null, null, null, null, [["hum", 26.18], ["throbbing", 14.56], ["mains hum", 13.05]], [["speech", 21.24], ["hum", 20.28], ["radio", 17.07]], null], "duration": [1.32, 1.79, 1.4, 1.63, 0.33, 0.68, 0.34, 4.47, 1.08, 0.65, 0.69, 1.0, 2.26, 2.62, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/e2-VnrdN_Ng_filtered.json b/annotations_filtered/e2-VnrdN_Ng_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9808306b602d78436833f2aeb1b37c8574249768 --- /dev/null +++ b/annotations_filtered/e2-VnrdN_Ng_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.05], [3.0, 3.0], [4.0, 4.08], [8.0, 7.69], [16.0, 17.02], [18.0, 19.4], [23.0, 23.36], [24.0, 25.46], [34.0, 36.78], [41.0, 42.62], [47.0, 59.29], [60.0, 122.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66, 0.0, 67.38, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.05, 0.0, 0.08, -0.31, 1.02, 1.4, 0.36, 1.46, 2.78, 1.62, 12.29, 62.72]} \ No newline at end of file diff --git a/annotations_filtered/e2FdM0YQSHk_filtered.json b/annotations_filtered/e2FdM0YQSHk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ac35a0934bf47e518c58b69d9670fde00c41ef2 --- /dev/null +++ b/annotations_filtered/e2FdM0YQSHk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.37], [25.0, 26.1], [28.0, 28.26], [30.0, 39.5], [41.0, 63.61]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 92.31, 54.23], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.37, 1.1, 0.26, 9.5, 22.61]} \ No newline at end of file diff --git a/annotations_filtered/e2Odq49gEbs_filtered.json b/annotations_filtered/e2Odq49gEbs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24bddffff265f59ab53f42e9136b0c2de7f979ba --- /dev/null +++ b/annotations_filtered/e2Odq49gEbs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.28], [24.0, 38.79], [47.0, 47.02], [53.0, 54.04], [55.0, 55.09], [56.0, 61.87], [64.0, 72.6], [74.0, 75.41], [82.0, 92.38], [94.0, 98.05], [100.0, 107.42], [108.0, 108.89], [110.0, 110.83], [112.0, 112.33], [114.0, 114.67], [115.0, 117.61], [119.0, 120.43], [131.0, 131.43]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [48.35, 46.15, 0.0, 0.0, 0.0, 40.16, 40.9, 0.0, 51.28, 73.06, 73.67, 0.0, 0.0, 0.0, 0.0, 55.18, 0.0, 0.0], "audiomae_on_audioset": [[["music", 47.47], ["hum", 21.39], ["mains hum", 7.8]], [["noise", 31.02], ["hum", 27.41], ["music", 10.65]], null, null, null, [["music", 37.27], ["speech", 24.44], ["synthesizer", 6.19]], [["music", 53.75], ["throbbing", 11.1], ["hum", 8.26]], null, null, null, null, null, null, null, null, null, null, null], "duration": [2.28, 14.79, 0.02, 1.04, 0.09, 5.87, 8.6, 1.41, 10.38, 4.05, 7.42, 0.89, 0.83, 0.33, 0.67, 2.61, 1.43, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/e2RQwVyRSGU_filtered.json b/annotations_filtered/e2RQwVyRSGU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62d408ffe3ffb41172e93985ed4711f2d2ac0911 --- /dev/null +++ b/annotations_filtered/e2RQwVyRSGU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 27.78], [31.0, 32.09], [38.0, 39.11], [40.0, 40.27], [42.0, 43.02], [45.0, 48.59], [65.0, 65.57], [67.0, 99.01]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [1.78, 1.09, 1.11, 0.27, 1.02, 3.59, 0.57, 32.01]} \ No newline at end of file diff --git a/annotations_filtered/e2dAiCB6igE_filtered.json b/annotations_filtered/e2dAiCB6igE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f068ad82f8c2fba909e4acfc89c68cb0292185f --- /dev/null +++ b/annotations_filtered/e2dAiCB6igE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.0], [16.0, 16.44], [22.0, 22.64], [24.0, 24.75], [28.0, 29.44], [30.0, 31.21], [33.0, 34.42], [39.0, 40.61], [52.0, 52.44], [57.0, 57.84], [61.0, 64.77], [67.0, 69.38], [71.0, 70.87], [72.0, 73.79], [82.0, 88.25], [91.0, 91.84], [93.0, 93.68], [101.0, 107.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.72, 99.91, 0.0, 0.0, 42.67, 0.0, 0.0, 30.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.51], ["fly, housefly", 8.75], ["buzz", 3.29]], null, null, [["music", 30.06], ["fly, housefly", 7.36], ["mosquito", 6.73]]], "duration": [1.0, 0.44, 0.64, 0.75, 1.44, 1.21, 1.42, 1.61, 0.44, 0.84, 3.77, 2.38, -0.13, 1.79, 6.25, 0.84, 0.68, 6.86]} \ No newline at end of file diff --git a/annotations_filtered/e2g4Wr81rz8_filtered.json b/annotations_filtered/e2g4Wr81rz8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb373153d26c66c0080b703486131db2dfb5f955 --- /dev/null +++ b/annotations_filtered/e2g4Wr81rz8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.3], [10.0, 10.66], [24.0, 24.53], [28.0, 28.21], [33.0, 33.49], [51.0, 54.28], [91.0, 93.23], [94.0, 103.82], [111.0, 116.94], [129.0, 131.94]], "keep_status": [false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.52, 98.27, 99.93, 34.37, 37.09], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 25.95], ["cattle, bovinae", 14.05], ["moo", 12.65]], [["speech", 26.35], ["cattle, bovinae", 11.16], ["moo", 8.22]]], "duration": [1.3, 0.66, 0.53, 0.21, 0.49, 3.28, 2.23, 9.82, 5.94, 2.94]} \ No newline at end of file diff --git a/annotations_filtered/e2xiwiWd_sM_filtered.json b/annotations_filtered/e2xiwiWd_sM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2fce300391276a79c780498bd9f07e6f21eceada --- /dev/null +++ b/annotations_filtered/e2xiwiWd_sM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.22], [2.0, 13.12], [14.0, 14.23], [15.0, 15.89], [17.0, 18.42], [19.0, 20.28], [22.0, 22.27], [23.0, 25.19], [31.0, 31.02], [32.0, 38.21], [40.0, 41.44], [42.0, 44.68], [47.0, 48.3], [49.0, 51.81], [53.0, 54.11], [54.0, 55.22], [56.0, 57.72]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 80.46, 0.0, 0.0, 0.0, 0.0, 0.0, 95.64, 0.0, 48.39, 0.0, 97.0, 0.0, 76.04, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["hum", 20.91], ["door", 9.88], ["noise", 8.75]], null, null, null, null, null, null, null], "duration": [0.22, 11.12, 0.23, 0.89, 1.42, 1.28, 0.27, 2.19, 0.02, 6.21, 1.44, 2.68, 1.3, 2.81, 1.11, 1.22, 1.72]} \ No newline at end of file diff --git a/annotations_filtered/e3BZn-XJ4mU_filtered.json b/annotations_filtered/e3BZn-XJ4mU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2529c6881564014a6fafbcd77b29321b31553cbe --- /dev/null +++ b/annotations_filtered/e3BZn-XJ4mU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 35.53], [36.0, 35.58], [36.0, 44.9], [46.0, 49.57], [50.0, 73.52], [75.0, 74.87], [76.0, 78.11], [80.0, 93.9], [97.0, 97.77], [100.0, 111.28], [112.0, 114.76], [117.0, 120.88], [121.0, 129.71], [130.0, 134.22], [137.0, 142.28], [143.0, 143.77]], "keep_status": [true, false, false, true, false, false, true, true, false, false, true, true, true, true, true, false], "silence_prob": [28.15, 0.0, 31.04, 31.14, 29.69, 0.0, 29.67, 27.86, 0.0, 28.48, 29.48, 29.45, 29.51, 28.81, 29.46, 0.0], "audiomae_on_audioset": [[["explosion", 20.85], ["music", 10.57], ["whack, thwack", 7.35]], null, [["speech", 66.87], ["music", 7.8], ["breaking", 2.28]], [["music", 52.39], ["hum", 2.64], ["vehicle", 2.21]], [["livestock, farm animals, working animals", 40.85], ["cattle, bovinae", 28.52], ["moo", 9.5]], null, [["sound effect", 13.32], ["whale vocalization", 12.86], ["roar", 8.7]], [["explosion", 15.17], ["rumble", 14.42], ["music", 6.74]], null, [["music", 72.89], ["throbbing", 6.81], ["hum", 6.34]], [["speech", 10.31], ["hum", 9.14], ["whack, thwack", 8.64]], [["music", 28.39], ["whack, thwack", 8.72], ["throbbing", 8.18]], [["music", 36.92], ["whack, thwack", 9.25], ["clang", 8.34]], [["music", 54.73], ["speech", 7.26], ["boing", 5.89]], [["ding", 31.02], ["boing", 11.6], ["music", 11.59]], null], "duration": [12.53, -0.42, 8.9, 3.57, 23.52, -0.13, 2.11, 13.9, 0.77, 11.28, 2.76, 3.88, 8.71, 4.22, 5.28, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/e3mwmwPhr08_filtered.json b/annotations_filtered/e3mwmwPhr08_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c532e0cbde3ba3b53f3b36191847703621a047ff --- /dev/null +++ b/annotations_filtered/e3mwmwPhr08_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 30.7], [32.0, 33.52], [36.0, 36.46], [37.0, 38.03], [41.0, 41.77], [44.0, 45.06], [51.0, 51.31], [52.0, 54.55], [57.0, 58.67], [60.0, 61.26], [65.0, 67.37], [68.0, 71.58], [73.0, 75.64], [79.0, 79.47], [80.0, 82.09], [84.0, 86.49], [89.0, 90.59], [95.0, 95.32], [98.0, 98.9], [102.0, 102.91], [104.0, 105.92], [106.0, 108.3], [110.0, 112.65], [114.0, 115.43], [119.0, 121.9], [127.0, 130.38], [131.0, 131.9], [133.0, 133.89], [136.0, 136.68], [138.0, 139.04], [141.0, 143.94], [145.0, 146.72], [148.0, 151.33], [153.0, 156.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [75.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 98.1, 94.95, 0.0, 92.8, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.01, 100.0, 0.0, 64.75, 57.09, 0.0, 0.0, 0.0, 0.0, 49.68, 0.0, 56.55, 60.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.67], ["sine wave", 22.69], ["singing bowl", 7.04]], null, null, null, null, null, null, null, null, [["gong", 30.58], ["music", 28.16], ["singing bowl", 10.96]], null, null, null], "duration": [2.7, 1.52, 0.46, 1.03, 0.77, 1.06, 0.31, 2.55, 1.67, 1.26, 2.37, 3.58, 2.64, 0.47, 2.09, 2.49, 1.59, 0.32, 0.9, 0.91, 1.92, 2.3, 2.65, 1.43, 2.9, 3.38, 0.9, 0.89, 0.68, 1.04, 2.94, 1.72, 3.33, 3.68]} \ No newline at end of file diff --git a/annotations_filtered/e4-STTC0pNc_filtered.json b/annotations_filtered/e4-STTC0pNc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1acdbc3e510d031fcc31e26ef5b5e7577b0e0972 --- /dev/null +++ b/annotations_filtered/e4-STTC0pNc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 39.83], [41.0, 64.45], [67.0, 75.76], [78.0, 78.44], [80.0, 81.06], [82.0, 87.96], [89.0, 101.93], [102.0, 102.17], [106.0, 109.83]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [69.07, 75.72, 99.99, 0.0, 0.0, 99.97, 69.61, 0.0, 41.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 63.15], ["theremin", 16.52], ["ambient music", 6.96]]], "duration": [5.83, 23.45, 8.76, 0.44, 1.06, 5.96, 12.93, 0.17, 3.83]} \ No newline at end of file diff --git a/annotations_filtered/e434wHYilA0_filtered.json b/annotations_filtered/e434wHYilA0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a1aed6b93c60b677ffb03c92d61996c1dd70cbd --- /dev/null +++ b/annotations_filtered/e434wHYilA0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 9.04], [9.0, 10.72], [13.0, 13.05], [18.0, 25.19], [27.0, 27.51], [28.0, 28.29], [29.0, 30.4], [32.0, 33.93], [35.0, 35.16], [36.0, 47.36], [48.0, 48.68], [50.0, 57.35], [60.0, 67.63], [68.0, 69.16], [71.0, 71.39], [75.0, 75.0], [77.0, 77.85], [79.0, 82.68], [87.0, 88.06], [89.0, 89.78], [90.0, 89.85], [90.0, 93.93], [94.0, 104.55], [106.0, 105.93], [108.0, 108.75], [109.0, 110.22], [111.0, 111.81], [112.0, 118.12], [121.0, 130.32], [132.0, 147.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, true, false, false, false, false, false, true, true, false], "silence_prob": [58.22, 0.0, 0.0, 46.86, 0.0, 0.0, 0.0, 0.0, 0.0, 45.88, 0.0, 40.24, 45.08, 0.0, 0.0, 0.0, 0.0, 43.05, 0.0, 0.0, 0.0, 44.32, 40.88, 0.0, 0.0, 0.0, 0.0, 33.28, 32.46, 29.75], "audiomae_on_audioset": [null, null, null, [["speech", 60.94], ["radio", 31.31], ["hum", 1.04]], null, null, null, null, null, [["mains hum", 59.72], ["hum", 24.53], ["speech", 8.86]], null, [["speech", 73.11], ["radio", 8.72], ["mains hum", 3.79]], [["music", 25.7], ["hum", 19.16], ["mains hum", 14.47]], null, null, null, null, [["music", 40.55], ["hum", 11.37], ["didgeridoo", 7.63]], null, null, null, [["music", 17.28], ["radio", 14.73], ["hum", 12.96]], [["speech", 35.86], ["hum", 23.66], ["mains hum", 22.62]], null, null, null, null, [["music", 19.86], ["speech", 12.88], ["cough", 9.91]], [["music", 36.19], ["speech", 26.44], ["didgeridoo", 4.66]], [["hum", 48.66], ["mains hum", 31.37], ["throbbing", 6.21]]], "duration": [7.04, 1.72, 0.05, 7.19, 0.51, 0.29, 1.4, 1.93, 0.16, 11.36, 0.68, 7.35, 7.63, 1.16, 0.39, 0.0, 0.85, 3.68, 1.06, 0.78, -0.15, 3.93, 10.55, -0.07, 0.75, 1.22, 0.81, 6.12, 9.32, 15.88]} \ No newline at end of file diff --git a/annotations_filtered/e48T01eVXtU_filtered.json b/annotations_filtered/e48T01eVXtU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80d23c29423f83d21063b1a26b88032ce4027483 --- /dev/null +++ b/annotations_filtered/e48T01eVXtU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.52], [12.0, 12.23], [21.0, 22.49], [37.0, 44.41], [48.0, 49.92], [52.0, 56.61], [57.0, 58.36], [65.0, 68.84], [73.0, 74.48], [75.0, 75.22], [76.0, 81.7], [91.0, 91.47], [92.0, 94.53], [96.0, 99.2], [102.0, 103.32], [104.0, 108.65], [109.0, 108.9], [110.0, 110.17], [113.0, 114.52], [117.0, 118.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, true, false, false, false, false], "silence_prob": [38.15, 0.0, 0.0, 30.13, 0.0, 30.45, 0.0, 29.71, 0.0, 0.0, 30.93, 0.0, 30.46, 32.8, 0.0, 30.68, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 43.41], ["cattle, bovinae", 28.68], ["moo", 14.11]], null, null, [["music", 42.17], ["speech", 24.34], ["cattle, bovinae", 5.57]], null, [["moo", 42.12], ["cattle, bovinae", 26.57], ["livestock, farm animals, working animals", 9.8]], null, [["music", 59.82], ["speech", 17.54], ["boing", 5.08]], null, null, [["fly, housefly", 24.32], ["mosquito", 18.31], ["music", 16.1]], null, [["music", 45.94], ["boing", 12.05], ["speech", 5.94]], [["music", 40.04], ["speech", 9.65], ["musical instrument", 9.28]], null, [["cattle, bovinae", 23.48], ["moo", 21.46], ["fart", 11.48]], null, null, null, null], "duration": [7.52, 0.23, 1.49, 7.41, 1.92, 4.61, 1.36, 3.84, 1.48, 0.22, 5.7, 0.47, 2.53, 3.2, 1.32, 4.65, -0.1, 0.17, 1.52, 1.47]} \ No newline at end of file diff --git a/annotations_filtered/e4Dlc6yqJuA_filtered.json b/annotations_filtered/e4Dlc6yqJuA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..235efaa26013283e0a0b96fba1839414e0e6722c --- /dev/null +++ b/annotations_filtered/e4Dlc6yqJuA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.73], [14.0, 16.58], [18.0, 42.06], [45.0, 45.47], [47.0, 48.05]], "keep_status": [false, false, true, false, false], "silence_prob": [90.43, 89.9, 31.58, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 40.2], ["hum", 19.74], ["mains hum", 7.03]], null, null], "duration": [4.73, 2.58, 24.06, 0.47, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/e4RGh5iAykY_filtered.json b/annotations_filtered/e4RGh5iAykY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..98fcbae64572e9df81020b716a7efb2b300f041c --- /dev/null +++ b/annotations_filtered/e4RGh5iAykY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 11.28], [13.0, 13.61], [16.0, 16.93], [18.0, 17.81], [20.0, 20.76], [23.0, 24.06], [26.0, 29.47], [30.0, 30.7], [34.0, 34.72], [38.0, 41.05], [43.0, 42.84], [45.0, 45.01], [48.0, 48.24], [51.0, 51.7], [55.0, 63.58], [64.0, 64.88], [66.0, 74.43], [75.0, 76.03], [86.0, 86.36], [87.0, 88.48], [89.0, 89.65], [90.0, 94.39], [108.0, 108.33], [115.0, 115.3], [117.0, 117.51], [118.0, 119.01], [121.0, 121.37], [123.0, 125.2], [127.0, 127.6], [128.0, 134.67], [136.0, 136.49], [137.0, 139.14], [143.0, 143.11], [144.0, 149.15], [150.0, 151.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.06, 0.0, 0.0, 0.0, 0.0, 0.0, 99.87, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 98.93, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 100.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [[["music", 56.5], ["theremin", 14.16], ["musical instrument", 4.94]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [10.28, 0.61, 0.93, -0.19, 0.76, 1.06, 3.47, 0.7, 0.72, 3.05, -0.16, 0.01, 0.24, 0.7, 8.58, 0.88, 8.43, 1.03, 0.36, 1.48, 0.65, 4.39, 0.33, 0.3, 0.51, 1.01, 0.37, 2.2, 0.6, 6.67, 0.49, 2.14, 0.11, 5.15, 1.24]} \ No newline at end of file diff --git a/annotations_filtered/e4yCxKv-2qw_filtered.json b/annotations_filtered/e4yCxKv-2qw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72e125d8cd22f52a769f396fc8dfbd72ef149d22 --- /dev/null +++ b/annotations_filtered/e4yCxKv-2qw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.24], [6.0, 8.77], [11.0, 12.46], [14.0, 16.16], [20.0, 22.86], [24.0, 28.93], [30.0, 31.56], [33.0, 35.16], [36.0, 36.58], [37.0, 39.33], [41.0, 41.64], [45.0, 44.98], [46.0, 48.22], [50.0, 51.75], [52.0, 53.65], [55.0, 55.59], [59.0, 59.61], [60.0, 60.45], [61.0, 61.05], [67.0, 67.61], [68.0, 67.64], [70.0, 71.0], [76.0, 75.98], [77.0, 77.06], [78.0, 80.84], [82.0, 84.15], [85.0, 86.56], [88.0, 88.4], [89.0, 90.31], [91.0, 93.63], [97.0, 99.54], [101.0, 101.09], [102.0, 103.1], [104.0, 104.5], [106.0, 106.79], [110.0, 110.37], [111.0, 112.31], [114.0, 114.3], [116.0, 118.39]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.09, 0.0, 36.08, 72.75, 68.41, 0.0, 52.86, 0.0, 50.61, 0.0, 0.0, 69.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.59, 41.89, 0.0, 0.0, 0.0, 72.16, 60.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.7], "audiomae_on_audioset": [null, [["sound effect", 15.56], ["dishes, pots, and pans", 10.82], ["grunt", 7.11]], null, [["creak", 21.53], ["speech", 20.32], ["tick-tock", 17.06]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 39.02], ["sheep", 9.53], ["bleat", 7.17]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, 2.77, 1.46, 2.16, 2.86, 4.93, 1.56, 2.16, 0.58, 2.33, 0.64, -0.02, 2.22, 1.75, 1.65, 0.59, 0.61, 0.45, 0.05, 0.61, -0.36, 1.0, -0.02, 0.06, 2.84, 2.15, 1.56, 0.4, 1.31, 2.63, 2.54, 0.09, 1.1, 0.5, 0.79, 0.37, 1.31, 0.3, 2.39]} \ No newline at end of file diff --git a/annotations_filtered/e56FOw5rIhw_filtered.json b/annotations_filtered/e56FOw5rIhw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..707598d521f5aed2cf1ece65c944a5435a51886c --- /dev/null +++ b/annotations_filtered/e56FOw5rIhw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 50.28], [51.0, 77.95]], "keep_status": [false, false], "silence_prob": [0.0, 30.83], "audiomae_on_audioset": [null, [["music", 56.45], ["throbbing", 10.65], ["musical instrument", 4.5]]], "duration": [0.28, 26.95]} \ No newline at end of file diff --git a/annotations_filtered/e5LZR3vCkzo_filtered.json b/annotations_filtered/e5LZR3vCkzo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af3689afb1730ee77c57ec550a720ecf591eecf1 --- /dev/null +++ b/annotations_filtered/e5LZR3vCkzo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.13], [10.0, 10.88], [13.0, 14.5], [16.0, 20.17], [27.0, 64.5], [66.0, 66.46], [70.0, 78.75], [79.0, 80.33], [81.0, 108.63]], "keep_status": [false, false, false, true, false, false, false, false, true], "silence_prob": [60.42, 0.0, 0.0, 35.0, 0.0, 0.0, 32.52, 0.0, 30.57], "audiomae_on_audioset": [null, null, null, [["music", 36.42], ["throbbing", 16.46], ["hum", 16.37]], null, null, [["music", 68.46], ["speech", 5.44], ["throbbing", 4.54]], null, [["music", 42.24], ["speech", 12.1], ["whack, thwack", 10.14]]], "duration": [3.13, 0.88, 1.5, 4.17, 37.5, 0.46, 8.75, 1.33, 27.63]} \ No newline at end of file diff --git a/annotations_filtered/e5SbxMFk6Vo_filtered.json b/annotations_filtered/e5SbxMFk6Vo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d67fb57a88e2c7e03bc731490e95399866dab9a --- /dev/null +++ b/annotations_filtered/e5SbxMFk6Vo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.88], [7.0, 7.6], [9.0, 10.89], [23.0, 23.4], [27.0, 27.14], [37.0, 36.8], [50.0, 50.48], [53.0, 53.33], [57.0, 60.72], [64.0, 67.34], [70.0, 69.72], [70.0, 69.75], [70.0, 79.74], [84.0, 94.56], [103.0, 102.78], [103.0, 118.83], [120.0, 120.06], [126.0, 126.3]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.3, 30.29, 0.0, 0.0, 30.23, 30.0, 0.0, 30.64, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 55.26], ["speech", 15.52], ["electronic music", 3.52]], [["music", 54.58], ["speech", 9.73], ["boing", 4.41]], null, null, [["music", 74.44], ["speech", 10.08], ["didgeridoo", 4.33]], [["music", 55.45], ["brass instrument", 8.85], ["trombone", 4.94]], null, [["livestock, farm animals, working animals", 31.77], ["music", 18.64], ["moo", 17.12]], null, null], "duration": [0.88, 0.6, 1.89, 0.4, 0.14, -0.2, 0.48, 0.33, 3.72, 3.34, -0.28, -0.25, 9.74, 10.56, -0.22, 15.83, 0.06, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/e5Tb2YSkGh0_filtered.json b/annotations_filtered/e5Tb2YSkGh0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1c6a705daa331a518944ae6d87501bd063a89d4 --- /dev/null +++ b/annotations_filtered/e5Tb2YSkGh0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.29], [7.0, 7.5], [10.0, 10.49], [15.0, 15.36], [26.0, 27.8], [28.0, 28.95], [29.0, 29.67], [40.0, 67.64]], "keep_status": [false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["radio", 46.5], ["noise", 8.36], ["sidetone", 5.75]]], "duration": [0.29, 0.5, 0.49, 0.36, 1.8, 0.95, 0.67, 27.64]} \ No newline at end of file diff --git a/annotations_filtered/e5cg1EeFISo_filtered.json b/annotations_filtered/e5cg1EeFISo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91d8d4497fbfe35fb60226aabcabb30a65f078db --- /dev/null +++ b/annotations_filtered/e5cg1EeFISo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.04], [9.0, 9.07], [30.0, 30.27], [39.0, 40.47], [50.0, 50.77], [74.0, 74.6], [76.0, 75.83], [91.0, 91.03], [103.0, 106.86], [109.0, 109.76], [127.0, 127.01], [128.0, 128.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.5, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.04, 0.07, 0.27, 1.47, 0.77, 0.6, -0.17, 0.03, 3.86, 0.76, 0.01, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/e6B-T4KYIFQ_filtered.json b/annotations_filtered/e6B-T4KYIFQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..815885a22353b1ce15a8abb21898376c1b1c10e1 --- /dev/null +++ b/annotations_filtered/e6B-T4KYIFQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.64], [8.0, 29.32], [32.0, 33.89], [36.0, 38.58], [39.0, 38.75], [39.0, 39.04], [39.0, 49.54], [54.0, 56.76], [58.0, 59.64], [63.0, 73.3], [77.0, 98.63], [103.0, 105.61], [106.0, 118.56], [126.0, 126.32], [127.0, 143.04]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 49.04, 0.0, 46.19, 0.0, 0.0, 48.74, 94.22, 0.0, 47.78, 35.4, 30.67, 33.5, 0.0, 39.91], "audiomae_on_audioset": [null, [["music", 32.85], ["speech", 9.39], ["boing", 8.27]], null, [["speech", 20.76], ["music", 6.79], ["singing bowl", 3.8]], null, null, [["music", 35.7], ["speech", 29.53], ["whack, thwack", 6.13]], null, null, [["music", 66.71], ["electronic music", 4.64], ["thunk", 3.67]], [["music", 60.17], ["electronic music", 6.74], ["ambient music", 5.88]], [["speech", 32.66], ["sheep", 22.94], ["bleat", 13.85]], [["music", 71.56], ["scary music", 6.47], ["speech", 4.28]], null, [["speech", 58.1], ["animal", 14.81], ["dog", 5.38]]], "duration": [1.64, 21.32, 1.89, 2.58, -0.25, 0.04, 10.54, 2.76, 1.64, 10.3, 21.63, 2.61, 12.56, 0.32, 16.04]} \ No newline at end of file diff --git a/annotations_filtered/e6WyN4z0VGc_filtered.json b/annotations_filtered/e6WyN4z0VGc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..14f0bd3c67d423fce88cfc4ca59b507d86582410 --- /dev/null +++ b/annotations_filtered/e6WyN4z0VGc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.23], [5.0, 6.02], [6.0, 8.8], [9.0, 11.65], [13.0, 14.35], [15.0, 17.73], [21.0, 26.77], [27.0, 29.0], [30.0, 34.89], [36.0, 36.95], [40.0, 41.76], [45.0, 48.1], [50.0, 54.45], [56.0, 58.55], [59.0, 63.37], [64.0, 65.18], [66.0, 66.55], [69.0, 70.56], [72.0, 73.06], [74.0, 85.06], [86.0, 96.03], [98.0, 98.49], [101.0, 102.84], [105.0, 105.46], [108.0, 108.55], [109.0, 110.79], [113.0, 113.98], [117.0, 117.96], [122.0, 123.15], [124.0, 124.63], [130.0, 130.1], [131.0, 132.26], [135.0, 138.28], [141.0, 141.61], [145.0, 144.71], [147.0, 147.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [90.43, 0.0, 91.3, 99.68, 0.0, 100.0, 100.0, 86.09, 100.0, 0.0, 0.0, 99.97, 100.0, 81.35, 100.0, 0.0, 0.0, 0.0, 0.0, 99.1, 59.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.23, 1.02, 2.8, 2.65, 1.35, 2.73, 5.77, 2.0, 4.89, 0.95, 1.76, 3.1, 4.45, 2.55, 4.37, 1.18, 0.55, 1.56, 1.06, 11.06, 10.03, 0.49, 1.84, 0.46, 0.55, 1.79, 0.98, 0.96, 1.15, 0.63, 0.1, 1.26, 3.28, 0.61, -0.29, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/e6omnFC9jC4_filtered.json b/annotations_filtered/e6omnFC9jC4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef59c8b4346713e58762b5af40a2645b134330b0 --- /dev/null +++ b/annotations_filtered/e6omnFC9jC4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.69], [6.0, 7.05], [14.0, 14.86], [16.0, 21.66], [23.0, 26.03], [27.0, 28.07], [29.0, 44.91], [46.0, 47.01], [48.0, 48.49], [54.0, 57.3], [58.0, 59.36], [60.0, 66.45], [68.0, 71.34], [72.0, 73.16], [74.0, 74.04], [74.0, 78.56], [81.0, 82.58], [84.0, 86.27], [87.0, 88.23], [91.0, 92.67], [94.0, 96.47], [99.0, 100.5], [103.0, 104.18], [105.0, 106.24], [109.0, 111.82], [112.0, 113.04], [114.0, 114.59], [116.0, 118.74], [122.0, 123.33]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 45.4, 47.78, 0.0, 62.78, 0.0, 0.0, 79.94, 0.0, 80.64, 64.29, 0.0, 0.0, 37.25, 0.0, 61.37, 0.0, 0.0, 70.86, 0.0, 0.0, 0.0, 84.62, 0.0, 0.0, 54.7, 0.0], "audiomae_on_audioset": [null, null, null, [["eruption", 23.02], ["hum", 15.35], ["explosion", 12.45]], [["hum", 17.43], ["mains hum", 10.7], ["static", 9.42]], null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 32.56], ["insect", 25.9], ["fart", 7.16]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.69, 1.05, 0.86, 5.66, 3.03, 1.07, 15.91, 1.01, 0.49, 3.3, 1.36, 6.45, 3.34, 1.16, 0.04, 4.56, 1.58, 2.27, 1.23, 1.67, 2.47, 1.5, 1.18, 1.24, 2.82, 1.04, 0.59, 2.74, 1.33]} \ No newline at end of file diff --git a/annotations_filtered/e72atw7hctA_filtered.json b/annotations_filtered/e72atw7hctA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bcaaeaa0e98babbd425795436d42d943d72ad15 --- /dev/null +++ b/annotations_filtered/e72atw7hctA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.12], [19.0, 20.78], [25.0, 25.49], [26.0, 26.4], [31.0, 40.66], [43.0, 43.75], [46.0, 53.52], [58.0, 58.95], [72.0, 79.02], [83.0, 85.4]], "keep_status": [false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 54.7, 0.0, 38.78, 0.0, 48.56, 53.04], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 40.44], ["didgeridoo", 19.35], ["throbbing", 5.95]], null, [["throbbing", 53.35], ["hum", 32.86], ["music", 5.16]], null], "duration": [0.12, 1.78, 0.49, 0.4, 9.66, 0.75, 7.52, 0.95, 7.02, 2.4]} \ No newline at end of file diff --git a/annotations_filtered/e77ybggTHHg_filtered.json b/annotations_filtered/e77ybggTHHg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16e14bb5cb71753b057c3c7c0eeaeb2f590f3bcc --- /dev/null +++ b/annotations_filtered/e77ybggTHHg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 9.21], [12.0, 13.86], [18.0, 18.28], [23.0, 28.98], [30.0, 37.56], [40.0, 43.17], [46.0, 59.22], [64.0, 68.35], [71.0, 72.54], [76.0, 79.24], [81.0, 82.44], [83.0, 85.8], [88.0, 90.75], [93.0, 107.01], [108.0, 110.29], [112.0, 122.89], [125.0, 126.59]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, false, false], "silence_prob": [30.69, 0.0, 0.0, 35.87, 37.54, 33.65, 31.21, 35.39, 0.0, 34.07, 0.0, 37.83, 34.13, 32.55, 36.37, 32.49, 0.0], "audiomae_on_audioset": [[["hum", 41.09], ["throbbing", 23.24], ["music", 14.98]], null, null, [["music", 40.74], ["hum", 26.2], ["throbbing", 18.64]], [["music", 29.49], ["hum", 27.32], ["throbbing", 19.42]], [["music", 57.65], ["throbbing", 13.03], ["hum", 8.71]], [["music", 69.6], ["throbbing", 11.09], ["hum", 9.4]], [["music", 42.46], ["throbbing", 11.6], ["hum", 11.21]], null, [["music", 69.12], ["throbbing", 6.56], ["hum", 2.56]], null, [["music", 59.93], ["electronic music", 9.56], ["throbbing", 8.96]], [["music", 28.23], ["speech", 17.28], ["hum", 8.43]], [["music", 64.37], ["throbbing", 12.02], ["hum", 5.09]], [["music", 58.11], ["didgeridoo", 5.22], ["synthesizer", 3.89]], [["throbbing", 31.81], ["music", 26.61], ["hum", 23.37]], null], "duration": [7.21, 1.86, 0.28, 5.98, 7.56, 3.17, 13.22, 4.35, 1.54, 3.24, 1.44, 2.8, 2.75, 14.01, 2.29, 10.89, 1.59]} \ No newline at end of file diff --git a/annotations_filtered/e7Efjj3_uME_filtered.json b/annotations_filtered/e7Efjj3_uME_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..504a0f5e05e63263daf35e9a9a9584b5e82785ea --- /dev/null +++ b/annotations_filtered/e7Efjj3_uME_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 17.46], [38.0, 39.18], [50.0, 50.19], [60.0, 60.05], [64.0, 65.01], [72.0, 73.18], [74.0, 74.29], [79.0, 79.15], [80.0, 80.23], [83.0, 84.4], [85.0, 85.67], [88.0, 101.92], [103.0, 103.03], [104.0, 104.62], [106.0, 106.05], [108.0, 108.95], [113.0, 113.48]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [31.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.12, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["didgeridoo", 10.6], ["hum", 10.19], ["music", 8.2]], null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 27.78], ["moo", 21.77], ["cattle, bovinae", 20.36]], null, null, null, null, null], "duration": [9.46, 1.18, 0.19, 0.05, 1.01, 1.18, 0.29, 0.15, 0.23, 1.4, 0.67, 13.92, 0.03, 0.62, 0.05, 0.95, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/e7X01_j_oDA_filtered.json b/annotations_filtered/e7X01_j_oDA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6217e9fb33526a7d40a6e63e14fb62ca90d92714 --- /dev/null +++ b/annotations_filtered/e7X01_j_oDA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.42], [7.0, 17.42], [19.0, 28.41], [29.0, 30.48], [33.0, 33.07], [34.0, 39.8], [40.0, 40.86], [43.0, 46.16], [48.0, 49.49], [52.0, 54.89], [55.0, 65.08], [67.0, 74.49], [76.0, 80.32], [81.0, 86.53], [95.0, 95.88], [98.0, 101.49], [102.0, 104.28], [106.0, 111.0], [113.0, 115.75]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [63.96, 32.11, 81.89, 0.0, 0.0, 57.81, 0.0, 34.57, 0.0, 38.42, 71.72, 38.26, 31.92, 99.4, 0.0, 53.65, 48.91, 52.27, 53.4], "audiomae_on_audioset": [null, [["music", 41.95], ["hum", 7.93], ["synthesizer", 7.74]], null, null, null, null, null, [["sidetone", 67.43], ["speech", 13.52], ["boing", 11.32]], null, [["noise", 27.02], ["speech", 24.35], ["radio", 17.16]], null, [["music", 62.41], ["musical instrument", 9.22], ["synthesizer", 7.75]], [["music", 34.26], ["sound effect", 6.29], ["cacophony", 2.92]], null, null, null, [["music", 60.43], ["synthesizer", 8.61], ["musical instrument", 5.81]], null, null], "duration": [2.42, 10.42, 9.41, 1.48, 0.07, 5.8, 0.86, 3.16, 1.49, 2.89, 10.08, 7.49, 4.32, 5.53, 0.88, 3.49, 2.28, 5.0, 2.75]} \ No newline at end of file diff --git a/annotations_filtered/e7dbge0Zk5A_filtered.json b/annotations_filtered/e7dbge0Zk5A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4667656469cc13c683ad2356cdba6e8334c01856 --- /dev/null +++ b/annotations_filtered/e7dbge0Zk5A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 79.83], [81.0, 95.72], [96.0, 96.79], [97.0, 100.25], [100.0, 111.86], [113.0, 115.32], [116.0, 116.48], [118.0, 118.44], [124.0, 124.92]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.1, 0.0, 69.61, 50.41, 92.97, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 64.32], ["buzz", 7.43], ["electric shaver, electric razor", 3.78]], null, null, null, null, null, null, null], "duration": [36.83, 14.72, 0.79, 3.25, 11.86, 2.32, 0.48, 0.44, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/e7qjmOp9G34_filtered.json b/annotations_filtered/e7qjmOp9G34_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c2f9bd802ffed71bd588d578847a61db7a6f522 --- /dev/null +++ b/annotations_filtered/e7qjmOp9G34_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 51.98], [54.0, 80.22], [81.0, 85.62], [87.0, 88.48], [90.0, 90.22], [96.0, 97.8], [99.0, 107.5], [110.0, 111.82], [115.0, 125.29], [127.0, 130.92], [131.0, 136.7], [137.0, 139.85], [140.0, 141.66]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, true, false], "silence_prob": [0.0, 32.25, 37.76, 0.0, 0.0, 0.0, 30.35, 0.0, 29.97, 40.45, 40.59, 44.01, 0.0], "audiomae_on_audioset": [null, [["music", 38.4], ["throbbing", 25.24], ["hum", 22.43]], [["music", 58.09], ["throbbing", 10.74], ["hum", 6.82]], null, null, null, [["throbbing", 55.86], ["hum", 17.57], ["music", 11.31]], null, [["speech", 42.21], ["music", 17.63], ["throbbing", 12.82]], [["music", 28.99], ["throbbing", 23.65], ["hum", 14.09]], [["throbbing", 24.47], ["hum", 23.09], ["music", 16.9]], [["music", 37.44], ["throbbing", 19.49], ["hum", 12.31]], null], "duration": [47.98, 26.22, 4.62, 1.48, 0.22, 1.8, 8.5, 1.82, 10.29, 3.92, 5.7, 2.85, 1.66]} \ No newline at end of file diff --git a/annotations_filtered/e80zdJ6pWlI_filtered.json b/annotations_filtered/e80zdJ6pWlI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..573ea4c1b1d99d488122c051e5bcb2ab5e65d138 --- /dev/null +++ b/annotations_filtered/e80zdJ6pWlI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 40.68], [44.0, 83.86]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [35.68, 39.86]} \ No newline at end of file diff --git a/annotations_filtered/e89qDsf6Q3g_filtered.json b/annotations_filtered/e89qDsf6Q3g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c17ea25c372b930f29fc015a4491d6f608f1b50 --- /dev/null +++ b/annotations_filtered/e89qDsf6Q3g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.46], [9.0, 9.95], [24.0, 33.0], [35.0, 35.77], [37.0, 37.12], [38.0, 38.87], [40.0, 40.22], [41.0, 41.72], [42.0, 43.09], [44.0, 45.44], [47.0, 48.47], [52.0, 52.24], [53.0, 59.34], [60.0, 60.71], [62.0, 62.33], [63.0, 64.49], [67.0, 67.9], [80.0, 80.3], [82.0, 82.12], [84.0, 85.06], [86.0, 87.88], [90.0, 90.9], [92.0, 93.85], [96.0, 97.24], [99.0, 100.48], [104.0, 104.04], [108.0, 107.94]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [46.94, 0.0, 30.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 15.0], ["noise", 12.52], ["synthesizer", 11.84]], null, [["music", 37.67], ["effects unit", 11.98], ["gong", 11.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.46, 0.95, 9.0, 0.77, 0.12, 0.87, 0.22, 0.72, 1.09, 1.44, 1.47, 0.24, 6.34, 0.71, 0.33, 1.49, 0.9, 0.3, 0.12, 1.06, 1.88, 0.9, 1.85, 1.24, 1.48, 0.04, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/e8Bn6XVv9ew_filtered.json b/annotations_filtered/e8Bn6XVv9ew_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f824c3eb131bf1c231d9af13c79b076a3beed179 --- /dev/null +++ b/annotations_filtered/e8Bn6XVv9ew_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.86], [15.0, 15.36], [17.0, 18.12], [20.0, 21.39], [23.0, 25.0], [34.0, 36.15], [40.0, 44.49]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [31.91, 0.0, 0.0, 0.0, 31.11, 30.63, 30.61], "audiomae_on_audioset": [[["fly, housefly", 32.34], ["speech", 29.28], ["insect", 17.25]], null, null, null, [["music", 57.46], ["musical instrument", 6.89], ["guitar", 6.54]], [["music", 68.84], ["musical instrument", 3.91], ["electronic music", 3.75]], [["music", 79.92], ["throbbing", 2.45], ["electronic music", 1.75]]], "duration": [4.86, 0.36, 1.12, 1.39, 2.0, 2.15, 4.49]} \ No newline at end of file diff --git a/annotations_filtered/e8EAVtsvfxc_filtered.json b/annotations_filtered/e8EAVtsvfxc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76e0d9b311f4e62772e0554e3b8360256662a226 --- /dev/null +++ b/annotations_filtered/e8EAVtsvfxc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.9], [11.0, 13.63], [15.0, 16.46], [22.0, 24.34], [25.0, 27.01], [28.0, 28.46], [31.0, 31.9], [33.0, 34.05], [35.0, 36.02], [40.0, 39.95], [50.0, 52.08], [56.0, 81.03], [84.0, 85.36], [86.0, 87.35], [89.0, 89.68], [91.0, 91.45], [93.0, 120.28], [121.0, 122.67], [125.0, 127.03], [128.0, 128.95], [131.0, 132.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.8, 0.0, 99.97, 60.6, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 77.87, 0.0, 0.0, 0.0, 0.0, 98.36, 0.0, 89.01, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.9, 2.63, 1.46, 2.34, 2.01, 0.46, 0.9, 1.05, 1.02, -0.05, 2.08, 25.03, 1.36, 1.35, 0.68, 0.45, 27.28, 1.67, 2.03, 0.95, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/e8HRcYG3Ftg_filtered.json b/annotations_filtered/e8HRcYG3Ftg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ee97e405b6071a75c42659036c4738cb9ff9f26 --- /dev/null +++ b/annotations_filtered/e8HRcYG3Ftg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.14], [23.0, 31.01], [33.0, 33.02], [60.0, 63.48], [64.0, 64.91], [66.0, 66.51], [69.0, 69.04], [75.0, 83.81], [85.0, 88.65], [90.0, 93.21], [97.0, 105.14], [106.0, 109.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.24, 0.0, 50.16, 0.0, 0.0, 0.0, 75.72, 59.59, 96.77, 89.19, 67.25], "audiomae_on_audioset": [null, [["speech", 54.04], ["snicker", 16.98], ["chuckle, chortle", 5.65]], null, null, null, null, null, null, null, null, null, null], "duration": [1.14, 8.01, 0.02, 3.48, 0.91, 0.51, 0.04, 8.81, 3.65, 3.21, 8.14, 3.07]} \ No newline at end of file diff --git a/annotations_filtered/e8J56HbIyvc_filtered.json b/annotations_filtered/e8J56HbIyvc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64f886aece91e9a5d244bf8fa6beb5ff877e8b68 --- /dev/null +++ b/annotations_filtered/e8J56HbIyvc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.3], [6.0, 6.56], [12.0, 12.8], [14.0, 14.99], [17.0, 18.64], [20.0, 20.73], [22.0, 22.64], [25.0, 26.2], [32.0, 38.45], [40.0, 41.86], [45.0, 45.54], [48.0, 48.3], [53.0, 53.64], [55.0, 55.83], [59.0, 59.83], [61.0, 61.38], [67.0, 67.91], [69.0, 69.9], [70.0, 71.0], [72.0, 74.17], [76.0, 77.9], [100.0, 102.49], [105.0, 105.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.3, 0.56, 0.8, 0.99, 1.64, 0.73, 0.64, 1.2, 6.45, 1.86, 0.54, 0.3, 0.64, 0.83, 0.83, 0.38, 0.91, 0.9, 1.0, 2.17, 1.9, 2.49, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/e8i7WCXqJ94_filtered.json b/annotations_filtered/e8i7WCXqJ94_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e46e25ef5784c2adeeee2260e438386717ca528 --- /dev/null +++ b/annotations_filtered/e8i7WCXqJ94_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.28], [5.0, 5.7], [7.0, 7.35], [7.0, 16.28], [18.0, 20.33], [22.0, 22.89], [24.0, 24.7], [31.0, 31.26], [34.0, 34.53], [36.0, 37.52], [42.0, 42.96], [60.0, 61.65]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [44.55, 0.0, 0.0, 33.32, 38.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 40.76], ["hum", 12.29], ["throbbing", 11.86]], null, null, [["speech", 30.12], ["music", 27.77], ["hum", 13.09]], [["music", 44.26], ["speech", 19.03], ["hum", 3.15]], null, null, null, null, null, null, null], "duration": [2.28, 0.7, 0.35, 9.28, 2.33, 0.89, 0.7, 0.26, 0.53, 1.52, 0.96, 1.65]} \ No newline at end of file diff --git a/annotations_filtered/e8mmLcViaGI_filtered.json b/annotations_filtered/e8mmLcViaGI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75a76f1c053b2806581d5852ef6c7e2f4dd0c568 --- /dev/null +++ b/annotations_filtered/e8mmLcViaGI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.13], [14.0, 14.66], [16.0, 16.39], [18.0, 18.76], [20.0, 20.43], [22.0, 22.57], [24.0, 24.07], [26.0, 26.97], [28.0, 34.15], [35.0, 35.4], [37.0, 58.13], [58.0, 59.46], [63.0, 64.67], [65.0, 66.55], [67.0, 67.8], [69.0, 86.49], [88.0, 96.96], [101.0, 101.82], [107.0, 107.32], [108.0, 108.24], [113.0, 113.59], [114.0, 114.67], [116.0, 119.65], [120.0, 120.43], [122.0, 123.04], [125.0, 131.04], [131.0, 139.23], [142.0, 143.72], [144.0, 144.64], [146.0, 146.57], [147.0, 147.73], [148.0, 150.23], [153.0, 159.29], [161.0, 162.13], [163.0, 163.46], [164.0, 164.64], [166.0, 166.8], [169.0, 169.7], [171.0, 173.79], [176.0, 181.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.8, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.48, 99.97, 0.0, 0.0, 0.0, 0.0, 94.07, 99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 64.97, 45.08], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 52.59], ["ambient music", 29.37], ["singing bowl", 5.03]]], "duration": [3.13, 0.66, 0.39, 0.76, 0.43, 0.57, 0.07, 0.97, 6.15, 0.4, 21.13, 1.46, 1.67, 1.55, 0.8, 17.49, 8.96, 0.82, 0.32, 0.24, 0.59, 0.67, 3.65, 0.43, 1.04, 6.04, 8.23, 1.72, 0.64, 0.57, 0.73, 2.23, 6.29, 1.13, 0.46, 0.64, 0.8, 0.7, 2.79, 5.87]} \ No newline at end of file diff --git a/annotations_filtered/e96_1NxL9no_filtered.json b/annotations_filtered/e96_1NxL9no_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad2919183fa313e40ece60403dcc508101218f4c --- /dev/null +++ b/annotations_filtered/e96_1NxL9no_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.5], [9.0, 10.57], [12.0, 11.99], [13.0, 13.91], [17.0, 17.37], [20.0, 24.66], [33.0, 35.07], [37.0, 39.36], [43.0, 43.58], [45.0, 45.45], [47.0, 48.44], [49.0, 50.11], [54.0, 54.45], [58.0, 58.56], [59.0, 60.37], [61.0, 62.95], [65.0, 66.01], [71.0, 82.56], [84.0, 86.04], [87.0, 88.28], [92.0, 92.47], [93.0, 99.28], [100.0, 102.27], [115.0, 115.64], [116.0, 133.95], [138.0, 139.94], [141.0, 141.64], [143.0, 143.9], [154.0, 165.89]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 53.1, 34.12, 33.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.34, 38.93, 0.0, 0.0, 32.85, 48.82, 0.0, 34.01, 0.0, 0.0, 0.0, 33.66], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 15.13], ["speech", 15.11], ["boing", 14.92]], [["music", 36.97], ["speech", 21.62], ["boing", 16.77]], null, null, null, null, null, null, null, null, null, [["music", 81.96], ["livestock, farm animals, working animals", 1.69], ["musical instrument", 1.47]], [["music", 50.34], ["speech", 9.22], ["oink", 7.07]], null, null, [["music", 29.97], ["livestock, farm animals, working animals", 13.03], ["animal", 7.64]], [["bleat", 14.17], ["owl", 13.46], ["speech", 13.45]], null, [["music", 82.37], ["hum", 2.29], ["speech", 1.82]], null, null, null, [["music", 33.85], ["livestock, farm animals, working animals", 14.9], ["moo", 9.37]]], "duration": [0.5, 1.57, -0.01, 0.91, 0.37, 4.66, 2.07, 2.36, 0.58, 0.45, 1.44, 1.11, 0.45, 0.56, 1.37, 1.95, 1.01, 11.56, 2.04, 1.28, 0.47, 6.28, 2.27, 0.64, 17.95, 1.94, 0.64, 0.9, 11.89]} \ No newline at end of file diff --git a/annotations_filtered/e9_4oS3hTPk_filtered.json b/annotations_filtered/e9_4oS3hTPk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e94a3dd15c22a68715517a35a499504b69a4e8c --- /dev/null +++ b/annotations_filtered/e9_4oS3hTPk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.92], [10.0, 9.88], [12.0, 14.4], [16.0, 16.75], [18.0, 19.55], [20.0, 21.78], [23.0, 25.41], [27.0, 27.82], [29.0, 30.05], [32.0, 32.43], [34.0, 39.26], [48.0, 106.19], [108.0, 109.04], [110.0, 110.51], [112.0, 112.31], [113.0, 115.6], [120.0, 122.64], [126.0, 125.83], [127.0, 128.68], [133.0, 134.69], [138.0, 139.94], [142.0, 143.94], [145.0, 145.72], [147.0, 148.74], [150.0, 151.34], [153.0, 155.38]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 44.66, 0.0, 0.0, 0.0, 33.72, 0.0, 0.0, 0.0, 0.0, 47.74, 45.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.81], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 28.05], ["speech", 16.41], ["hum", 14.15]], null, null, null, [["music", 32.58], ["speech", 29.92], ["hum", 7.6]], null, null, null, null, [["speech", 48.76], ["singing bowl", 14.51], ["gong", 7.26]], [["speech", 33.68], ["sidetone", 33.62], ["music", 3.02]], null, null, null, null, null, null, null, null, null], "duration": [0.92, -0.12, 2.4, 0.75, 1.55, 1.78, 2.41, 0.82, 1.05, 0.43, 5.26, 58.19, 1.04, 0.51, 0.31, 2.6, 2.64, -0.17, 1.68, 1.69, 1.94, 1.94, 0.72, 1.74, 1.34, 2.38]} \ No newline at end of file diff --git a/annotations_filtered/e9cysHm38Kg_filtered.json b/annotations_filtered/e9cysHm38Kg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..231d53922703e74d64752a4c6efafa9a88d7ca49 --- /dev/null +++ b/annotations_filtered/e9cysHm38Kg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.48], [9.0, 10.61], [11.0, 13.42], [16.0, 19.21], [20.0, 22.23], [24.0, 26.15], [32.0, 32.36], [34.0, 33.83], [35.0, 35.51], [38.0, 38.3], [41.0, 41.27], [44.0, 46.04], [47.0, 47.21], [50.0, 50.45], [55.0, 56.03], [58.0, 58.11], [59.0, 61.2], [62.0, 63.44], [64.0, 66.66], [68.0, 69.09], [73.0, 73.6], [88.0, 88.55], [90.0, 92.06], [96.0, 96.77]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 37.84, 34.07, 51.23, 77.87, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 0.0, 0.0, 0.0, 87.0, 0.0, 99.76, 0.0, 0.0, 0.0, 72.9, 0.0], "audiomae_on_audioset": [null, null, [["speech", 43.47], ["music", 7.96], ["vehicle", 4.39]], [["speech", 32.37], ["music", 14.0], ["sidetone", 6.96]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 1.61, 2.42, 3.21, 2.23, 2.15, 0.36, -0.17, 0.51, 0.3, 0.27, 2.04, 0.21, 0.45, 1.03, 0.11, 2.2, 1.44, 2.66, 1.09, 0.6, 0.55, 2.06, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/e9t5ikxjAQ4_filtered.json b/annotations_filtered/e9t5ikxjAQ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..875316ad04a34352108ec7993e2e6f2972e56a42 --- /dev/null +++ b/annotations_filtered/e9t5ikxjAQ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 37.67], [40.0, 55.34], [56.0, 56.35], [58.0, 75.41], [79.0, 79.14]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 78.38, 0.0, 33.3, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 48.92], ["rumble", 10.38], ["livestock, farm animals, working animals", 5.72]], null], "duration": [1.67, 15.34, 0.35, 17.41, 0.14]} \ No newline at end of file diff --git a/annotations_filtered/eA-V5wUcWos_filtered.json b/annotations_filtered/eA-V5wUcWos_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08f07cc030232a21f05f3e84c29572d68f2d547b --- /dev/null +++ b/annotations_filtered/eA-V5wUcWos_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 16.28], [18.0, 54.82], [59.0, 95.2], [95.0, 96.11], [104.0, 105.41], [106.0, 106.51], [108.0, 130.62], [131.0, 135.24]], "keep_status": [false, false, false, false, false, false, true, true], "silence_prob": [28.29, 0.0, 0.0, 0.0, 0.0, 0.0, 28.59, 29.02], "audiomae_on_audioset": [[["speech", 54.0], ["artillery fire", 9.21], ["explosion", 8.35]], null, null, null, null, null, [["eruption", 17.85], ["white noise", 7.54], ["livestock, farm animals, working animals", 6.92]], [["cattle, bovinae", 33.77], ["speech", 14.51], ["moo", 11.81]]], "duration": [8.28, 36.82, 36.2, 1.11, 1.41, 0.51, 22.62, 4.24]} \ No newline at end of file diff --git a/annotations_filtered/eAC2kNiKuEg_filtered.json b/annotations_filtered/eAC2kNiKuEg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6169d05caa53ca068376259080b208f896206b21 --- /dev/null +++ b/annotations_filtered/eAC2kNiKuEg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 55.19], [57.0, 67.41], [68.0, 69.13], [71.0, 71.47], [74.0, 80.37], [81.0, 82.12], [83.0, 87.88], [92.0, 94.53], [98.0, 112.48]], "keep_status": [false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 32.82, 0.0, 0.0, 52.74, 0.0, 32.48, 37.24, 33.67], "audiomae_on_audioset": [null, [["music", 48.34], ["speech", 28.58], ["electronic music", 4.45]], null, null, null, null, [["music", 69.74], ["throbbing", 5.18], ["speech", 4.13]], [["music", 36.06], ["throbbing", 15.39], ["speech", 13.13]], [["music", 63.48], ["speech", 15.1], ["electronic music", 1.8]]], "duration": [38.19, 10.41, 1.13, 0.47, 6.37, 1.12, 4.88, 2.53, 14.48]} \ No newline at end of file diff --git a/annotations_filtered/eAp8Vm19uQU_filtered.json b/annotations_filtered/eAp8Vm19uQU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a19b8330a184452b00433c61412dea0f6dc1ebf --- /dev/null +++ b/annotations_filtered/eAp8Vm19uQU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[80.0, 80.38], [83.0, 82.81], [84.0, 85.75], [86.0, 109.61], [113.0, 120.18], [120.0, 133.25]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.93, 29.9, 29.67], "audiomae_on_audioset": [null, null, null, [["music", 36.81], ["throbbing", 18.51], ["hum", 12.39]], [["hum", 43.1], ["throbbing", 37.64], ["music", 9.01]], [["music", 74.61], ["cacophony", 7.85], ["hum", 2.75]]], "duration": [0.38, -0.19, 1.75, 23.61, 7.18, 13.25]} \ No newline at end of file diff --git a/annotations_filtered/eAvVe92mi5k_filtered.json b/annotations_filtered/eAvVe92mi5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d15c6ed1acd3d42531790610f5093721d1195e58 --- /dev/null +++ b/annotations_filtered/eAvVe92mi5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.51], [8.0, 9.69], [48.0, 48.95], [56.0, 56.78], [60.0, 61.87], [76.0, 77.4], [81.0, 81.53], [96.0, 96.69], [104.0, 104.38], [105.0, 106.64], [113.0, 114.35], [118.0, 118.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.51, 1.69, 0.95, 0.78, 1.87, 1.4, 0.53, 0.69, 0.38, 1.64, 1.35, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/eB-ldQkL--0_filtered.json b/annotations_filtered/eB-ldQkL--0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba67f7cc920ae313d9c8552b611bbcc7b11e339f --- /dev/null +++ b/annotations_filtered/eB-ldQkL--0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.54], [7.0, 15.18], [19.0, 27.63], [31.0, 31.45], [35.0, 36.73], [38.0, 46.72], [51.0, 52.47], [53.0, 54.04], [57.0, 62.09], [64.0, 70.06], [72.0, 75.05], [76.0, 79.37], [81.0, 82.16], [83.0, 83.71], [86.0, 116.67], [118.0, 118.34], [126.0, 135.78], [138.0, 139.45], [140.0, 150.04], [153.0, 152.95], [156.0, 156.66], [157.0, 158.65], [166.0, 169.16], [170.0, 170.65], [183.0, 184.03], [187.0, 188.33], [189.0, 193.35], [196.0, 201.21], [203.0, 203.1], [205.0, 206.71], [207.0, 208.84], [218.0, 234.55], [235.0, 236.7], [240.0, 240.21]], "keep_status": [false, true, false, false, false, false, false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 30.97, 31.23, 0.0, 0.0, 30.28, 0.0, 0.0, 30.22, 30.45, 31.83, 29.39, 0.0, 0.0, 0.0, 0.0, 31.07, 0.0, 29.74, 0.0, 0.0, 0.0, 30.19, 0.0, 0.0, 0.0, 28.68, 28.36, 0.0, 0.0, 0.0, 28.31, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 27.81], ["music", 23.73], ["sidetone", 11.04]], [["speech", 29.26], ["music", 24.22], ["throbbing", 17.9]], null, null, [["throbbing", 48.4], ["music", 24.91], ["hum", 17.83]], null, null, [["speech", 39.22], ["music", 12.57], ["throbbing", 7.95]], [["throbbing", 46.64], ["hum", 21.88], ["music", 14.31]], [["throbbing", 26.87], ["hum", 21.73], ["music", 20.72]], [["music", 32.64], ["speech", 22.99], ["didgeridoo", 13.37]], null, null, null, null, [["music", 70.28], ["throbbing", 11.22], ["hum", 2.13]], null, [["music", 45.76], ["speech", 31.33], ["didgeridoo", 12.5]], null, null, null, [["speech", 45.04], ["music", 29.92], ["throbbing", 7.63]], null, null, null, [["music", 60.89], ["throbbing", 11.13], ["hum", 7.15]], [["music", 44.9], ["speech", 35.9], ["electronic music", 2.51]], null, null, null, [["buzz", 20.94], ["electric shaver, electric razor", 10.85], ["music", 8.22]], null, null], "duration": [0.54, 8.18, 8.63, 0.45, 1.73, 8.72, 1.47, 1.04, 5.09, 6.06, 3.05, 3.37, 1.16, 0.71, 30.67, 0.34, 9.78, 1.45, 10.04, -0.05, 0.66, 1.65, 3.16, 0.65, 1.03, 1.33, 4.35, 5.21, 0.1, 1.71, 1.84, 16.55, 1.7, 0.21]} \ No newline at end of file diff --git a/annotations_filtered/eB46dRO0YZ8_filtered.json b/annotations_filtered/eB46dRO0YZ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a09f49f25d0a8b5ab543f72ca78237df1978d9c5 --- /dev/null +++ b/annotations_filtered/eB46dRO0YZ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 29.37], [30.0, 30.82], [32.0, 35.63], [39.0, 40.32], [41.0, 42.52], [44.0, 44.66], [45.0, 56.89], [58.0, 61.18], [62.0, 65.31], [68.0, 78.71], [80.0, 80.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 100.0, 97.0, 99.95, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [4.37, 0.82, 3.63, 1.32, 1.52, 0.66, 11.89, 3.18, 3.31, 10.71, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/eBE2Wgz32nY_filtered.json b/annotations_filtered/eBE2Wgz32nY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e68a1293434b95e52f977e0b6a95facdd0544ca --- /dev/null +++ b/annotations_filtered/eBE2Wgz32nY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.77], [12.0, 48.42], [50.0, 68.12], [73.0, 73.82], [80.0, 79.71], [81.0, 83.29], [86.0, 87.25], [91.0, 93.55], [96.0, 96.63], [100.0, 104.95], [111.0, 119.8], [121.0, 133.3]], "keep_status": [false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [32.15, 0.0, 31.96, 0.0, 0.0, 47.9, 0.0, 47.46, 0.0, 33.31, 33.9, 32.44], "audiomae_on_audioset": [[["hum", 37.9], ["throbbing", 22.37], ["mains hum", 22.33]], null, [["music", 56.63], ["speech", 7.85], ["siren", 3.09]], null, null, [["music", 53.62], ["didgeridoo", 7.06], ["speech", 3.34]], null, [["cattle, bovinae", 43.96], ["moo", 18.79], ["whale vocalization", 18.55]], null, [["speech", 59.18], ["music", 12.43], ["whale vocalization", 12.11]], [["music", 69.54], ["didgeridoo", 7.82], ["musical instrument", 2.89]], [["music", 64.74], ["didgeridoo", 11.28], ["hum", 3.8]]], "duration": [7.77, 36.42, 18.12, 0.82, -0.29, 2.29, 1.25, 2.55, 0.63, 4.95, 8.8, 12.3]} \ No newline at end of file diff --git a/annotations_filtered/eBU1T2DdLsk_filtered.json b/annotations_filtered/eBU1T2DdLsk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..afbecc1a612e7238bf117616d489ddd20efe9900 --- /dev/null +++ b/annotations_filtered/eBU1T2DdLsk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 44.93], [45.0, 45.35], [45.0, 52.34], [52.0, 61.91], [62.0, 62.67], [63.0, 63.22], [64.0, 69.16], [70.0, 70.48], [73.0, 72.96], [74.0, 83.1], [85.0, 85.35], [89.0, 90.78]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [84.07, 0.0, 38.22, 61.67, 0.0, 0.0, 80.82, 0.0, 0.0, 97.43, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 42.84], ["theremin", 17.78], ["didgeridoo", 9.08]], null, null, null, null, null, null, null, null, null], "duration": [12.93, 0.35, 7.34, 9.91, 0.67, 0.22, 5.16, 0.48, -0.04, 9.1, 0.35, 1.78]} \ No newline at end of file diff --git a/annotations_filtered/eBVqcDJbl5A_filtered.json b/annotations_filtered/eBVqcDJbl5A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4894fba56aa44d7e80973fd24f4c4b51d30397e1 --- /dev/null +++ b/annotations_filtered/eBVqcDJbl5A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.97], [21.0, 31.97], [35.0, 46.01], [50.0, 61.35], [62.0, 63.44], [65.0, 77.89], [78.0, 91.17], [92.0, 100.53], [103.0, 114.05], [119.0, 119.52], [122.0, 122.71], [125.0, 129.22], [135.0, 138.74], [140.0, 141.17], [141.0, 146.2], [147.0, 153.55], [158.0, 161.64]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, false, false, false, true, true, true], "silence_prob": [0.0, 32.23, 30.83, 31.32, 0.0, 62.27, 39.11, 31.67, 68.41, 0.0, 0.0, 59.07, 34.0, 0.0, 32.56, 36.26, 31.68], "audiomae_on_audioset": [null, [["mains hum", 37.19], ["hum", 34.01], ["music", 14.56]], [["music", 45.39], ["electronic music", 7.23], ["cacophony", 5.57]], [["buzz", 39.63], ["electric shaver, electric razor", 37.1], ["speech", 8.44]], null, null, [["hum", 71.31], ["mains hum", 12.63], ["throbbing", 8.77]], [["music", 32.65], ["hum", 16.51], ["breaking", 7.69]], null, null, null, null, [["music", 39.99], ["theremin", 34.58], ["musical instrument", 5.54]], null, [["music", 30.6], ["didgeridoo", 19.83], ["theremin", 17.95]], [["music", 39.37], ["theremin", 20.95], ["musical instrument", 7.53]], [["music", 30.66], ["theremin", 18.33], ["noise", 10.59]]], "duration": [0.97, 10.97, 11.01, 11.35, 1.44, 12.89, 13.17, 8.53, 11.05, 0.52, 0.71, 4.22, 3.74, 1.17, 5.2, 6.55, 3.64]} \ No newline at end of file diff --git a/annotations_filtered/eBxVWEnuSC0_filtered.json b/annotations_filtered/eBxVWEnuSC0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21bb5d9540c1240c741ad3e91a536e62ad87b1ae --- /dev/null +++ b/annotations_filtered/eBxVWEnuSC0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.08], [6.0, 6.34], [8.0, 10.29], [11.0, 13.19], [14.0, 24.22], [28.0, 28.63], [30.0, 33.12], [35.0, 37.47], [38.0, 40.71], [42.0, 42.03], [50.0, 50.73], [52.0, 53.91], [59.0, 59.12], [62.0, 63.93], [71.0, 71.69], [73.0, 77.08], [80.0, 81.4], [85.0, 93.7], [96.0, 96.75], [99.0, 100.38], [105.0, 115.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 72.75, 59.24, 69.2, 0.0, 84.07, 88.1, 53.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 30.77, 0.0, 0.0, 30.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 30.4], ["explosion", 18.38], ["burst, pop", 10.78]], null, null, [["music", 47.29], ["hum", 6.12], ["electronic music", 4.31]]], "duration": [0.08, 0.34, 2.29, 2.19, 10.22, 0.63, 3.12, 2.47, 2.71, 0.03, 0.73, 1.91, 0.12, 1.93, 0.69, 4.08, 1.4, 8.7, 0.75, 1.38, 10.59]} \ No newline at end of file diff --git a/annotations_filtered/eC2O1zsfn2c_filtered.json b/annotations_filtered/eC2O1zsfn2c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5013c36800b0fcc5639fbee55a6d8c8857da639 --- /dev/null +++ b/annotations_filtered/eC2O1zsfn2c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 8.19], [10.0, 11.03], [14.0, 19.25], [23.0, 23.11], [25.0, 29.98], [34.0, 33.78], [34.0, 34.77], [37.0, 49.87], [53.0, 53.0], [56.0, 56.17], [58.0, 64.03], [66.0, 67.39], [68.0, 69.72], [71.0, 71.1], [73.0, 75.2], [76.0, 76.2], [79.0, 80.06], [81.0, 83.32], [88.0, 89.06], [93.0, 93.61], [100.0, 101.51], [102.0, 102.63], [106.0, 106.74], [107.0, 107.77], [110.0, 110.0], [110.0, 110.76], [117.0, 117.59], [119.0, 124.71], [126.0, 128.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [76.2, 0.0, 95.51, 0.0, 65.79, 0.0, 0.0, 36.9, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.76, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 67.45], ["synthesizer", 10.43], ["musical instrument", 5.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.19, 1.03, 5.25, 0.11, 4.98, -0.22, 0.77, 12.87, 0.0, 0.17, 6.03, 1.39, 1.72, 0.1, 2.2, 0.2, 1.06, 2.32, 1.06, 0.61, 1.51, 0.63, 0.74, 0.77, 0.0, 0.76, 0.59, 5.71, 2.22]} \ No newline at end of file diff --git a/annotations_filtered/eCKRI2wEw7I_filtered.json b/annotations_filtered/eCKRI2wEw7I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..227e3910fcd0fa0860bcc215030f95a0ba079599 --- /dev/null +++ b/annotations_filtered/eCKRI2wEw7I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.38], [10.0, 11.64], [13.0, 14.61], [23.0, 24.39], [25.0, 34.21], [36.0, 37.56], [38.0, 39.28], [44.0, 52.1], [53.0, 53.55], [54.0, 54.23], [55.0, 56.05], [57.0, 58.48], [59.0, 61.7], [62.0, 64.94], [66.0, 67.78], [72.0, 73.74], [75.0, 75.0], [76.0, 77.46], [79.0, 80.0], [81.0, 81.89], [89.0, 90.73], [94.0, 96.74], [98.0, 98.29], [103.0, 108.65], [121.0, 121.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 62.99, 0.0, 0.0, 40.21, 0.0, 0.0, 0.0, 0.0, 42.51, 43.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.07, 0.0, 38.4, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 74.95], ["electronic music", 3.68], ["throbbing", 2.89]], null, null, null, null, [["music", 64.02], ["hum", 6.64], ["mains hum", 3.94]], [["music", 31.15], ["speech", 25.48], ["singing bowl", 16.89]], null, null, null, null, null, null, null, null, null, [["hum", 34.81], ["speech", 26.16], ["throbbing", 12.96]], null], "duration": [0.38, 1.64, 1.61, 1.39, 9.21, 1.56, 1.28, 8.1, 0.55, 0.23, 1.05, 1.48, 2.7, 2.94, 1.78, 1.74, 0.0, 1.46, 1.0, 0.89, 1.73, 2.74, 0.29, 5.65, 0.81]} \ No newline at end of file diff --git a/annotations_filtered/eCQIRkboAM4_filtered.json b/annotations_filtered/eCQIRkboAM4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a2b4db003f55df49fdf4808a6eff4584e141b96 --- /dev/null +++ b/annotations_filtered/eCQIRkboAM4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.05], [10.0, 12.87], [14.0, 15.15], [21.0, 22.13], [26.0, 30.7], [32.0, 46.08], [51.0, 53.7], [55.0, 55.63], [62.0, 64.12], [67.0, 69.35], [80.0, 81.01], [89.0, 95.3], [98.0, 99.87], [105.0, 105.83], [115.0, 147.73], [152.0, 155.12]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [38.76, 37.25, 0.0, 0.0, 38.12, 37.32, 37.44, 0.0, 39.77, 32.16, 0.0, 41.89, 0.0, 0.0, 0.0, 30.39], "audiomae_on_audioset": [[["music", 53.15], ["speech", 21.35], ["effects unit", 6.33]], [["music", 53.0], ["guitar", 12.46], ["musical instrument", 5.04]], null, null, [["music", 67.41], ["synthesizer", 9.86], ["musical instrument", 5.2]], [["music", 50.6], ["synthesizer", 23.82], ["musical instrument", 7.51]], [["music", 13.97], ["singing bowl", 13.0], ["tuning fork", 10.59]], null, [["music", 65.21], ["guitar", 4.47], ["effects unit", 4.4]], [["music", 52.08], ["speech", 15.9], ["musical instrument", 9.29]], null, [["music", 62.37], ["speech", 11.09], ["guitar", 6.82]], null, null, null, [["music", 54.3], ["synthesizer", 15.93], ["ambient music", 6.34]]], "duration": [4.05, 2.87, 1.15, 1.13, 4.7, 14.08, 2.7, 0.63, 2.12, 2.35, 1.01, 6.3, 1.87, 0.83, 32.73, 3.12]} \ No newline at end of file diff --git a/annotations_filtered/eCS7qPuOXQI_filtered.json b/annotations_filtered/eCS7qPuOXQI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ce233792bc1261748f1a97871388905f9f7f058 --- /dev/null +++ b/annotations_filtered/eCS7qPuOXQI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.48], [5.0, 17.2], [30.0, 30.97], [31.0, 31.95], [36.0, 39.63], [42.0, 44.36], [61.0, 62.07], [63.0, 63.46], [66.0, 66.41], [71.0, 71.76], [76.0, 76.81], [78.0, 80.55], [89.0, 91.79]], "keep_status": [false, true, false, false, true, true, false, false, false, false, false, true, true], "silence_prob": [0.0, 35.33, 0.0, 0.0, 33.75, 33.74, 0.0, 0.0, 0.0, 0.0, 0.0, 38.37, 43.28], "audiomae_on_audioset": [null, [["music", 57.62], ["chant", 6.54], ["musical instrument", 3.82]], null, null, [["whale vocalization", 18.73], ["roaring cats (lions, tigers)", 8.45], ["animal", 8.16]], [["chant", 42.87], ["music", 11.97], ["choir", 3.42]], null, null, null, null, null, [["speech", 18.79], ["music", 9.42], ["hum", 8.89]], [["speech", 42.08], ["aircraft", 8.18], ["vehicle", 5.9]]], "duration": [0.48, 12.2, 0.97, 0.95, 3.63, 2.36, 1.07, 0.46, 0.41, 0.76, 0.81, 2.55, 2.79]} \ No newline at end of file diff --git a/annotations_filtered/eCXv9LnSKeA_filtered.json b/annotations_filtered/eCXv9LnSKeA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e936c29e2c4024554f1516b7ee9399311022394 --- /dev/null +++ b/annotations_filtered/eCXv9LnSKeA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.92], [10.0, 10.27], [13.0, 24.41], [35.0, 35.34], [38.0, 63.19], [65.0, 75.14], [76.0, 90.21], [91.0, 112.7], [113.0, 114.18], [115.0, 116.23], [119.0, 127.41], [130.0, 130.57], [132.0, 132.22], [137.0, 148.47], [151.0, 151.56], [155.0, 162.38], [166.0, 165.99], [169.0, 170.82]], "keep_status": [false, false, true, false, true, true, true, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [42.93, 0.0, 31.34, 0.0, 28.81, 29.95, 29.15, 29.04, 0.0, 0.0, 28.68, 0.0, 0.0, 29.59, 0.0, 28.88, 0.0, 0.0], "audiomae_on_audioset": [[["music", 53.06], ["throbbing", 22.63], ["hum", 9.01]], null, [["music", 39.02], ["speech", 12.89], ["explosion", 11.08]], null, [["music", 23.12], ["vehicle", 12.04], ["speech", 6.82]], [["speech", 33.25], ["cowbell", 15.15], ["music", 13.66]], [["speech", 36.46], ["livestock, farm animals, working animals", 9.13], ["music", 9.08]], [["music", 46.45], ["hum", 11.31], ["speech", 8.17]], null, null, [["music", 63.81], ["cacophony", 5.79], ["hum", 4.22]], null, null, [["speech", 42.39], ["music", 27.55], ["explosion", 6.22]], null, [["speech", 47.69], ["music", 11.27], ["reverberation", 5.23]], null, null], "duration": [3.92, 0.27, 11.41, 0.34, 25.19, 10.14, 14.21, 21.7, 1.18, 1.23, 8.41, 0.57, 0.22, 11.47, 0.56, 7.38, -0.01, 1.82]} \ No newline at end of file diff --git a/annotations_filtered/eC_Ua1svsSE_filtered.json b/annotations_filtered/eC_Ua1svsSE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..280d76f34c27169b133c4834228710c291821cb9 --- /dev/null +++ b/annotations_filtered/eC_Ua1svsSE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.37], [7.0, 7.18], [15.0, 15.25], [18.0, 22.3], [24.0, 24.36], [25.0, 26.86], [28.0, 29.51], [30.0, 32.7], [36.0, 36.91], [42.0, 42.94], [46.0, 48.49], [50.0, 52.32], [53.0, 54.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [31.96, 0.0, 0.0, 71.57, 0.0, 0.0, 0.0, 72.01, 0.0, 0.0, 43.4, 45.92, 0.0], "audiomae_on_audioset": [[["hum", 34.97], ["mains hum", 26.35], ["rumble", 8.84]], null, null, null, null, null, null, null, null, null, [["music", 47.35], ["guitar", 10.56], ["musical instrument", 8.22]], [["music", 69.23], ["musical instrument", 6.64], ["guitar", 5.47]], null], "duration": [2.37, 0.18, 0.25, 4.3, 0.36, 1.86, 1.51, 2.7, 0.91, 0.94, 2.49, 2.32, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/eCdRFMp8Xwo_filtered.json b/annotations_filtered/eCdRFMp8Xwo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8db10cc4c567bd2a00333536342374b890872fb2 --- /dev/null +++ b/annotations_filtered/eCdRFMp8Xwo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 40.41]], "keep_status": [false], "silence_prob": [100.0], "audiomae_on_audioset": [null], "duration": [26.41]} \ No newline at end of file diff --git a/annotations_filtered/eCfvE03ufF8_filtered.json b/annotations_filtered/eCfvE03ufF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d96182673acb26412faf5d36751f60f14864a0e8 --- /dev/null +++ b/annotations_filtered/eCfvE03ufF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.15], [11.0, 11.45], [12.0, 18.03], [21.0, 22.89], [23.0, 26.62], [27.0, 27.7], [30.0, 39.28], [41.0, 52.0], [52.0, 52.07], [60.0, 65.62], [67.0, 70.12], [77.0, 77.58], [78.0, 78.71], [82.0, 82.56], [91.0, 91.52], [99.0, 99.42], [101.0, 101.31], [105.0, 105.0], [106.0, 106.37], [106.0, 106.42], [108.0, 108.85]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 66.39, 0.0, 84.07, 0.0, 35.76, 35.47, 0.0, 32.83, 74.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 80.47], ["theremin", 3.45], ["video game music", 2.71]], [["music", 79.32], ["scary music", 4.85], ["video game music", 3.48]], null, [["music", 42.39], ["musical instrument", 6.46], ["organ", 4.59]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.15, 0.45, 6.03, 1.89, 3.62, 0.7, 9.28, 11.0, 0.07, 5.62, 3.12, 0.58, 0.71, 0.56, 0.52, 0.42, 0.31, 0.0, 0.37, 0.42, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/eCvY-ualWwY_filtered.json b/annotations_filtered/eCvY-ualWwY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f85a3b82dbd0f70d33c13d3189fbc26cb4ab038 --- /dev/null +++ b/annotations_filtered/eCvY-ualWwY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 47.9], [50.0, 78.04], [82.0, 88.59], [98.0, 181.3]], "keep_status": [true, false, true, false], "silence_prob": [28.85, 28.38, 28.41, 0.0], "audiomae_on_audioset": [[["music", 30.89], ["buzz", 12.74], ["hum", 6.82]], [["music", 29.11], ["mains hum", 26.39], ["hum", 21.4]], [["music", 45.49], ["hum", 7.48], ["whale vocalization", 6.96]], null], "duration": [12.9, 28.04, 6.59, 83.3]} \ No newline at end of file diff --git a/annotations_filtered/eD4l8wpbrRI_filtered.json b/annotations_filtered/eD4l8wpbrRI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d694e186b5eebc1d5f68a24a3bba45f4938a47d --- /dev/null +++ b/annotations_filtered/eD4l8wpbrRI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 26.6], [36.0, 36.61], [41.0, 40.71], [42.0, 42.48], [60.0, 60.29], [64.0, 64.64], [68.0, 68.23], [69.0, 69.5], [87.0, 86.95], [90.0, 91.03], [99.0, 99.84], [105.0, 104.62], [114.0, 115.16], [119.0, 119.57], [121.0, 122.35], [123.0, 128.11], [129.0, 130.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.3, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.6, 0.61, -0.29, 0.48, 0.29, 0.64, 0.23, 0.5, -0.05, 1.03, 0.84, -0.38, 1.16, 0.57, 1.35, 5.11, 1.65]} \ No newline at end of file diff --git a/annotations_filtered/eDPbu2vNrWk_filtered.json b/annotations_filtered/eDPbu2vNrWk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0061c1e1d3f93ebdc1de735ff0bd97a18daa61b7 --- /dev/null +++ b/annotations_filtered/eDPbu2vNrWk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[96.0, 108.09], [109.0, 147.19], [148.0, 152.86], [154.0, 158.41]], "keep_status": [true, false, true, true], "silence_prob": [43.3, 0.0, 47.74, 38.64], "audiomae_on_audioset": [[["hum", 25.53], ["mains hum", 15.2], ["music", 10.05]], null, [["music", 38.16], ["whale vocalization", 21.74], ["musical instrument", 3.92]], [["music", 16.52], ["speech", 16.14], ["hum", 13.92]]], "duration": [12.09, 38.19, 4.86, 4.41]} \ No newline at end of file diff --git a/annotations_filtered/eDblDj6BISo_filtered.json b/annotations_filtered/eDblDj6BISo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72fd9757bb61db864b66dfa1e780834520c48624 --- /dev/null +++ b/annotations_filtered/eDblDj6BISo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.52], [4.0, 4.43], [7.0, 7.91], [9.0, 10.45], [11.0, 27.62], [29.0, 30.96], [32.0, 53.38], [54.0, 55.86], [57.0, 58.89], [60.0, 62.9], [64.0, 66.26], [70.0, 75.71], [78.0, 78.11], [78.0, 78.49], [81.0, 82.85], [84.0, 85.67], [86.0, 87.51], [89.0, 90.91], [93.0, 93.45], [95.0, 95.91], [97.0, 99.15], [100.0, 104.11], [106.0, 106.0], [109.0, 112.01], [114.0, 114.91], [115.0, 121.49], [123.0, 125.24], [126.0, 129.95], [132.0, 143.82], [148.0, 158.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 96.17, 0.0, 92.8, 0.0, 0.0, 95.51, 96.42, 98.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.19, 92.8, 0.0, 91.13, 0.0, 79.59, 90.95, 79.07, 61.18, 83.34], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.48, 0.43, 0.91, 1.45, 16.62, 1.96, 21.38, 1.86, 1.89, 2.9, 2.26, 5.71, 0.11, 0.49, 1.85, 1.67, 1.51, 1.91, 0.45, 0.91, 2.15, 4.11, 0.0, 3.01, 0.91, 6.49, 2.24, 3.95, 11.82, 10.87]} \ No newline at end of file diff --git a/annotations_filtered/eEUulOnl-n8_filtered.json b/annotations_filtered/eEUulOnl-n8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30fb8084c603ff99cad7132e3910b7c12ea329c1 --- /dev/null +++ b/annotations_filtered/eEUulOnl-n8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 64.32], [65.0, 97.29], [98.0, 119.91]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 41.34], "audiomae_on_audioset": [null, null, [["music", 69.85], ["hum", 6.55], ["throbbing", 6.45]]], "duration": [44.32, 32.29, 21.91]} \ No newline at end of file diff --git a/annotations_filtered/eFF1grhBvsE_filtered.json b/annotations_filtered/eFF1grhBvsE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da5a29835f56db664b3d3b9d33b67b3adce9a022 --- /dev/null +++ b/annotations_filtered/eFF1grhBvsE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.35], [8.0, 10.93], [11.0, 12.72], [13.0, 16.68], [18.0, 21.96], [24.0, 25.81], [30.0, 31.67], [38.0, 39.51], [53.0, 53.52], [56.0, 58.41], [60.0, 63.12], [73.0, 73.35], [76.0, 76.74], [85.0, 85.95], [87.0, 88.64], [90.0, 90.09], [96.0, 96.11], [107.0, 107.94], [117.0, 117.15], [119.0, 119.48], [131.0, 131.25], [134.0, 135.35], [136.0, 136.02], [137.0, 138.5], [142.0, 143.04], [150.0, 151.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 90.08, 0.0, 40.22, 100.0, 0.0, 0.0, 0.0, 0.0, 87.37, 42.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 66.64], ["domestic animals, pets", 3.77], ["dog", 3.3]], null, null, null, null, null, null, [["speech", 38.72], ["fly, housefly", 14.21], ["mosquito", 13.96]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.35, 2.93, 1.72, 3.68, 3.96, 1.81, 1.67, 1.51, 0.52, 2.41, 3.12, 0.35, 0.74, 0.95, 1.64, 0.09, 0.11, 0.94, 0.15, 0.48, 0.25, 1.35, 0.02, 1.5, 1.04, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/eFKh6cYmQ4M_filtered.json b/annotations_filtered/eFKh6cYmQ4M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d740c56dd172567476e98af333b7f4e62d48d252 --- /dev/null +++ b/annotations_filtered/eFKh6cYmQ4M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[66.0, 119.3]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [53.3]} \ No newline at end of file diff --git a/annotations_filtered/eFd0VyfLf1M_filtered.json b/annotations_filtered/eFd0VyfLf1M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e3e611c194dcdc5f193334b603519d915341050 --- /dev/null +++ b/annotations_filtered/eFd0VyfLf1M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.83], [10.0, 9.86], [19.0, 20.12], [27.0, 26.94], [40.0, 45.05], [47.0, 49.94], [50.0, 62.28], [75.0, 75.56], [77.0, 79.3]], "keep_status": [false, false, false, false, true, false, false, false, true], "silence_prob": [31.71, 0.0, 0.0, 0.0, 48.61, 60.42, 31.56, 0.0, 41.52], "audiomae_on_audioset": [[["speech", 50.17], ["frog", 15.7], ["screaming", 11.58]], null, null, null, [["music", 52.48], ["trombone", 5.3], ["brass instrument", 5.26]], null, [["speech", 50.23], ["music", 20.16], ["synthesizer", 7.12]], null, [["fly, housefly", 28.7], ["music", 15.72], ["insect", 13.55]]], "duration": [6.83, -0.14, 1.12, -0.06, 5.05, 2.94, 12.28, 0.56, 2.3]} \ No newline at end of file diff --git a/annotations_filtered/eFnw_27t9-o_filtered.json b/annotations_filtered/eFnw_27t9-o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..68d8387c540973b52f62d32dba211cbf8b3630e8 --- /dev/null +++ b/annotations_filtered/eFnw_27t9-o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.83], [8.0, 12.48], [15.0, 18.64], [25.0, 35.94], [43.0, 47.38], [52.0, 61.11], [62.0, 65.75], [67.0, 68.13], [70.0, 73.75], [79.0, 79.08], [83.0, 88.62]], "keep_status": [false, false, false, false, false, true, false, false, true, false, true], "silence_prob": [0.0, 30.81, 52.1, 31.27, 32.4, 32.68, 31.36, 0.0, 33.45, 0.0, 37.85], "audiomae_on_audioset": [null, [["hum", 35.95], ["throbbing", 22.81], ["mains hum", 22.16]], null, [["hum", 31.75], ["music", 22.07], ["mains hum", 18.82]], [["mains hum", 25.26], ["hum", 25.07], ["music", 19.71]], [["mains hum", 22.0], ["noise", 21.98], ["hum", 14.06]], [["music", 37.26], ["throbbing", 26.13], ["hum", 12.41]], null, [["fly, housefly", 29.9], ["music", 13.85], ["throbbing", 11.97]], null, [["music", 30.91], ["hum", 17.96], ["speech", 14.61]]], "duration": [0.83, 4.48, 3.64, 10.94, 4.38, 9.11, 3.75, 1.13, 3.75, 0.08, 5.62]} \ No newline at end of file diff --git a/annotations_filtered/eFs_YLy3Ld8_filtered.json b/annotations_filtered/eFs_YLy3Ld8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c2985943672cdfd4032e7adad9a53abd592bbb1 --- /dev/null +++ b/annotations_filtered/eFs_YLy3Ld8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 23.19], [24.0, 25.57], [40.0, 40.24], [41.0, 45.0], [48.0, 58.9], [64.0, 64.15], [66.0, 67.26], [68.0, 69.96], [72.0, 72.55], [74.0, 74.06], [78.0, 86.07], [95.0, 113.83], [115.0, 118.81], [121.0, 126.47], [130.0, 130.81]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, true, true, true, false], "silence_prob": [62.58, 0.0, 0.0, 36.22, 36.75, 0.0, 0.0, 0.0, 0.0, 0.0, 64.29, 49.22, 36.47, 39.37, 0.0], "audiomae_on_audioset": [null, null, null, [["chirp tone", 35.22], ["tuning fork", 14.96], ["music", 14.47]], [["music", 74.77], ["synthesizer", 3.42], ["electronic music", 2.47]], null, null, null, null, null, null, [["speech", 48.3], ["train", 11.48], ["music", 7.0]], [["hum", 37.57], ["mains hum", 10.51], ["throbbing", 9.48]], [["vehicle", 24.31], ["buzz", 7.95], ["aircraft", 7.03]], null], "duration": [10.19, 1.57, 0.24, 4.0, 10.9, 0.15, 1.26, 1.96, 0.55, 0.06, 8.07, 18.83, 3.81, 5.47, 0.81]} \ No newline at end of file diff --git a/annotations_filtered/eG2Yo0l78tM_filtered.json b/annotations_filtered/eG2Yo0l78tM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..171f7b70a6d13ec8a62314e46331f7ec56a5dc37 --- /dev/null +++ b/annotations_filtered/eG2Yo0l78tM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.81], [14.0, 14.94], [16.0, 16.75], [24.0, 24.19], [33.0, 34.08], [35.0, 36.17], [37.0, 38.69], [40.0, 40.64], [41.0, 43.34], [47.0, 48.09], [53.0, 55.38], [59.0, 60.61], [65.0, 65.67], [71.0, 76.91], [82.0, 82.11], [82.0, 83.25], [88.0, 89.28], [97.0, 97.48], [113.0, 113.91], [115.0, 116.46], [118.0, 120.21], [124.0, 124.53], [125.0, 128.07], [134.0, 134.79], [139.0, 143.4], [146.0, 148.15], [154.0, 155.76]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.97, 0.0, 57.64, 0.0, 0.0, 31.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.07, 0.0, 29.42, 0.0, 39.83, 39.66, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["chirp tone", 25.76], ["speech", 22.94], ["sidetone", 18.31]], null, null, null, null, [["music", 49.29], ["synthesizer", 9.16], ["drum machine", 7.46]], null, null, null, null, null, null, [["music", 74.92], ["grunt", 2.49], ["caw", 1.84]], null, [["music", 22.7], ["bleat", 13.71], ["livestock, farm animals, working animals", 9.2]], null, [["animal", 22.13], ["speech", 20.15], ["wild animals", 17.33]], [["speech", 57.31], ["dial tone", 9.27], ["sidetone", 4.63]], null], "duration": [0.81, 0.94, 0.75, 0.19, 1.08, 1.17, 1.69, 0.64, 2.34, 1.09, 2.38, 1.61, 0.67, 5.91, 0.11, 1.25, 1.28, 0.48, 0.91, 1.46, 2.21, 0.53, 3.07, 0.79, 4.4, 2.15, 1.76]} \ No newline at end of file diff --git a/annotations_filtered/eG9QMl_w1pk_filtered.json b/annotations_filtered/eG9QMl_w1pk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae67ad8ada21e958c631060ecb8c50d9ff7cec4f --- /dev/null +++ b/annotations_filtered/eG9QMl_w1pk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.48], [23.0, 23.89], [25.0, 26.5], [31.0, 33.44], [35.0, 36.37], [38.0, 41.01], [42.0, 46.28], [50.0, 51.92], [54.0, 55.48], [61.0, 63.61], [64.0, 66.09], [90.0, 89.68], [90.0, 93.45], [93.0, 93.5], [95.0, 95.32], [106.0, 106.08], [109.0, 112.8], [113.0, 113.71], [114.0, 114.34], [115.0, 115.4], [117.0, 118.1], [120.0, 119.85], [129.0, 129.54], [130.0, 130.38], [131.0, 131.45], [132.0, 132.33]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 72.75, 0.0, 35.78, 41.78, 0.0, 0.0, 90.43, 69.2, 0.0, 31.01, 0.0, 0.0, 0.0, 30.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["howl", 22.62], ["canidae, dogs, wolves", 15.08], ["animal", 10.0]], [["speech", 47.15], ["whimper", 7.05], ["grunt", 4.05]], null, null, null, null, null, [["speech", 83.0], ["music", 6.68], ["boing", 3.63]], null, null, null, [["speech", 36.33], ["fly, housefly", 13.42], ["fart", 10.57]], null, null, null, null, null, null, null, null, null], "duration": [0.48, 0.89, 1.5, 2.44, 1.37, 3.01, 4.28, 1.92, 1.48, 2.61, 2.09, -0.32, 3.45, 0.5, 0.32, 0.08, 3.8, 0.71, 0.34, 0.4, 1.1, -0.15, 0.54, 0.38, 0.45, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/eGJqzSFW9Zg_filtered.json b/annotations_filtered/eGJqzSFW9Zg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae884838cb8b27e1e2a383471cce8aa3eae3d745 --- /dev/null +++ b/annotations_filtered/eGJqzSFW9Zg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.26], [6.0, 9.51], [13.0, 14.82], [16.0, 16.87], [18.0, 19.14], [20.0, 25.19], [26.0, 26.89], [28.0, 28.19], [36.0, 42.72], [45.0, 46.04], [46.0, 47.11], [48.0, 48.27], [49.0, 51.09], [53.0, 52.88], [53.0, 54.21], [58.0, 58.97], [65.0, 67.42], [71.0, 71.12], [83.0, 84.77], [89.0, 89.34], [91.0, 92.77], [94.0, 93.83], [94.0, 95.25], [96.0, 97.21], [98.0, 98.73], [105.0, 106.79], [107.0, 108.45], [111.0, 111.48], [112.0, 112.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.98, 0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 98.99, 0.0, 0.0, 0.0, 98.93, 0.0, 0.0, 0.0, 97.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.26, 3.51, 1.82, 0.87, 1.14, 5.19, 0.89, 0.19, 6.72, 1.04, 1.11, 0.27, 2.09, -0.12, 1.21, 0.97, 2.42, 0.12, 1.77, 0.34, 1.77, -0.17, 1.25, 1.21, 0.73, 1.79, 1.45, 0.48, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/eGLC0vhemeA_filtered.json b/annotations_filtered/eGLC0vhemeA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c7e0b269bab06f145453c3aa3a31668fdc1b4e8 --- /dev/null +++ b/annotations_filtered/eGLC0vhemeA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 37.94], [41.0, 75.59], [77.0, 88.45], [91.0, 91.52], [92.0, 94.22], [94.0, 101.09], [103.0, 104.25], [104.0, 105.58], [107.0, 108.21], [108.0, 111.67], [112.0, 141.66], [143.0, 166.28], [167.0, 170.75]], "keep_status": [true, false, false, false, false, true, false, false, false, false, true, false, true], "silence_prob": [31.38, 0.0, 29.41, 0.0, 33.0, 34.77, 0.0, 0.0, 0.0, 53.53, 31.08, 35.22, 36.15], "audiomae_on_audioset": [[["hum", 36.53], ["music", 14.65], ["throbbing", 14.64]], null, [["hum", 41.11], ["mains hum", 20.33], ["music", 16.98]], null, [["music", 64.41], ["gong", 11.93], ["ambient music", 6.85]], [["music", 28.48], ["pulse", 8.79], ["hum", 8.42]], null, null, null, null, [["hum", 30.54], ["music", 14.58], ["breaking", 12.9]], [["music", 58.41], ["crack", 8.6], ["electronic music", 4.14]], [["music", 28.43], ["throbbing", 15.32], ["hum", 10.56]]], "duration": [9.94, 34.59, 11.45, 0.52, 2.22, 7.09, 1.25, 1.58, 1.21, 3.67, 29.66, 23.28, 3.75]} \ No newline at end of file diff --git a/annotations_filtered/eGXnEeW_KdA_filtered.json b/annotations_filtered/eGXnEeW_KdA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7523bd52a3a3436e47d6f4bdb672ecd7bdecc0c2 --- /dev/null +++ b/annotations_filtered/eGXnEeW_KdA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.36], [10.0, 12.33], [21.0, 38.69], [47.0, 73.31], [80.0, 83.66], [85.0, 102.37]], "keep_status": [false, false, true, true, false, false], "silence_prob": [0.0, 29.9, 30.5, 30.34, 29.92, 29.9], "audiomae_on_audioset": [null, [["cattle, bovinae", 40.9], ["livestock, farm animals, working animals", 25.47], ["moo", 25.28]], [["whale vocalization", 42.74], ["animal", 7.48], ["sidetone", 6.01]], [["music", 21.05], ["speech", 5.3], ["throbbing", 4.38]], [["cattle, bovinae", 44.53], ["livestock, farm animals, working animals", 31.29], ["moo", 20.86]], [["livestock, farm animals, working animals", 45.07], ["animal", 21.11], ["cattle, bovinae", 16.54]]], "duration": [1.36, 2.33, 17.69, 26.31, 3.66, 17.37]} \ No newline at end of file diff --git a/annotations_filtered/eGtDmvtBZQY_filtered.json b/annotations_filtered/eGtDmvtBZQY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b9b33d67d8fa84b190452ac964d50474ec27f05 --- /dev/null +++ b/annotations_filtered/eGtDmvtBZQY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 22.03], [26.0, 32.05], [38.0, 50.09], [51.0, 54.35], [56.0, 56.22], [66.0, 67.9], [77.0, 78.19], [79.0, 79.44], [90.0, 90.31], [90.0, 94.12], [96.0, 98.61], [99.0, 102.81], [113.0, 114.71], [127.0, 129.05], [131.0, 132.65], [133.0, 133.46], [142.0, 143.14], [144.0, 145.1]], "keep_status": [false, true, false, true, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [36.38, 38.49, 44.29, 39.58, 0.0, 0.0, 0.0, 0.0, 0.0, 41.74, 42.22, 47.94, 0.0, 90.08, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["whack, thwack", 49.29], ["speech", 15.07], ["boing", 9.39]], [["music", 18.53], ["thunk", 11.17], ["sound effect", 8.84]], [["music", 43.54], ["speech", 23.19], ["thunk", 5.3]], [["groan", 36.3], ["whack, thwack", 9.85], ["sound effect", 7.58]], null, null, null, null, null, [["music", 44.35], ["scratching (performance technique)", 16.27], ["speech", 10.86]], [["beatboxing", 34.35], ["grunt", 16.34], ["music", 7.74]], [["music", 27.32], ["whack, thwack", 18.49], ["thunk", 10.89]], null, null, null, null, null, null], "duration": [3.03, 6.05, 12.09, 3.35, 0.22, 1.9, 1.19, 0.44, 0.31, 4.12, 2.61, 3.81, 1.71, 2.05, 1.65, 0.46, 1.14, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/eGu2camh0WA_filtered.json b/annotations_filtered/eGu2camh0WA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb550f4a157c3d972f3182432dab59191b7771cc --- /dev/null +++ b/annotations_filtered/eGu2camh0WA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.47], [3.0, 43.66], [50.0, 63.21], [64.0, 79.02], [85.0, 87.72], [89.0, 117.02], [120.0, 134.45], [135.0, 134.89], [135.0, 145.25], [147.0, 156.57]], "keep_status": [false, false, false, true, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 33.41, 31.88, 33.94, 30.89, 30.59, 0.0, 31.09, 34.56], "audiomae_on_audioset": [null, null, [["music", 60.36], ["musical instrument", 6.06], ["synthesizer", 5.93]], [["music", 37.36], ["trombone", 18.45], ["foghorn", 11.81]], [["music", 31.05], ["hum", 17.15], ["throbbing", 6.31]], [["music", 40.55], ["musical instrument", 6.31], ["cacophony", 6.2]], [["music", 54.44], ["didgeridoo", 13.69], ["musical instrument", 8.08]], null, [["music", 70.89], ["musical instrument", 4.43], ["theremin", 3.06]], [["music", 47.47], ["theremin", 24.66], ["synthesizer", 5.14]]], "duration": [0.47, 40.66, 13.21, 15.02, 2.72, 28.02, 14.45, -0.11, 10.25, 9.57]} \ No newline at end of file diff --git a/annotations_filtered/eH7EyPs_Va8_filtered.json b/annotations_filtered/eH7EyPs_Va8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..584a8556a340152b756b1033cb3f27a5e6f889e8 --- /dev/null +++ b/annotations_filtered/eH7EyPs_Va8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 19.87], [31.0, 31.21], [36.0, 72.94], [77.0, 85.31], [86.0, 103.08]], "keep_status": [false, false, false, false, false], "silence_prob": [30.81, 0.0, 0.0, 31.05, 30.4], "audiomae_on_audioset": [[["music", 53.29], ["throbbing", 19.22], ["hum", 6.88]], null, null, [["music", 70.26], ["throbbing", 2.76], ["electronic music", 2.75]], [["music", 78.83], ["musical instrument", 3.73], ["guitar", 3.24]]], "duration": [7.87, 0.21, 36.94, 8.31, 17.08]} \ No newline at end of file diff --git a/annotations_filtered/eHh6bwuPShw_filtered.json b/annotations_filtered/eHh6bwuPShw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fcc41bf8309736a0fd05cf9e4729f613e0ac3c88 --- /dev/null +++ b/annotations_filtered/eHh6bwuPShw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 36.27], [41.0, 41.82], [45.0, 45.82], [47.0, 59.17], [60.0, 61.33]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 58.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [1.27, 0.82, 0.82, 12.17, 1.33]} \ No newline at end of file diff --git a/annotations_filtered/eHpBhm4LMfw_filtered.json b/annotations_filtered/eHpBhm4LMfw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d875d915489aedf35076667e15dd45f6fbc0726b --- /dev/null +++ b/annotations_filtered/eHpBhm4LMfw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.73], [3.0, 3.89], [10.0, 10.69], [12.0, 11.82], [21.0, 21.73], [27.0, 28.88], [29.0, 29.79], [50.0, 50.72], [51.0, 52.42]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.73, 0.89, 0.69, -0.18, 0.73, 1.88, 0.79, 0.72, 1.42]} \ No newline at end of file diff --git a/annotations_filtered/eHx-v7Xto7E_filtered.json b/annotations_filtered/eHx-v7Xto7E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd3507b01080be52c1db2222a1f5e1d235028e58 --- /dev/null +++ b/annotations_filtered/eHx-v7Xto7E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.94], [4.0, 17.68], [19.0, 34.35], [35.0, 41.01], [42.0, 42.69], [43.0, 44.02], [48.0, 49.94], [52.0, 55.02], [56.0, 56.61], [59.0, 61.05], [63.0, 63.81], [65.0, 66.46], [68.0, 69.63], [70.0, 70.9], [74.0, 75.27], [76.0, 78.97], [80.0, 80.03], [87.0, 87.81], [89.0, 89.43], [92.0, 95.66], [96.0, 96.2], [96.0, 96.23], [96.0, 96.26], [96.0, 96.3], [96.0, 96.33], [96.0, 96.36], [96.0, 96.4], [96.0, 96.43], [97.0, 96.6], [97.0, 115.21], [119.0, 119.64], [122.0, 122.67]], "keep_status": [false, false, true, true, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.69, 29.37, 29.58, 0.0, 0.0, 0.0, 44.52, 0.0, 71.87, 0.0, 0.0, 0.0, 0.0, 0.0, 36.39, 0.0, 0.0, 0.0, 32.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.05, 0.0, 0.0], "audiomae_on_audioset": [null, [["sidetone", 35.58], ["speech", 27.96], ["explosion", 13.11]], [["music", 17.6], ["speech", 13.86], ["explosion", 9.94]], [["speech", 40.82], ["hum", 20.74], ["mains hum", 7.94]], null, null, null, [["speech", 32.63], ["hum", 15.73], ["throbbing", 12.3]], null, null, null, null, null, null, null, [["sheep", 13.79], ["speech", 12.43], ["music", 8.04]], null, null, null, [["sound effect", 21.71], ["thunk", 11.7], ["boing", 10.56]], null, null, null, null, null, null, null, null, null, [["speech", 78.4], ["whack, thwack", 3.84], ["smash, crash", 3.3]], null, null], "duration": [1.94, 13.68, 15.35, 6.01, 0.69, 1.02, 1.94, 3.02, 0.61, 2.05, 0.81, 1.46, 1.63, 0.9, 1.27, 2.97, 0.03, 0.81, 0.43, 3.66, 0.2, 0.23, 0.26, 0.3, 0.33, 0.36, 0.4, 0.43, -0.4, 18.21, 0.64, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/eI1dAmDZrZE_filtered.json b/annotations_filtered/eI1dAmDZrZE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3332fcfa134e2d143b1cf275bfd94964c75b0ac --- /dev/null +++ b/annotations_filtered/eI1dAmDZrZE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.53], [49.0, 49.98], [53.0, 53.11], [56.0, 58.08], [59.0, 61.08], [80.0, 79.81], [80.0, 91.23], [92.0, 92.6], [93.0, 94.31], [95.0, 96.11], [96.0, 103.6], [105.0, 115.16], [122.0, 122.71]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 87.37, 73.67, 0.0, 42.88, 0.0, 0.0, 0.0, 34.75, 34.23, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 20.06], ["music", 17.86], ["hum", 14.49]], null, null, null, [["grunt", 46.36], ["groan", 7.39], ["livestock, farm animals, working animals", 7.03]], [["grunt", 28.0], ["music", 18.9], ["speech", 14.37]], null], "duration": [0.53, 0.98, 0.11, 2.08, 2.08, -0.19, 11.23, 0.6, 1.31, 1.11, 7.6, 10.16, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/eIAiu9_4JDs_filtered.json b/annotations_filtered/eIAiu9_4JDs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1da4b63254d5d973b905e9c42e03fc5f73bd0620 --- /dev/null +++ b/annotations_filtered/eIAiu9_4JDs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.33], [6.0, 6.18], [23.0, 31.21], [32.0, 48.25], [49.0, 50.79], [51.0, 52.46], [53.0, 54.14], [56.0, 58.23], [60.0, 60.34], [63.0, 84.43], [86.0, 91.49], [93.0, 103.25], [106.0, 121.9], [125.0, 137.19], [141.0, 142.25], [143.0, 145.32], [149.0, 156.0]], "keep_status": [false, false, true, false, false, false, false, false, false, true, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 33.13, 54.23, 0.0, 0.0, 0.0, 81.89, 0.0, 32.14, 44.96, 43.35, 43.9, 36.52, 0.0, 42.55, 39.63], "audiomae_on_audioset": [null, null, [["music", 43.02], ["didgeridoo", 14.82], ["speech", 8.34]], null, null, null, null, null, null, [["music", 33.03], ["buzz", 10.81], ["breaking", 10.35]], [["music", 31.67], ["whale vocalization", 15.56], ["hum", 8.13]], [["music", 52.36], ["fly, housefly", 10.19], ["insect", 9.83]], [["music", 53.73], ["insect", 11.78], ["fly, housefly", 6.12]], [["speech", 21.42], ["hum", 10.4], ["music", 9.93]], null, [["fly, housefly", 31.68], ["speech", 22.29], ["bee, wasp, etc.", 16.04]], [["music", 60.69], ["scary music", 8.41], ["soundtrack music", 3.35]]], "duration": [1.33, 0.18, 8.21, 16.25, 1.79, 1.46, 1.14, 2.23, 0.34, 21.43, 5.49, 10.25, 15.9, 12.19, 1.25, 2.32, 7.0]} \ No newline at end of file diff --git a/annotations_filtered/eIlzY-UcYZU_filtered.json b/annotations_filtered/eIlzY-UcYZU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..566b3a4f33e7eb36801a5e5261eb882eb1edb49c --- /dev/null +++ b/annotations_filtered/eIlzY-UcYZU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.77], [6.0, 9.51], [12.0, 13.09], [15.0, 15.85], [17.0, 21.22], [24.0, 24.11], [26.0, 26.52], [29.0, 29.17], [31.0, 31.26], [33.0, 33.51], [40.0, 40.04], [43.0, 43.46], [45.0, 46.87], [49.0, 49.13], [51.0, 53.42], [54.0, 55.27], [62.0, 62.24], [65.0, 66.34], [67.0, 68.2], [70.0, 70.61], [71.0, 79.61], [81.0, 82.46], [83.0, 83.74], [93.0, 93.93], [95.0, 95.49], [98.0, 98.73], [99.0, 99.91], [102.0, 104.3], [105.0, 107.42], [108.0, 109.0], [111.0, 112.24], [113.0, 113.86], [115.0, 115.65], [122.0, 122.28], [123.0, 125.83], [127.0, 127.06], [128.0, 130.47], [132.0, 132.34], [133.0, 135.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 96.89, 0.0, 0.0, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.88, 0.0, 0.0, 0.0, 0.0, 0.0, 55.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.23, 99.87, 0.0, 0.0, 0.0, 0.0, 0.0, 60.79, 0.0, 40.28, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["noise", 10.92], ["speech", 5.29], ["walk, footsteps", 4.5]], null, null, null, null, null, null, null, null, [["speech", 73.1], ["sidetone", 3.68], ["radio", 2.34]], null, null], "duration": [-0.23, 3.51, 1.09, 0.85, 4.22, 0.11, 0.52, 0.17, 0.26, 0.51, 0.04, 0.46, 1.87, 0.13, 2.42, 1.27, 0.24, 1.34, 1.2, 0.61, 8.61, 1.46, 0.74, 0.93, 0.49, 0.73, 0.91, 2.3, 2.42, 1.0, 1.24, 0.86, 0.65, 0.28, 2.83, 0.06, 2.47, 0.34, 2.46]} \ No newline at end of file diff --git a/annotations_filtered/eIo_S0aHyfI_filtered.json b/annotations_filtered/eIo_S0aHyfI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e426955ec1e5ec37c7bce0caa44336b6b9990955 --- /dev/null +++ b/annotations_filtered/eIo_S0aHyfI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.29], [12.0, 22.87], [26.0, 32.61], [33.0, 39.61], [42.0, 45.74], [49.0, 65.52], [66.0, 69.28], [70.0, 70.26], [71.0, 72.32], [74.0, 82.07], [84.0, 84.79], [89.0, 98.86], [104.0, 104.82], [105.0, 105.26], [111.0, 112.16], [114.0, 132.17]], "keep_status": [false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.79, 32.89, 30.37, 32.2, 33.05, 72.01, 0.0, 0.0, 98.99, 0.0, 78.72, 0.0, 0.0, 0.0, 36.24], "audiomae_on_audioset": [null, [["speech", 40.45], ["music", 31.22], ["electric shaver, electric razor", 8.86]], [["music", 42.41], ["speech", 9.38], ["vehicle", 4.47]], [["music", 69.38], ["theremin", 4.42], ["hum", 3.02]], [["moo", 14.98], ["cattle, bovinae", 14.41], ["music", 8.69]], [["mains hum", 17.86], ["hum", 17.37], ["whack, thwack", 16.12]], null, null, null, null, null, null, null, null, null, [["music", 52.35], ["hum", 10.1], ["throbbing", 9.26]]], "duration": [0.29, 10.87, 6.61, 6.61, 3.74, 16.52, 3.28, 0.26, 1.32, 8.07, 0.79, 9.86, 0.82, 0.26, 1.16, 18.17]} \ No newline at end of file diff --git a/annotations_filtered/eJ93IIgvVyI_filtered.json b/annotations_filtered/eJ93IIgvVyI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74d1a686b226a6faa14eced0387faa50dae87262 --- /dev/null +++ b/annotations_filtered/eJ93IIgvVyI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.77], [14.0, 15.82], [20.0, 20.83], [22.0, 21.84], [26.0, 27.01], [28.0, 28.73], [29.0, 33.84], [34.0, 37.1], [39.0, 46.6], [50.0, 51.09], [54.0, 56.39], [57.0, 58.55], [61.0, 61.94], [68.0, 70.34], [73.0, 74.09], [78.0, 78.07], [79.0, 79.84], [80.0, 94.12], [95.0, 95.77], [98.0, 100.85], [106.0, 114.99], [116.0, 117.61], [119.0, 119.72], [121.0, 123.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true], "silence_prob": [80.82, 0.0, 0.0, 0.0, 0.0, 0.0, 52.68, 74.92, 48.19, 0.0, 78.55, 0.0, 0.0, 80.64, 0.0, 0.0, 0.0, 62.99, 0.0, 42.67, 35.87, 0.0, 0.0, 40.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["didgeridoo", 46.52], ["music", 23.37], ["speech", 10.71]], null, null, null, null, null, null, null, null, null, null, [["music", 41.82], ["speech", 7.39], ["mantra", 5.16]], [["clang", 23.01], ["ding", 18.63], ["speech", 18.15]], null, null, [["throbbing", 22.82], ["hum", 17.2], ["sidetone", 13.07]]], "duration": [8.77, 1.82, 0.83, -0.16, 1.01, 0.73, 4.84, 3.1, 7.6, 1.09, 2.39, 1.55, 0.94, 2.34, 1.09, 0.07, 0.84, 14.12, 0.77, 2.85, 8.99, 1.61, 0.72, 2.33]} \ No newline at end of file diff --git a/annotations_filtered/eJPXQfvokV8_filtered.json b/annotations_filtered/eJPXQfvokV8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a78dd354bccbf13110b5d3c64f74c36a0b36014f --- /dev/null +++ b/annotations_filtered/eJPXQfvokV8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.71], [26.0, 27.89], [29.0, 31.92], [32.0, 37.96], [42.0, 43.73], [45.0, 46.48], [47.0, 51.93], [52.0, 64.93], [66.0, 81.46], [83.0, 88.11]], "keep_status": [false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 65.91, 42.67, 0.0, 0.0, 60.05, 30.62, 29.89, 33.24], "audiomae_on_audioset": [null, null, null, [["mains hum", 62.58], ["hum", 23.7], ["speech", 4.07]], null, null, null, [["speech", 21.44], ["music", 13.18], ["sidetone", 7.08]], [["music", 35.6], ["speech", 8.07], ["whip", 3.77]], [["hum", 36.64], ["mains hum", 36.3], ["speech", 8.12]]], "duration": [1.71, 1.89, 2.92, 5.96, 1.73, 1.48, 4.93, 12.93, 15.46, 5.11]} \ No newline at end of file diff --git a/annotations_filtered/eJWSp6A1Ks0_filtered.json b/annotations_filtered/eJWSp6A1Ks0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6500c333e0816e3cabcd4abdc297c795965a793e --- /dev/null +++ b/annotations_filtered/eJWSp6A1Ks0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.82]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.82]} \ No newline at end of file diff --git a/annotations_filtered/eK20uOpc_AM_filtered.json b/annotations_filtered/eK20uOpc_AM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81168fdc8ba14967e84ee4720bc7a99070475f56 --- /dev/null +++ b/annotations_filtered/eK20uOpc_AM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 16.78], [18.0, 18.89], [20.0, 38.48], [40.0, 42.18], [43.0, 44.46], [45.0, 45.39], [48.0, 48.22], [50.0, 55.9], [57.0, 57.57], [59.0, 59.12], [64.0, 64.54], [84.0, 84.32], [88.0, 87.93], [89.0, 91.3], [93.0, 94.12], [95.0, 95.61], [98.0, 98.52], [101.0, 102.41], [103.0, 105.66], [110.0, 112.19], [115.0, 115.75], [119.0, 119.21], [121.0, 123.18], [124.0, 126.72], [132.0, 132.75], [133.0, 134.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.27, 0.0, 35.62, 45.49, 0.0, 0.0, 0.0, 44.18, 0.0, 0.0, 0.0, 0.0, 0.0, 50.66, 0.0, 0.0, 0.0, 0.0, 90.43, 32.87, 0.0, 0.0, 35.12, 40.4, 0.0, 0.0], "audiomae_on_audioset": [[["music", 31.46], ["whack, thwack", 28.79], ["thunk", 11.25]], null, [["music", 46.28], ["speech", 20.4], ["whack, thwack", 16.95]], [["music", 59.58], ["throbbing", 8.45], ["hum", 5.17]], null, null, null, [["music", 59.98], ["speech", 13.75], ["theremin", 3.6]], null, null, null, null, null, null, null, null, null, null, null, [["music", 61.69], ["thunk", 4.35], ["bang", 4.16]], null, null, [["music", 36.4], ["burping, eructation", 27.93], ["grunt", 16.09]], [["music", 72.98], ["grunt", 9.28], ["didgeridoo", 3.45]], null, null], "duration": [3.78, 0.89, 18.48, 2.18, 1.46, 0.39, 0.22, 5.9, 0.57, 0.12, 0.54, 0.32, -0.07, 2.3, 1.12, 0.61, 0.52, 1.41, 2.66, 2.19, 0.75, 0.21, 2.18, 2.72, 0.75, 1.79]} \ No newline at end of file diff --git a/annotations_filtered/eK5PghRFnBI_filtered.json b/annotations_filtered/eK5PghRFnBI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71970e4289a70fd78bdbb1cf999540c850dd4059 --- /dev/null +++ b/annotations_filtered/eK5PghRFnBI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.97], [9.0, 10.91], [13.0, 34.55], [35.0, 35.38], [36.0, 36.8], [37.0, 40.61], [41.0, 43.06], [48.0, 48.64], [50.0, 50.84]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 43.38, 0.0, 0.0, 34.12, 36.46, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 73.29], ["synthesizer", 5.47], ["musical instrument", 4.2]], null, null, [["music", 49.16], ["speech", 28.07], ["musical instrument", 7.51]], [["music", 69.62], ["boing", 13.81], ["speech", 4.48]], null, null], "duration": [-0.03, 1.91, 21.55, 0.38, 0.8, 3.61, 2.06, 0.64, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/eKCkxzJFP5M_filtered.json b/annotations_filtered/eKCkxzJFP5M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62f6ab4193a6246db2ecd86e2758e1f974f99902 --- /dev/null +++ b/annotations_filtered/eKCkxzJFP5M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.26], [17.0, 18.1], [19.0, 20.7], [24.0, 26.23], [28.0, 29.57], [32.0, 32.8], [35.0, 35.99], [37.0, 39.26], [41.0, 42.11], [44.0, 44.24], [49.0, 50.67], [54.0, 56.08], [59.0, 76.22], [79.0, 80.57], [84.0, 85.23], [86.0, 86.71], [90.0, 90.58], [92.0, 93.61], [95.0, 95.27], [96.0, 97.6], [99.0, 100.23], [104.0, 104.48], [106.0, 107.5], [120.0, 121.56], [122.0, 123.53], [126.0, 127.38], [129.0, 129.44], [131.0, 131.45], [133.0, 133.69], [135.0, 135.95], [145.0, 147.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 54.76, 0.0, 0.0, 0.0, 87.37, 0.0, 0.0, 0.0, 94.07, 92.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 62.23], ["electronic music", 11.27], ["pulse", 4.45]]], "duration": [1.26, 1.1, 1.7, 2.23, 1.57, 0.8, 0.99, 2.26, 1.11, 0.24, 1.67, 2.08, 17.22, 1.57, 1.23, 0.71, 0.58, 1.61, 0.27, 1.6, 1.23, 0.48, 1.5, 1.56, 1.53, 1.38, 0.44, 0.45, 0.69, 0.95, 2.75]} \ No newline at end of file diff --git a/annotations_filtered/eKCpwUXh_Qs_filtered.json b/annotations_filtered/eKCpwUXh_Qs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e70382282e7af674ca17d390eb9d209cd560601c --- /dev/null +++ b/annotations_filtered/eKCpwUXh_Qs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.01], [21.0, 21.93], [23.0, 24.54], [31.0, 32.81], [34.0, 34.67], [36.0, 55.68], [67.0, 73.5], [80.0, 82.16], [84.0, 84.97], [89.0, 89.77], [91.0, 92.85], [95.0, 96.09], [100.0, 100.79], [103.0, 104.52], [108.0, 108.45], [118.0, 122.69], [124.0, 130.35], [145.0, 145.3], [146.0, 147.88], [151.0, 151.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 39.35, 92.64, 74.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.64, 99.36, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["breaking", 38.92], ["music", 28.74], ["speech", 16.58]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.01, 0.93, 1.54, 1.81, 0.67, 19.68, 6.5, 2.16, 0.97, 0.77, 1.85, 1.09, 0.79, 1.52, 0.45, 4.69, 6.35, 0.3, 1.88, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/eKJv3dWsZ7E_filtered.json b/annotations_filtered/eKJv3dWsZ7E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f276db1fd06e30678a3186456fb6a097aa224a4 --- /dev/null +++ b/annotations_filtered/eKJv3dWsZ7E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.11], [17.0, 17.73], [26.0, 26.33], [46.0, 46.2], [47.0, 48.73]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [1.11, 0.73, 0.33, 0.2, 1.73]} \ No newline at end of file diff --git a/annotations_filtered/eKKd33QEB3I_filtered.json b/annotations_filtered/eKKd33QEB3I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4717bf5a72ad86b545bfd679de74a77e15cc8446 --- /dev/null +++ b/annotations_filtered/eKKd33QEB3I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.34], [14.0, 14.45], [21.0, 21.27], [24.0, 24.95], [26.0, 26.33], [28.0, 28.41], [30.0, 30.05], [34.0, 35.83]], "keep_status": [true, false, false, false, false, false, false, false], "silence_prob": [30.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 29.98], ["vehicle", 23.49], ["car", 13.76]], null, null, null, null, null, null, null], "duration": [5.34, 0.45, 0.27, 0.95, 0.33, 0.41, 0.05, 1.83]} \ No newline at end of file diff --git a/annotations_filtered/eKLKoFIrXgg_filtered.json b/annotations_filtered/eKLKoFIrXgg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08b3faa35cd7a6a217c659a392d0affcb5f90433 --- /dev/null +++ b/annotations_filtered/eKLKoFIrXgg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.81], [5.0, 7.23], [8.0, 9.36], [10.0, 14.62], [15.0, 16.85], [18.0, 18.96], [20.0, 21.36], [22.0, 22.77], [24.0, 24.73], [26.0, 26.23], [27.0, 27.84], [29.0, 32.63], [34.0, 36.12], [43.0, 52.2], [53.0, 54.55], [56.0, 56.54], [59.0, 60.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 85.9, 0.0, 80.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.13, 61.27, 29.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 27.09], ["music", 20.59], ["gong", 12.08]], null, null, null], "duration": [0.81, 2.23, 1.36, 4.62, 1.85, 0.96, 1.36, 0.77, 0.73, 0.23, 0.84, 3.63, 2.12, 9.2, 1.55, 0.54, 1.37]} \ No newline at end of file diff --git a/annotations_filtered/eKbXO0f-mvw_filtered.json b/annotations_filtered/eKbXO0f-mvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c1947b3e408a6fee92b79caf2118c303abd3013 --- /dev/null +++ b/annotations_filtered/eKbXO0f-mvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 31.08], [31.0, 38.16], [47.0, 55.32], [61.0, 72.49], [75.0, 89.45]], "keep_status": [true, false, true, true, true], "silence_prob": [31.47, 31.63, 31.91, 31.83, 31.33], "audiomae_on_audioset": [[["music", 31.57], ["hum", 14.05], ["electronic music", 9.81]], [["music", 35.97], ["speech", 34.07], ["throbbing", 8.35]], [["music", 61.08], ["synthesizer", 4.55], ["speech", 4.29]], [["music", 47.02], ["speech", 12.49], ["moo", 5.27]], [["music", 28.68], ["speech", 9.49], ["cattle, bovinae", 7.58]]], "duration": [6.08, 7.16, 8.32, 11.49, 14.45]} \ No newline at end of file diff --git a/annotations_filtered/eKeTSR1yYfY_filtered.json b/annotations_filtered/eKeTSR1yYfY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b5874ab85115cf5d4934e6c8c4ce39f0ec10c61 --- /dev/null +++ b/annotations_filtered/eKeTSR1yYfY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.09], [11.0, 11.21], [13.0, 15.31], [18.0, 18.27], [24.0, 23.94], [27.0, 26.96], [31.0, 31.58], [33.0, 33.39], [42.0, 43.33], [45.0, 45.59], [49.0, 49.65], [51.0, 51.48], [52.0, 52.68], [57.0, 58.16], [60.0, 61.37], [63.0, 64.76], [66.0, 66.41], [69.0, 74.8], [75.0, 83.19], [84.0, 114.76], [118.0, 118.71], [122.0, 137.17], [143.0, 145.64], [148.0, 155.53]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 44.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.83, 32.48, 0.0, 0.0, 32.5, 30.41, 33.16], "audiomae_on_audioset": [null, null, [["livestock, farm animals, working animals", 34.55], ["cattle, bovinae", 9.79], ["music", 8.32]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 49.94], ["theremin", 21.1], ["synthesizer", 5.16]], [["music", 39.45], ["speech", 25.14], ["thunk", 7.15]], null, null, [["music", 36.83], ["speech", 29.12], ["whack, thwack", 8.53]], [["music", 25.21], ["speech", 18.18], ["cacophony", 6.58]], [["music", 74.59], ["speech", 9.07], ["electronic music", 1.63]]], "duration": [1.09, 0.21, 2.31, 0.27, -0.06, -0.04, 0.58, 0.39, 1.33, 0.59, 0.65, 0.48, 0.68, 1.16, 1.37, 1.76, 0.41, 5.8, 8.19, 30.76, 0.71, 15.17, 2.64, 7.53]} \ No newline at end of file diff --git a/annotations_filtered/eKmMFRdNCEw_filtered.json b/annotations_filtered/eKmMFRdNCEw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ba5bbe47cd93dcea8b92354f3b79dd91dcbf7f8 --- /dev/null +++ b/annotations_filtered/eKmMFRdNCEw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.22], [20.0, 22.91], [24.0, 27.14], [32.0, 32.68], [34.0, 35.56], [39.0, 38.91], [40.0, 39.99], [41.0, 42.75], [44.0, 49.49], [50.0, 51.58], [52.0, 54.75], [58.0, 58.29], [60.0, 60.84], [68.0, 68.44], [70.0, 71.61], [72.0, 73.23], [76.0, 78.04], [79.0, 80.81], [82.0, 83.13], [84.0, 86.02], [90.0, 91.37], [92.0, 95.12], [97.0, 98.29], [99.0, 99.74], [107.0, 107.3], [110.0, 110.35], [111.0, 123.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 86.09, 99.26, 0.0, 0.0, 0.0, 0.0, 0.0, 66.76, 0.0, 69.74, 0.0, 0.0, 0.0, 0.0, 0.0, 88.46, 0.0, 0.0, 99.44, 0.0, 90.6, 0.0, 0.0, 0.0, 0.0, 98.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.22, 2.91, 3.14, 0.68, 1.56, -0.09, -0.01, 1.75, 5.49, 1.58, 2.75, 0.29, 0.84, 0.44, 1.61, 1.23, 2.04, 1.81, 1.13, 2.02, 1.37, 3.12, 1.29, 0.74, 0.3, 0.35, 12.67]} \ No newline at end of file diff --git a/annotations_filtered/eKrEVWGTuRg_filtered.json b/annotations_filtered/eKrEVWGTuRg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c4ca241137f04bb902120df191f281f10a98ab9 --- /dev/null +++ b/annotations_filtered/eKrEVWGTuRg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 5.83], [8.0, 12.56], [13.0, 13.86], [15.0, 16.01], [18.0, 18.52], [21.0, 22.15], [24.0, 24.26], [25.0, 25.96], [27.0, 29.71], [33.0, 33.22], [34.0, 35.02], [42.0, 42.52], [46.0, 47.55], [51.0, 51.07], [53.0, 55.83], [57.0, 58.29], [59.0, 59.66], [63.0, 63.36], [67.0, 67.58], [71.0, 72.2], [75.0, 76.08], [87.0, 96.03], [97.0, 97.12], [99.0, 100.23], [105.0, 109.48], [115.0, 115.57], [118.0, 120.21], [121.0, 138.1], [145.0, 145.79], [153.0, 165.16], [167.0, 170.92]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false], "silence_prob": [35.19, 71.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.78, 0.0, 0.0, 0.0, 0.0, 0.0, 53.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.73, 0.0, 0.0, 45.62, 0.0, 63.31, 56.18, 0.0, 32.76, 89.9], "audiomae_on_audioset": [[["speech", 63.31], ["hum", 4.81], ["bee, wasp, etc.", 3.82]], null, null, null, null, null, null, null, [["music", 11.45], ["hum", 8.97], ["speech", 7.42]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 75.0], ["inside, small room", 2.75], ["screaming", 2.35]], null, null, [["whale vocalization", 25.06], ["dial tone", 12.53], ["busy signal", 6.6]], null, null, null, null, [["beatboxing", 31.01], ["whack, thwack", 9.26], ["speech", 8.77]], null], "duration": [5.83, 4.56, 0.86, 1.01, 0.52, 1.15, 0.26, 0.96, 2.71, 0.22, 1.02, 0.52, 1.55, 0.07, 2.83, 1.29, 0.66, 0.36, 0.58, 1.2, 1.08, 9.03, 0.12, 1.23, 4.48, 0.57, 2.21, 17.1, 0.79, 12.16, 3.92]} \ No newline at end of file diff --git a/annotations_filtered/eKxv7whkFMM_filtered.json b/annotations_filtered/eKxv7whkFMM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb7dfcda99a6bb2bb7f8b26c257987cb13b7cba0 --- /dev/null +++ b/annotations_filtered/eKxv7whkFMM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 25.62], [27.0, 27.21], [30.0, 30.37], [30.0, 30.42], [47.0, 48.63], [51.0, 51.88], [55.0, 56.35], [63.0, 64.18], [65.0, 79.62], [81.0, 82.07]], "keep_status": [true, false, false, false, false, false, false, false, true, false], "silence_prob": [31.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.75, 0.0], "audiomae_on_audioset": [[["speech", 17.58], ["moo", 16.89], ["cattle, bovinae", 13.61]], null, null, null, null, null, null, null, [["speech", 50.68], ["whale vocalization", 6.55], ["animal", 5.46]], null], "duration": [4.62, 0.21, 0.37, 0.42, 1.63, 0.88, 1.35, 1.18, 14.62, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/eL2DjnXT4wQ_filtered.json b/annotations_filtered/eL2DjnXT4wQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2ec35caaa8248521b7191ced0ccb7ef6ff734fa --- /dev/null +++ b/annotations_filtered/eL2DjnXT4wQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.64], [17.0, 16.95], [19.0, 29.35], [30.0, 30.99]], "keep_status": [false, false, true, false], "silence_prob": [34.03, 0.0, 39.17, 0.0], "audiomae_on_audioset": [[["music", 65.71], ["musical instrument", 6.75], ["guitar", 5.75]], null, [["music", 41.12], ["speech", 22.48], ["shuffling cards", 4.98]], null], "duration": [7.64, -0.05, 10.35, 0.99]} \ No newline at end of file diff --git a/annotations_filtered/eL62rDiuqDE_filtered.json b/annotations_filtered/eL62rDiuqDE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51d069d3abd02b3c7ef776efd7ebedc70cc414fc --- /dev/null +++ b/annotations_filtered/eL62rDiuqDE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[80.0, 94.76], [95.0, 95.08], [97.0, 100.23], [103.0, 119.5], [120.0, 121.12], [126.0, 127.53], [130.0, 130.64], [133.0, 133.74], [135.0, 136.32], [139.0, 140.66], [141.0, 145.89]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [46.36, 0.0, 81.89, 40.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.43], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 41.91], ["cattle, bovinae", 22.05], ["moo", 17.95]], null, null, [["livestock, farm animals, working animals", 27.36], ["moo", 18.07], ["cattle, bovinae", 15.9]], null, null, null, null, null, null, null], "duration": [14.76, 0.08, 3.23, 16.5, 1.12, 1.53, 0.64, 0.74, 1.32, 1.66, 4.89]} \ No newline at end of file diff --git a/annotations_filtered/eL9aiYpAyI0_filtered.json b/annotations_filtered/eL9aiYpAyI0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b33c1c4decfa57415e2094c14a6b6f68a7392a98 --- /dev/null +++ b/annotations_filtered/eL9aiYpAyI0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.07], [17.0, 18.57], [35.0, 35.13], [36.0, 36.53], [38.0, 41.91], [48.0, 58.08], [61.0, 62.23]], "keep_status": [false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.52, 34.57, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 18.02], ["music", 7.54], ["fart", 6.07]], [["music", 19.76], ["speech", 12.26], ["chant", 8.35]], null], "duration": [0.07, 1.57, 0.13, 0.53, 3.91, 10.08, 1.23]} \ No newline at end of file diff --git a/annotations_filtered/eLFf1LzuM1Q_filtered.json b/annotations_filtered/eLFf1LzuM1Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d9e8d914bbc59ea8bfa1bcac3d792b6bc4a33c1 --- /dev/null +++ b/annotations_filtered/eLFf1LzuM1Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.58], [15.0, 15.5], [17.0, 17.69], [22.0, 22.18], [28.0, 28.51], [30.0, 31.04], [32.0, 32.31], [35.0, 36.8], [37.0, 37.86], [39.0, 40.88], [41.0, 48.29], [49.0, 52.32], [54.0, 56.0], [59.0, 60.08], [61.0, 66.06], [68.0, 68.13], [70.0, 75.42], [77.0, 81.5], [82.0, 84.37], [85.0, 91.08], [92.0, 93.38], [96.0, 95.93], [97.0, 97.33], [98.0, 99.03], [101.0, 101.73], [106.0, 106.08], [108.0, 110.69], [111.0, 115.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.77, 83.16, 96.54, 0.0, 98.1, 0.0, 94.52, 99.1, 98.8, 91.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.42, 76.2], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.58, 0.5, 0.69, 0.18, 0.51, 1.04, 0.31, 1.8, 0.86, 1.88, 7.29, 3.32, 2.0, 1.08, 5.06, 0.13, 5.42, 4.5, 2.37, 6.08, 1.38, -0.07, 0.33, 1.03, 0.73, 0.08, 2.69, 4.91]} \ No newline at end of file diff --git a/annotations_filtered/eLLzlb1SN2M_filtered.json b/annotations_filtered/eLLzlb1SN2M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd8b3e0a3d23102c5f1c4a0e838cf3861842669f --- /dev/null +++ b/annotations_filtered/eLLzlb1SN2M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.06], [4.0, 16.43], [19.0, 20.31], [24.0, 26.49], [27.0, 28.29], [30.0, 30.45], [32.0, 35.13], [35.0, 36.61], [38.0, 41.61], [43.0, 46.41], [57.0, 57.43], [62.0, 63.29], [66.0, 68.55], [70.0, 76.54], [80.0, 91.81], [93.0, 94.2], [97.0, 104.26], [106.0, 106.88], [110.0, 113.78], [115.0, 124.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 65.44, 0.0, 99.98, 0.0, 0.0, 100.0, 0.0, 99.26, 94.22, 0.0, 0.0, 88.64, 99.98, 34.25, 0.0, 55.89, 0.0, 75.88, 46.12], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 57.88], ["screaming", 5.68], ["explosion", 5.1]], null, null, null, null, [["music", 72.33], ["speech", 6.38], ["throbbing", 1.8]]], "duration": [1.06, 12.43, 1.31, 2.49, 1.29, 0.45, 3.13, 1.61, 3.61, 3.41, 0.43, 1.29, 2.55, 6.54, 11.81, 1.2, 7.26, 0.88, 3.78, 9.65]} \ No newline at end of file diff --git a/annotations_filtered/eLW6uxK_MOI_filtered.json b/annotations_filtered/eLW6uxK_MOI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ef779429ab90ff00f8a80b001283c557e2dc640 --- /dev/null +++ b/annotations_filtered/eLW6uxK_MOI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 28.78]], "keep_status": [true], "silence_prob": [31.76], "audiomae_on_audioset": [[["music", 35.37], ["speech", 15.08], ["crowd", 4.13]]], "duration": [2.78]} \ No newline at end of file diff --git a/annotations_filtered/eLdQluY23UI_filtered.json b/annotations_filtered/eLdQluY23UI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fefe05d16a8b0260615865f040df6a68722cdfac --- /dev/null +++ b/annotations_filtered/eLdQluY23UI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.34], [6.0, 7.84], [8.0, 9.64], [10.0, 17.74], [21.0, 22.1], [28.0, 31.14], [33.0, 43.11], [50.0, 50.36], [53.0, 53.0], [54.0, 56.12], [57.0, 57.6], [60.0, 60.17], [65.0, 64.74], [65.0, 65.48], [68.0, 67.95], [69.0, 69.01], [70.0, 69.84], [71.0, 73.09], [74.0, 78.33], [79.0, 80.4], [91.0, 95.64], [96.0, 97.02], [100.0, 100.57], [102.0, 106.49], [110.0, 116.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 95.37, 0.0, 94.52, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.59, 0.0, 82.43, 0.0, 0.0, 100.0, 99.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.34, 1.84, 1.64, 7.74, 1.1, 3.14, 10.11, 0.36, 0.0, 2.12, 0.6, 0.17, -0.26, 0.48, -0.05, 0.01, -0.16, 2.09, 4.33, 1.4, 4.64, 1.02, 0.57, 4.49, 6.46]} \ No newline at end of file diff --git a/annotations_filtered/eLyhRYJXf1U_filtered.json b/annotations_filtered/eLyhRYJXf1U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3cb5397fe727aa364a0c0475a72fe9b40747e5c --- /dev/null +++ b/annotations_filtered/eLyhRYJXf1U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 31.92], [34.0, 58.77], [59.0, 58.82], [59.0, 60.57], [63.0, 72.28], [76.0, 90.53], [93.0, 115.96], [117.0, 118.07], [123.0, 127.41], [127.0, 127.62], [130.0, 141.67], [143.0, 145.99], [147.0, 163.61], [165.0, 169.74]], "keep_status": [true, false, false, false, false, false, true, false, false, false, false, true, true, true], "silence_prob": [33.83, 30.31, 0.0, 0.0, 34.24, 30.32, 30.06, 0.0, 29.75, 0.0, 31.88, 46.5, 29.88, 30.18], "audiomae_on_audioset": [[["speech", 30.19], ["music", 21.42], ["sidetone", 6.59]], [["music", 54.81], ["throbbing", 12.63], ["hum", 8.62]], null, null, [["music", 78.31], ["hum", 5.1], ["whale vocalization", 2.51]], [["speech", 48.68], ["music", 14.6], ["explosion", 8.41]], [["music", 54.95], ["cacophony", 7.09], ["hum", 5.96]], null, [["music", 62.35], ["electronic music", 5.26], ["throbbing", 3.65]], null, [["mains hum", 40.3], ["hum", 30.19], ["music", 14.24]], [["hum", 17.12], ["music", 15.75], ["mains hum", 15.27]], [["music", 35.14], ["hum", 9.82], ["civil defense siren", 9.52]], [["explosion", 17.63], ["hum", 15.2], ["music", 12.89]]], "duration": [19.92, 24.77, -0.18, 1.57, 9.28, 14.53, 22.96, 1.07, 4.41, 0.62, 11.67, 2.99, 16.61, 4.74]} \ No newline at end of file diff --git a/annotations_filtered/eM3CovgD8Bo_filtered.json b/annotations_filtered/eM3CovgD8Bo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b25c5e0406e90409320e89a6f3c6ed781e5d9441 --- /dev/null +++ b/annotations_filtered/eM3CovgD8Bo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.7], [6.0, 7.59], [10.0, 10.81], [12.0, 13.09], [13.0, 14.18], [16.0, 17.47], [25.0, 26.16], [28.0, 28.71], [31.0, 31.11], [33.0, 35.07], [37.0, 37.07], [45.0, 46.8], [50.0, 50.67], [57.0, 57.33], [75.0, 75.29], [86.0, 86.09], [106.0, 106.03], [113.0, 114.24], [115.0, 116.14], [117.0, 116.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.7, 1.59, 0.81, 1.09, 1.18, 1.47, 1.16, 0.71, 0.11, 2.07, 0.07, 1.8, 0.67, 0.33, 0.29, 0.09, 0.03, 1.24, 1.14, -0.15]} \ No newline at end of file diff --git a/annotations_filtered/eMFxQti1xHU_filtered.json b/annotations_filtered/eMFxQti1xHU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de526496fa0fe6d05215317dc29ecb2194ed1855 --- /dev/null +++ b/annotations_filtered/eMFxQti1xHU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.84], [25.0, 27.13], [28.0, 28.51], [31.0, 30.6], [46.0, 47.19], [48.0, 48.49], [57.0, 58.94], [61.0, 65.79], [69.0, 74.44], [76.0, 77.87], [80.0, 84.43], [101.0, 102.22], [115.0, 117.21], [128.0, 127.95]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 38.95, 0.0, 0.0, 0.0, 0.0, 0.0, 80.82, 76.86, 0.0, 60.51, 0.0, 46.54, 0.0], "audiomae_on_audioset": [null, [["speech", 33.0], ["music", 18.96], ["stomach rumble", 3.75]], null, null, null, null, null, null, null, null, null, null, [["music", 27.59], ["synthesizer", 5.78], ["vehicle", 5.67]], null], "duration": [1.84, 2.13, 0.51, -0.4, 1.19, 0.49, 1.94, 4.79, 5.44, 1.87, 4.43, 1.22, 2.21, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/eMHv9pPuDiI_filtered.json b/annotations_filtered/eMHv9pPuDiI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c3c600c8f916379cb8d008c21b561ad5f4d6ef0 --- /dev/null +++ b/annotations_filtered/eMHv9pPuDiI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.26], [12.0, 15.6], [17.0, 18.44], [19.0, 23.4], [24.0, 25.62], [31.0, 34.01], [36.0, 37.49], [40.0, 49.25], [51.0, 67.53], [69.0, 73.79], [77.0, 77.28], [82.0, 83.47], [85.0, 86.83], [88.0, 95.98], [101.0, 105.95], [107.0, 113.54]], "keep_status": [true, false, false, false, false, true, false, true, false, true, false, false, false, false, false, true], "silence_prob": [29.44, 31.23, 0.0, 30.76, 0.0, 32.33, 0.0, 29.21, 29.86, 29.59, 0.0, 0.0, 0.0, 29.68, 29.73, 29.81], "audiomae_on_audioset": [[["music", 56.71], ["cacophony", 3.45], ["electronic music", 2.12]], [["fly, housefly", 57.16], ["insect", 18.37], ["bee, wasp, etc.", 10.87]], null, [["throbbing", 41.6], ["hum", 17.09], ["music", 12.92]], null, [["music", 45.68], ["buzz", 10.62], ["scary music", 4.65]], null, [["music", 29.95], ["explosion", 18.01], ["hum", 9.87]], [["hum", 40.16], ["music", 22.54], ["throbbing", 18.92]], [["music", 41.28], ["speech", 22.49], ["throbbing", 5.1]], null, null, null, [["hum", 39.2], ["throbbing", 20.23], ["mains hum", 18.13]], [["speech", 30.9], ["hum", 24.07], ["mains hum", 21.47]], [["speech", 43.04], ["music", 11.9], ["eruption", 3.8]]], "duration": [5.26, 3.6, 1.44, 4.4, 1.62, 3.01, 1.49, 9.25, 16.53, 4.79, 0.28, 1.47, 1.83, 7.98, 4.95, 6.54]} \ No newline at end of file diff --git a/annotations_filtered/eMURCJgRJYM_filtered.json b/annotations_filtered/eMURCJgRJYM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f54cd42a3d7716cd527e7aa63ebcbf32ebba698 --- /dev/null +++ b/annotations_filtered/eMURCJgRJYM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.98], [11.0, 42.31], [43.0, 43.24], [45.0, 49.82], [53.0, 54.58], [55.0, 62.19], [64.0, 80.94], [84.0, 89.26], [90.0, 90.22], [96.0, 96.75], [101.0, 100.94], [103.0, 103.67], [106.0, 107.52], [109.0, 109.34]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 46.64, 0.0, 45.92, 31.0, 53.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 47.51], ["speech", 23.48], ["throbbing", 10.44]], null, [["hum", 29.52], ["throbbing", 23.88], ["music", 18.93]], [["music", 31.13], ["speech", 29.22], ["didgeridoo", 6.66]], null, null, null, null, null, null, null], "duration": [-0.02, 31.31, 0.24, 4.82, 1.58, 7.19, 16.94, 5.26, 0.22, 0.75, -0.06, 0.67, 1.52, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/eMgfTq1Z2n8_filtered.json b/annotations_filtered/eMgfTq1Z2n8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e945aeb5d3713de4716d832bac89e6a73573d9fd --- /dev/null +++ b/annotations_filtered/eMgfTq1Z2n8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.62], [8.0, 8.6], [11.0, 17.46], [18.0, 30.97], [34.0, 34.33], [42.0, 49.44], [54.0, 55.0], [66.0, 72.39], [75.0, 81.51], [84.0, 83.96], [84.0, 85.94], [87.0, 89.56], [91.0, 91.2], [92.0, 92.53], [95.0, 95.98], [97.0, 98.22], [99.0, 98.96], [103.0, 110.81], [112.0, 122.49], [123.0, 131.25], [133.0, 138.96], [141.0, 141.59], [144.0, 146.04], [149.0, 151.63]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 75.07, 37.67, 0.0, 49.68, 0.0, 41.87, 51.18, 0.0, 0.0, 46.09, 0.0, 0.0, 0.0, 0.0, 0.0, 33.91, 54.23, 97.22, 97.92, 0.0, 53.4, 94.52], "audiomae_on_audioset": [null, null, null, [["hum", 27.76], ["speech", 19.05], ["mains hum", 17.94]], null, [["hum", 32.76], ["mains hum", 21.87], ["buzz", 11.86]], null, [["speech", 40.83], ["music", 33.21], ["animal", 4.3]], null, null, null, [["music", 45.83], ["hum", 11.49], ["electronic music", 6.85]], null, null, null, null, null, [["music", 40.99], ["didgeridoo", 17.3], ["hum", 7.88]], null, null, null, null, null, null], "duration": [1.62, 0.6, 6.46, 12.97, 0.33, 7.44, 1.0, 6.39, 6.51, -0.04, 1.94, 2.56, 0.2, 0.53, 0.98, 1.22, -0.04, 7.81, 10.49, 8.25, 5.96, 0.59, 2.04, 2.63]} \ No newline at end of file diff --git a/annotations_filtered/eMuBBjnM4yo_filtered.json b/annotations_filtered/eMuBBjnM4yo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2422f60e61fb5181c6f08080584dba6b842fcfe1 --- /dev/null +++ b/annotations_filtered/eMuBBjnM4yo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 19.25], [23.0, 25.35], [26.0, 29.25], [29.0, 29.88], [33.0, 35.21], [37.0, 37.34], [39.0, 39.09], [41.0, 42.16], [46.0, 46.5], [53.0, 54.7], [59.0, 60.59], [61.0, 62.67], [63.0, 67.05], [69.0, 69.47], [72.0, 72.42], [74.0, 74.71], [77.0, 81.4], [82.0, 83.15], [84.0, 85.35], [89.0, 89.13], [90.0, 94.04]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.11, 88.1, 46.05, 0.0, 57.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.75, 0.0, 0.0, 0.0, 68.8, 0.0, 0.0, 0.0, 99.78], "audiomae_on_audioset": [null, null, [["speech", 30.63], ["fart", 15.67], ["fly, housefly", 8.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.25, 2.35, 3.25, 0.88, 2.21, 0.34, 0.09, 1.16, 0.5, 1.7, 1.59, 1.67, 4.05, 0.47, 0.42, 0.71, 4.4, 1.15, 1.35, 0.13, 4.04]} \ No newline at end of file diff --git a/annotations_filtered/eMyuRmZNaTk_filtered.json b/annotations_filtered/eMyuRmZNaTk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c308f687939d8f7ddd5a8ea7996a511056f1dc26 --- /dev/null +++ b/annotations_filtered/eMyuRmZNaTk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[149.0, 150.58], [154.0, 219.77]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.58, 65.77]} \ No newline at end of file diff --git a/annotations_filtered/eN4fDGHpf_c_filtered.json b/annotations_filtered/eN4fDGHpf_c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b96440fdb88858d46320586235f4633b511e8788 --- /dev/null +++ b/annotations_filtered/eN4fDGHpf_c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.44], [14.0, 14.74], [20.0, 23.94], [32.0, 33.35], [44.0, 44.51], [49.0, 62.48]], "keep_status": [false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 36.59, 0.0, 0.0, 31.71], "audiomae_on_audioset": [null, null, [["music", 21.33], ["didgeridoo", 16.69], ["speech", 15.93]], null, null, [["speech", 54.53], ["music", 36.29], ["didgeridoo", 1.13]]], "duration": [1.44, 0.74, 3.94, 1.35, 0.51, 13.48]} \ No newline at end of file diff --git a/annotations_filtered/eN7zGm5KKrI_filtered.json b/annotations_filtered/eN7zGm5KKrI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df78e4b4ada3c1c5a61d96794366845d68d4b9b3 --- /dev/null +++ b/annotations_filtered/eN7zGm5KKrI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.48], [5.0, 5.61], [13.0, 18.76], [20.0, 24.93], [26.0, 28.43], [30.0, 44.36], [46.0, 46.41], [47.0, 47.58], [50.0, 51.04], [52.0, 53.2], [54.0, 56.1], [57.0, 56.93], [58.0, 59.76], [63.0, 64.86], [68.0, 78.49], [79.0, 82.34], [85.0, 86.24], [90.0, 94.07], [97.0, 97.36], [98.0, 98.15], [104.0, 107.64], [108.0, 110.78], [112.0, 113.36], [114.0, 114.78], [115.0, 121.17], [127.0, 128.06], [129.0, 129.2]], "keep_status": [false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.42, 47.31, 30.7, 31.42, 0.0, 0.0, 0.0, 0.0, 54.1, 0.0, 0.0, 0.0, 30.48, 57.17, 0.0, 30.47, 0.0, 0.0, 32.12, 90.6, 0.0, 0.0, 89.9, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["mains hum", 15.82], ["hum", 15.16], ["chirp tone", 13.56]], [["sine wave", 12.18], ["hum", 10.59], ["chirp tone", 10.04]], [["scratching (performance technique)", 20.75], ["speech", 16.75], ["beatboxing", 10.88]], [["whack, thwack", 35.14], ["speech", 31.41], ["music", 10.21]], null, null, null, null, null, null, null, null, [["music", 62.8], ["speech", 16.24], ["whack, thwack", 2.46]], null, null, [["music", 56.35], ["speech", 13.23], ["whack, thwack", 5.24]], null, null, [["didgeridoo", 60.83], ["music", 10.77], ["frog", 8.8]], null, null, null, null, null, null], "duration": [1.48, 0.61, 5.76, 4.93, 2.43, 14.36, 0.41, 0.58, 1.04, 1.2, 2.1, -0.07, 1.76, 1.86, 10.49, 3.34, 1.24, 4.07, 0.36, 0.15, 3.64, 2.78, 1.36, 0.78, 6.17, 1.06, 0.2]} \ No newline at end of file diff --git a/annotations_filtered/eNCK08cInIE_filtered.json b/annotations_filtered/eNCK08cInIE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb5cb08847cf8559b9ccfeb4c85d778e3cba7cd4 --- /dev/null +++ b/annotations_filtered/eNCK08cInIE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.73], [19.0, 29.05], [30.0, 30.5], [31.0, 32.85], [37.0, 37.42], [41.0, 42.5], [47.0, 48.51], [50.0, 50.97], [54.0, 57.5], [62.0, 64.03], [68.0, 69.4], [73.0, 72.84], [73.0, 75.59], [77.0, 77.36], [79.0, 80.84], [85.0, 84.69], [86.0, 88.37], [89.0, 91.03], [92.0, 92.6], [98.0, 101.61], [102.0, 102.3], [103.0, 109.81], [110.0, 110.39], [115.0, 116.01], [117.0, 117.49], [121.0, 122.01]], "keep_status": [false, true, false, false, false, false, false, false, true, true, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 33.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.59, 34.65, 0.0, 0.0, 32.23, 0.0, 0.0, 0.0, 31.86, 34.04, 0.0, 29.7, 0.0, 28.76, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 25.76], ["mosquito", 19.3], ["ding", 6.99]], null, null, null, null, null, null, [["music", 15.56], ["speech", 15.37], ["vehicle", 9.32]], [["hum", 31.73], ["throbbing", 19.64], ["mains hum", 17.67]], null, null, [["speech", 64.56], ["music", 4.3], ["sidetone", 2.8]], null, null, null, [["speech", 28.65], ["sidetone", 20.52], ["music", 13.26]], [["throbbing", 40.5], ["music", 23.11], ["hum", 21.02]], null, [["music", 37.38], ["didgeridoo", 29.39], ["beatboxing", 10.85]], null, [["cattle, bovinae", 33.74], ["livestock, farm animals, working animals", 17.59], ["moo", 15.71]], null, null, null, null], "duration": [0.73, 10.05, 0.5, 1.85, 0.42, 1.5, 1.51, 0.97, 3.5, 2.03, 1.4, -0.16, 2.59, 0.36, 1.84, -0.31, 2.37, 2.03, 0.6, 3.61, 0.3, 6.81, 0.39, 1.01, 0.49, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/eNnr60_UZtg_filtered.json b/annotations_filtered/eNnr60_UZtg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..869ec3f1da6eb2dffd8bcc12d0574deee5b35c4b --- /dev/null +++ b/annotations_filtered/eNnr60_UZtg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[61.0, 60.78], [83.0, 84.57], [90.0, 93.83], [94.0, 95.37], [96.0, 96.53]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 51.02, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [-0.22, 1.57, 3.83, 1.37, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/eO1Jm4N4rlA_filtered.json b/annotations_filtered/eO1Jm4N4rlA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1071566ce19d9ce3fc8c2d9fea4ab0a538c27bf2 --- /dev/null +++ b/annotations_filtered/eO1Jm4N4rlA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.61], [12.0, 13.19], [17.0, 18.47], [21.0, 23.75], [25.0, 25.32], [27.0, 27.82], [31.0, 31.72], [35.0, 35.38], [36.0, 37.05], [38.0, 38.11], [52.0, 55.09], [56.0, 56.96], [58.0, 58.06], [59.0, 60.83], [62.0, 61.94], [63.0, 64.69], [66.0, 67.09], [70.0, 70.88], [72.0, 75.0], [76.0, 76.1], [79.0, 79.42], [81.0, 81.04], [81.0, 92.53], [95.0, 96.16], [100.0, 100.25], [103.0, 104.38], [108.0, 108.11], [112.0, 111.99], [116.0, 115.8], [121.0, 122.71], [124.0, 129.07], [130.0, 131.23], [133.0, 145.74], [147.0, 147.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 81.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 0.0, 99.87, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 50.65], ["boing", 26.74], ["sidetone", 3.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.61, 1.19, 1.47, 2.75, 0.32, 0.82, 0.72, 0.38, 1.05, 0.11, 3.09, 0.96, 0.06, 1.83, -0.06, 1.69, 1.09, 0.88, 3.0, 0.1, 0.42, 0.04, 11.53, 1.16, 0.25, 1.38, 0.11, -0.01, -0.2, 1.71, 5.07, 1.23, 12.74, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/eOYwXi0B6KQ_filtered.json b/annotations_filtered/eOYwXi0B6KQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53b6aa3747b3ba2c169fbcc8178e22e9f9840584 --- /dev/null +++ b/annotations_filtered/eOYwXi0B6KQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.85], [14.0, 14.37], [15.0, 24.93], [27.0, 27.06], [35.0, 36.46], [39.0, 39.9], [42.0, 42.65], [47.0, 48.47], [54.0, 54.35], [56.0, 64.32], [67.0, 72.01], [74.0, 76.23], [81.0, 81.48], [82.0, 87.54], [89.0, 89.09], [91.0, 108.82], [113.0, 130.11], [132.0, 137.81], [140.0, 140.1]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [34.65, 0.0, 34.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.55, 34.89, 38.84, 0.0, 78.04, 0.0, 47.46, 35.91, 41.89, 0.0], "audiomae_on_audioset": [[["music", 45.57], ["speech", 14.78], ["music of latin america", 4.79]], null, [["music", 49.47], ["didgeridoo", 5.9], ["throbbing", 4.44]], null, null, null, null, null, null, [["music", 68.26], ["speech", 5.3], ["boing", 5.26]], [["music", 55.63], ["fly, housefly", 9.64], ["insect", 7.67]], [["speech", 52.53], ["thunk", 9.75], ["whack, thwack", 5.85]], null, null, null, [["music", 68.36], ["boing", 7.18], ["synthesizer", 4.1]], [["music", 51.36], ["didgeridoo", 11.29], ["speech", 9.24]], [["speech", 62.57], ["whack, thwack", 27.35], ["groan", 1.82]], null], "duration": [4.85, 0.37, 9.93, 0.06, 1.46, 0.9, 0.65, 1.47, 0.35, 8.32, 5.01, 2.23, 0.48, 5.54, 0.09, 17.82, 17.11, 5.81, 0.1]} \ No newline at end of file diff --git a/annotations_filtered/eOcimzsviFA_filtered.json b/annotations_filtered/eOcimzsviFA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b364a00f00464d804648aea7cb1e92fb034b32b8 --- /dev/null +++ b/annotations_filtered/eOcimzsviFA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.67], [15.0, 15.52], [18.0, 19.4], [21.0, 23.38], [26.0, 27.28], [29.0, 30.18], [35.0, 36.1], [37.0, 39.56], [52.0, 52.76], [54.0, 55.59], [61.0, 61.82], [65.0, 66.65], [68.0, 71.37], [74.0, 74.95], [76.0, 77.18], [81.0, 82.54], [85.0, 85.38], [88.0, 88.82], [96.0, 96.85], [103.0, 103.71], [105.0, 105.71], [107.0, 108.58], [113.0, 113.36], [115.0, 116.28], [118.0, 118.57], [121.0, 122.0], [125.0, 127.2], [130.0, 131.46], [133.0, 133.47], [136.0, 137.42], [140.0, 140.66], [143.0, 145.23], [150.0, 150.57], [152.0, 153.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 85.35, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.67, 0.52, 1.4, 2.38, 1.28, 1.18, 1.1, 2.56, 0.76, 1.59, 0.82, 1.65, 3.37, 0.95, 1.18, 1.54, 0.38, 0.82, 0.85, 0.71, 0.71, 1.58, 0.36, 1.28, 0.57, 1.0, 2.2, 1.46, 0.47, 1.42, 0.66, 2.23, 0.57, 1.25]} \ No newline at end of file diff --git a/annotations_filtered/eOdZMwIh1I8_filtered.json b/annotations_filtered/eOdZMwIh1I8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7bc882b1b5077f40a48b6cbb90ee6cfc630e384 --- /dev/null +++ b/annotations_filtered/eOdZMwIh1I8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.31], [29.0, 31.26], [33.0, 33.47], [34.0, 34.35], [36.0, 36.46], [38.0, 38.1], [41.0, 41.0], [43.0, 43.34], [44.0, 45.55], [50.0, 50.99], [52.0, 52.86], [53.0, 54.08], [55.0, 55.49], [56.0, 59.36], [61.0, 62.38], [63.0, 63.44], [65.0, 65.28], [71.0, 72.08], [75.0, 75.47], [79.0, 78.73], [86.0, 86.98], [93.0, 92.75], [97.0, 98.66], [104.0, 103.89], [109.0, 112.94], [114.0, 118.66], [120.0, 121.47], [122.0, 124.21], [125.0, 128.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 48.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.46, 48.35, 0.0, 52.74, 56.63], "audiomae_on_audioset": [null, [["music", 59.01], ["throbbing", 11.53], ["synthesizer", 4.34]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 27.53], ["mains hum", 15.02], ["speech", 6.63]], null, null, null], "duration": [0.31, 2.26, 0.47, 0.35, 0.46, 0.1, 0.0, 0.34, 1.55, 0.99, 0.86, 1.08, 0.49, 3.36, 1.38, 0.44, 0.28, 1.08, 0.47, -0.27, 0.98, -0.25, 1.66, -0.11, 3.94, 4.66, 1.47, 2.21, 3.48]} \ No newline at end of file diff --git a/annotations_filtered/eP52omnnZmg_filtered.json b/annotations_filtered/eP52omnnZmg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb586cecb85e9bde3fb6c4cc3f5f2037dc5ec875 --- /dev/null +++ b/annotations_filtered/eP52omnnZmg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.87], [11.0, 11.2], [14.0, 14.55], [16.0, 16.12], [18.0, 20.02], [21.0, 20.93], [24.0, 26.0], [29.0, 29.52], [40.0, 40.88], [42.0, 42.85], [50.0, 50.95], [64.0, 65.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 55.6, 0.0, 88.83, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.87, 0.2, 0.55, 0.12, 2.02, -0.07, 2.0, 0.52, 0.88, 0.85, 0.95, 1.87]} \ No newline at end of file diff --git a/annotations_filtered/eP7cLId4ocM_filtered.json b/annotations_filtered/eP7cLId4ocM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7682dd8c6ec6160ba27263344c76c5652442d4ef --- /dev/null +++ b/annotations_filtered/eP7cLId4ocM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.84], [23.0, 27.28], [30.0, 37.49], [38.0, 39.19], [41.0, 41.07], [42.0, 46.41], [48.0, 48.36], [49.0, 52.84], [54.0, 62.36], [64.0, 71.54], [72.0, 72.17], [74.0, 79.71], [82.0, 90.86], [93.0, 105.11], [107.0, 109.48], [114.0, 114.27], [116.0, 117.39]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 43.82, 44.43, 0.0, 0.0, 82.97, 0.0, 99.73, 83.34, 74.6, 0.0, 59.96, 99.4, 39.15, 44.12, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 21.49], ["cough", 11.68], ["beatboxing", 5.62]], [["speech", 45.62], ["music", 23.69], ["laughter", 4.67]], null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 48.65], ["insect", 23.4], ["mosquito", 12.5]], [["music", 33.26], ["speech", 16.43], ["livestock, farm animals, working animals", 7.2]], null, null], "duration": [0.84, 4.28, 7.49, 1.19, 0.07, 4.41, 0.36, 3.84, 8.36, 7.54, 0.17, 5.71, 8.86, 12.11, 2.48, 0.27, 1.39]} \ No newline at end of file diff --git a/annotations_filtered/ePRYhNNdzwk_filtered.json b/annotations_filtered/ePRYhNNdzwk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..858eaa9bf7356950e006642325d0535a3ca97a14 --- /dev/null +++ b/annotations_filtered/ePRYhNNdzwk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.53], [9.0, 9.21], [9.0, 11.04], [26.0, 26.62], [28.0, 29.0], [32.0, 36.98], [39.0, 45.0], [55.0, 56.83], [59.0, 60.13], [65.0, 65.82], [66.0, 67.37], [68.0, 68.52], [76.0, 77.14], [79.0, 80.08], [81.0, 81.09], [90.0, 91.1], [91.0, 91.84], [93.0, 94.49], [98.0, 99.05], [103.0, 103.91], [105.0, 105.9], [112.0, 113.07], [114.0, 114.08], [116.0, 116.41], [118.0, 118.69], [120.0, 120.18], [122.0, 125.27]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.55, 0.0, 35.49, 0.0, 0.0, 34.27, 40.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.16], "audiomae_on_audioset": [[["music", 51.21], ["speech", 26.14], ["boing", 10.9]], null, [["music", 51.81], ["didgeridoo", 16.42], ["musical instrument", 4.11]], null, null, [["music", 34.41], ["throbbing", 14.4], ["hum", 10.33]], [["speech", 43.77], ["creak", 15.53], ["radio", 14.06]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 56.47], ["explosion", 13.32], ["burst, pop", 7.35]]], "duration": [5.53, 0.21, 2.04, 0.62, 1.0, 4.98, 6.0, 1.83, 1.13, 0.82, 1.37, 0.52, 1.14, 1.08, 0.09, 1.1, 0.84, 1.49, 1.05, 0.91, 0.9, 1.07, 0.08, 0.41, 0.69, 0.18, 3.27]} \ No newline at end of file diff --git a/annotations_filtered/ePgiRqRIdwg_filtered.json b/annotations_filtered/ePgiRqRIdwg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..185ca67762f000f58275f0ccb8685bff8e3d2272 --- /dev/null +++ b/annotations_filtered/ePgiRqRIdwg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.15], [7.0, 8.7], [11.0, 12.72], [16.0, 16.8], [23.0, 24.6], [33.0, 33.05], [34.0, 35.02], [39.0, 40.26], [42.0, 42.38], [44.0, 44.37], [50.0, 62.8], [80.0, 81.01], [85.0, 85.62], [86.0, 90.26], [91.0, 91.99], [100.0, 101.29], [102.0, 106.57], [107.0, 107.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 31.93, 0.0, 0.0, 49.82, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["a capella", 20.82], ["music", 17.86], ["mantra", 11.94]], null, null, [["speech", 13.96], ["fart", 12.41], ["livestock, farm animals, working animals", 10.53]], null], "duration": [0.15, 1.7, 1.72, 0.8, 1.6, 0.05, 1.02, 1.26, 0.38, 0.37, 12.8, 1.01, 0.62, 4.26, 0.99, 1.29, 4.57, 0.96]} \ No newline at end of file diff --git a/annotations_filtered/ePlb7b2nQm4_filtered.json b/annotations_filtered/ePlb7b2nQm4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00b8df92952021a973833d17e4237cbaeacb55bb --- /dev/null +++ b/annotations_filtered/ePlb7b2nQm4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 14.18], [15.0, 20.7], [26.0, 27.46], [32.0, 33.18], [34.0, 34.75], [39.0, 39.29], [40.0, 41.22], [41.0, 42.67], [43.0, 46.5], [47.0, 51.36], [52.0, 53.72], [56.0, 58.67], [66.0, 66.43], [71.0, 71.32], [72.0, 73.2], [75.0, 76.11], [78.0, 83.2], [84.0, 91.88], [93.0, 97.97], [99.0, 119.96], [121.0, 123.58], [130.0, 131.43], [134.0, 135.36]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [45.95, 64.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.8, 60.7, 0.0, 34.1, 0.0, 0.0, 0.0, 0.0, 47.23, 29.07, 31.15, 29.67, 92.31, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 12.63], ["vehicle", 5.73], ["hum", 5.36]], null, null, null, null, null, null, null, null, null, null, [["speech", 41.26], ["whale vocalization", 11.72], ["music", 6.73]], null, null, null, null, [["fly, housefly", 42.99], ["insect", 28.68], ["bee, wasp, etc.", 17.34]], [["livestock, farm animals, working animals", 30.87], ["cattle, bovinae", 21.41], ["speech", 10.29]], [["speech", 71.72], ["crowd", 7.26], ["outside, urban or manmade", 5.23]], [["music", 27.69], ["hum", 25.08], ["whale vocalization", 13.15]], null, null, null], "duration": [10.18, 5.7, 1.46, 1.18, 0.75, 0.29, 1.22, 1.67, 3.5, 4.36, 1.72, 2.67, 0.43, 0.32, 1.2, 1.11, 5.2, 7.88, 4.97, 20.96, 2.58, 1.43, 1.36]} \ No newline at end of file diff --git a/annotations_filtered/ePtwxRF1WZA_filtered.json b/annotations_filtered/ePtwxRF1WZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5036db55d30df075a7f2676f0928e2dc2982c71c --- /dev/null +++ b/annotations_filtered/ePtwxRF1WZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 16.88], [22.0, 27.55], [30.0, 35.31], [46.0, 52.15], [53.0, 53.81], [56.0, 64.3], [74.0, 77.18], [81.0, 81.82], [83.0, 85.65], [87.0, 97.7], [103.0, 111.92], [115.0, 122.49], [126.0, 136.07], [140.0, 143.23]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [31.18, 30.62, 30.81, 30.35, 0.0, 30.84, 31.32, 0.0, 33.95, 30.58, 30.57, 31.66, 30.51, 32.19], "audiomae_on_audioset": [[["speech", 40.99], ["music", 38.09], ["hum", 2.07]], [["music", 52.82], ["speech", 10.63], ["didgeridoo", 6.47]], [["music", 52.84], ["throbbing", 12.33], ["hum", 12.21]], [["music", 67.96], ["speech", 9.6], ["didgeridoo", 2.38]], null, [["throbbing", 58.34], ["music", 17.84], ["hum", 12.38]], [["throbbing", 30.79], ["music", 29.24], ["hum", 17.99]], null, [["music", 58.65], ["boing", 11.9], ["speech", 4.59]], [["music", 40.84], ["hum", 18.1], ["throbbing", 12.89]], [["music", 63.09], ["speech", 12.15], ["throbbing", 5.39]], [["music", 60.71], ["theremin", 9.5], ["hum", 3.05]], [["music", 33.81], ["throbbing", 21.27], ["speech", 9.01]], [["music", 50.64], ["boing", 11.61], ["throbbing", 7.04]]], "duration": [7.88, 5.55, 5.31, 6.15, 0.81, 8.3, 3.18, 0.82, 2.65, 10.7, 8.92, 7.49, 10.07, 3.23]} \ No newline at end of file diff --git a/annotations_filtered/eQ87hBFrS_I_filtered.json b/annotations_filtered/eQ87hBFrS_I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1535893539195a068efbf27ac7401062261c92e5 --- /dev/null +++ b/annotations_filtered/eQ87hBFrS_I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.64], [12.0, 12.11], [15.0, 15.57], [21.0, 21.78], [27.0, 27.43], [33.0, 34.08], [36.0, 36.26], [37.0, 40.07], [41.0, 41.39], [44.0, 45.22], [49.0, 56.22], [57.0, 57.54], [60.0, 60.62], [64.0, 65.03], [66.0, 67.73], [69.0, 69.35], [79.0, 79.42], [79.0, 79.71], [82.0, 82.54], [83.0, 83.51], [85.0, 85.45], [88.0, 88.67], [91.0, 96.48], [105.0, 114.22], [129.0, 136.38], [139.0, 138.94], [146.0, 146.42], [147.0, 148.09], [153.0, 153.79], [155.0, 157.77], [160.0, 162.8], [164.0, 164.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.15, 0.0, 0.0, 37.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.73, 30.23, 32.13, 0.0, 0.0, 0.0, 0.0, 36.09, 33.4, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["hum", 45.93], ["mains hum", 15.29], ["throbbing", 9.36]], null, null, null, null, null, null, null, null, null, null, null, [["music", 50.33], ["hum", 5.31], ["bee, wasp, etc.", 4.69]], [["music", 52.7], ["mains hum", 19.54], ["hum", 11.27]], [["mains hum", 48.21], ["hum", 23.43], ["music", 9.49]], null, null, null, null, [["speech", 44.47], ["sheep", 6.68], ["animal", 6.34]], [["music", 52.53], ["theremin", 27.83], ["musical instrument", 5.76]], null], "duration": [1.64, 0.11, 0.57, 0.78, 0.43, 1.08, 0.26, 3.07, 0.39, 1.22, 7.22, 0.54, 0.62, 1.03, 1.73, 0.35, 0.42, 0.71, 0.54, 0.51, 0.45, 0.67, 5.48, 9.22, 7.38, -0.06, 0.42, 1.09, 0.79, 2.77, 2.8, 0.81]} \ No newline at end of file diff --git a/annotations_filtered/eQ9HJXZI_qU_filtered.json b/annotations_filtered/eQ9HJXZI_qU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c165c548b84c80bc94ed98bed966835f038997b4 --- /dev/null +++ b/annotations_filtered/eQ9HJXZI_qU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.29], [10.0, 11.06], [12.0, 14.93], [18.0, 18.55], [20.0, 21.1], [23.0, 23.77], [26.0, 27.13], [28.0, 29.08], [31.0, 33.2], [34.0, 35.8], [38.0, 39.36], [42.0, 43.11], [47.0, 47.68], [49.0, 49.67], [53.0, 58.31], [60.0, 65.33], [66.0, 69.11], [72.0, 73.18], [77.0, 77.5], [81.0, 81.55], [83.0, 83.67], [85.0, 86.48], [87.0, 87.45], [88.0, 89.38], [99.0, 99.66], [102.0, 103.38], [105.0, 105.88], [109.0, 108.78], [111.0, 112.99], [114.0, 114.61], [118.0, 118.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [60.89, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.29, 1.06, 2.93, 0.55, 1.1, 0.77, 1.13, 1.08, 2.2, 1.8, 1.36, 1.11, 0.68, 0.67, 5.31, 5.33, 3.11, 1.18, 0.5, 0.55, 0.67, 1.48, 0.45, 1.38, 0.66, 1.38, 0.88, -0.22, 1.99, 0.61, 0.96]} \ No newline at end of file diff --git a/annotations_filtered/eQSqgubHzn0_filtered.json b/annotations_filtered/eQSqgubHzn0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66b722f4e4af1395e709e71fb2852958a3413a7c --- /dev/null +++ b/annotations_filtered/eQSqgubHzn0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[79.0, 112.51], [114.0, 114.94]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [33.51, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/eRITzdlHJXA_filtered.json b/annotations_filtered/eRITzdlHJXA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..009ed5fea152d0aed481e2435c690c95131719a4 --- /dev/null +++ b/annotations_filtered/eRITzdlHJXA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.15], [15.0, 15.89], [16.0, 19.5], [26.0, 26.59], [31.0, 31.9], [33.0, 33.57], [35.0, 36.76], [37.0, 39.48], [48.0, 48.47], [50.0, 51.65], [56.0, 56.51], [58.0, 60.13], [66.0, 66.48], [71.0, 71.69], [80.0, 81.18]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 39.52, 0.0, 0.0, 0.0, 0.0, 39.69, 0.0, 0.0, 0.0, 37.84, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 29.64], ["music", 28.48], ["rumble", 6.87]], null, null, null, null, [["speech", 42.1], ["music", 12.7], ["mains hum", 6.24]], null, null, null, [["music", 44.86], ["scary music", 8.8], ["speech", 5.43]], null, null, null], "duration": [0.15, 0.89, 3.5, 0.59, 0.9, 0.57, 1.76, 2.48, 0.47, 1.65, 0.51, 2.13, 0.48, 0.69, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/eRNCIg86DKs_filtered.json b/annotations_filtered/eRNCIg86DKs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52f06c6cfb1b9dfd7dc253513be7ec8ec23ba8d9 --- /dev/null +++ b/annotations_filtered/eRNCIg86DKs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.0], [6.0, 6.99], [8.0, 8.13], [15.0, 14.89], [17.0, 17.98], [19.0, 20.41], [21.0, 22.27], [23.0, 24.48], [26.0, 27.85], [43.0, 43.55], [44.0, 44.74], [57.0, 57.72], [60.0, 60.13], [61.0, 61.72], [62.0, 63.56], [65.0, 65.6], [67.0, 67.05], [69.0, 69.38], [72.0, 72.45], [75.0, 76.11], [78.0, 79.56], [80.0, 81.77], [83.0, 83.96], [87.0, 87.64], [90.0, 90.19], [94.0, 94.46], [95.0, 96.16], [99.0, 100.79], [102.0, 102.42], [107.0, 107.6], [110.0, 110.2], [118.0, 118.72], [126.0, 126.27], [127.0, 127.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.0, 0.99, 0.13, -0.11, 0.98, 1.41, 1.27, 1.48, 1.85, 0.55, 0.74, 0.72, 0.13, 0.72, 1.56, 0.6, 0.05, 0.38, 0.45, 1.11, 1.56, 1.77, 0.96, 0.64, 0.19, 0.46, 1.16, 1.79, 0.42, 0.6, 0.2, 0.72, 0.27, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/eR_BcTP8HOM_filtered.json b/annotations_filtered/eR_BcTP8HOM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37f8fb6c209cab450b347f6534decf2f8752115c --- /dev/null +++ b/annotations_filtered/eR_BcTP8HOM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.56], [9.0, 10.56], [13.0, 13.04], [13.0, 16.7], [17.0, 16.73], [19.0, 25.02], [34.0, 35.13], [37.0, 47.09], [52.0, 53.3], [64.0, 63.68], [66.0, 67.04], [68.0, 69.08], [75.0, 76.69], [80.0, 80.81], [87.0, 88.89], [89.0, 91.67], [97.0, 97.23], [103.0, 102.96], [124.0, 124.36], [128.0, 128.48], [131.0, 130.91]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.03, 0.0, 96.66, 0.0, 73.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.74, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["cattle, bovinae", 25.65], ["moo", 15.86], ["livestock, farm animals, working animals", 14.7]], null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 36.15], ["insect", 35.14], ["bee, wasp, etc.", 9.82]], null, null, null, null, null], "duration": [1.56, 1.56, 0.04, 3.7, -0.27, 6.02, 1.13, 10.09, 1.3, -0.32, 1.04, 1.08, 1.69, 0.81, 1.89, 2.67, 0.23, -0.04, 0.36, 0.48, -0.09]} \ No newline at end of file diff --git a/annotations_filtered/eRqgQiBel8I_filtered.json b/annotations_filtered/eRqgQiBel8I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1a5b57ecffde293f61f43db1525824ddb625431 --- /dev/null +++ b/annotations_filtered/eRqgQiBel8I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.55], [8.0, 14.79], [18.0, 28.63], [29.0, 30.5], [31.0, 32.73], [34.0, 34.45], [37.0, 36.88], [40.0, 43.77], [46.0, 45.94], [46.0, 46.87], [47.0, 50.3], [55.0, 55.46], [57.0, 62.04], [65.0, 68.98], [69.0, 82.26], [84.0, 92.99], [93.0, 146.84], [148.0, 153.13]], "keep_status": [false, true, true, false, false, false, false, true, false, false, true, false, true, false, true, false, false, false], "silence_prob": [0.0, 38.15, 32.56, 0.0, 0.0, 0.0, 0.0, 45.78, 0.0, 0.0, 44.34, 0.0, 34.19, 39.12, 37.08, 99.1, 0.0, 86.64], "audiomae_on_audioset": [null, [["speech", 17.11], ["livestock, farm animals, working animals", 16.84], ["cattle, bovinae", 8.26]], [["hum", 29.48], ["mains hum", 24.21], ["speech", 12.21]], null, null, null, null, [["speech", 35.02], ["hum", 12.65], ["music", 10.22]], null, null, [["speech", 24.91], ["hum", 24.0], ["rumble", 9.54]], null, [["fly, housefly", 28.46], ["insect", 21.72], ["bee, wasp, etc.", 13.84]], [["music", 68.92], ["scary music", 4.39], ["didgeridoo", 3.66]], [["buzz", 18.97], ["sound effect", 14.61], ["music", 9.04]], null, null, null], "duration": [1.55, 6.79, 10.63, 1.5, 1.73, 0.45, -0.12, 3.77, -0.06, 0.87, 3.3, 0.46, 5.04, 3.98, 13.26, 8.99, 53.84, 5.13]} \ No newline at end of file diff --git a/annotations_filtered/eS47L5yU2k8_filtered.json b/annotations_filtered/eS47L5yU2k8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d71f2854e7962779cd32776a4118f959f4d27a18 --- /dev/null +++ b/annotations_filtered/eS47L5yU2k8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.51], [8.0, 8.87], [12.0, 12.18], [14.0, 14.61], [18.0, 18.49], [26.0, 25.88], [27.0, 28.12], [28.0, 32.51], [34.0, 34.05], [37.0, 37.76], [40.0, 41.91], [46.0, 46.52], [56.0, 57.92], [61.0, 63.75], [65.0, 67.05], [67.0, 68.62], [81.0, 89.94], [95.0, 95.72]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.36, 0.0, 0.0, 0.0, 0.0, 0.0, 60.79, 52.51, 0.0, 40.19, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 53.82], ["coin (dropping)", 12.62], ["synthesizer", 3.09]], null, null, null, null, null, null, null, null, [["hum", 36.57], ["mains hum", 21.91], ["music", 15.03]], null], "duration": [0.51, 0.87, 0.18, 0.61, 0.49, -0.12, 1.12, 4.51, 0.05, 0.76, 1.91, 0.52, 1.92, 2.75, 2.05, 1.62, 8.94, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/eSBnFu1YnrU_filtered.json b/annotations_filtered/eSBnFu1YnrU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ce4e8aa920a265343898a87134ee385854c857f --- /dev/null +++ b/annotations_filtered/eSBnFu1YnrU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.57], [13.0, 15.85], [19.0, 19.65], [21.0, 22.05], [25.0, 26.42], [33.0, 34.77], [39.0, 40.61], [42.0, 42.47], [46.0, 47.9], [49.0, 50.45], [53.0, 57.16], [60.0, 61.72], [63.0, 64.4], [69.0, 70.6], [72.0, 73.58], [74.0, 76.1], [77.0, 81.84], [84.0, 84.96], [90.0, 90.85], [92.0, 93.78], [95.0, 96.13], [98.0, 99.5], [100.0, 105.61], [106.0, 106.64], [108.0, 109.05], [112.0, 112.55], [113.0, 114.3], [115.0, 115.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 0.0, 0.0, 75.39, 83.52, 0.0, 0.0, 0.0, 0.0, 0.0, 90.08, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.57, 2.85, 0.65, 1.05, 1.42, 1.77, 1.61, 0.47, 1.9, 1.45, 4.16, 1.72, 1.4, 1.6, 1.58, 2.1, 4.84, 0.96, 0.85, 1.78, 1.13, 1.5, 5.61, 0.64, 1.05, 0.55, 1.3, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/eSYNuO9GTU4_filtered.json b/annotations_filtered/eSYNuO9GTU4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..566850918d881bf7bafe3f84fa8ef2db407b7eac --- /dev/null +++ b/annotations_filtered/eSYNuO9GTU4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 34.4], [38.0, 37.93], [38.0, 47.39], [49.0, 51.44], [53.0, 58.23], [59.0, 59.58], [63.0, 70.46], [71.0, 91.0], [92.0, 93.41]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 79.94, 93.76, 97.33, 0.0, 95.37, 51.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.4, -0.07, 9.39, 2.44, 5.23, 0.58, 7.46, 20.0, 1.41]} \ No newline at end of file diff --git a/annotations_filtered/eSeYw5yaU9A_filtered.json b/annotations_filtered/eSeYw5yaU9A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94959f3cf93d4aa7df3726aa99f57fa17a5d13cc --- /dev/null +++ b/annotations_filtered/eSeYw5yaU9A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.24], [7.0, 8.4], [24.0, 24.75], [33.0, 33.62], [37.0, 36.78], [49.0, 62.95], [64.0, 65.01], [69.0, 69.92], [76.0, 76.11], [78.0, 79.22], [84.0, 85.89], [100.0, 103.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.24, 1.4, 0.75, 0.62, -0.22, 13.95, 1.01, 0.92, 0.11, 1.22, 1.89, 3.49]} \ No newline at end of file diff --git a/annotations_filtered/eSm68IEDDT0_filtered.json b/annotations_filtered/eSm68IEDDT0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9487066939675dbfb9ab3742aaab0bb9773a9fb --- /dev/null +++ b/annotations_filtered/eSm68IEDDT0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.2], [4.0, 4.75], [6.0, 7.52], [9.0, 10.61], [13.0, 17.79], [18.0, 27.04], [30.0, 31.58], [33.0, 34.32], [40.0, 43.12], [45.0, 49.25], [50.0, 56.19], [58.0, 63.49], [65.0, 80.03], [83.0, 83.81], [84.0, 88.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 54.63, 0.0, 0.0, 98.44, 60.6, 38.09, 31.04, 97.33, 0.0, 99.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 25.34], ["hum", 9.96], ["mains hum", 4.37]], [["music", 28.93], ["hum", 11.73], ["mains hum", 8.13]], null, null, null], "duration": [1.2, 0.75, 1.52, 1.61, 4.79, 9.04, 1.58, 1.32, 3.12, 4.25, 6.19, 5.49, 15.03, 0.81, 4.06]} \ No newline at end of file diff --git a/annotations_filtered/eT5XhG7qLcU_filtered.json b/annotations_filtered/eT5XhG7qLcU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e21b8817bf6f86891919c9df0c1f6b53900c26d --- /dev/null +++ b/annotations_filtered/eT5XhG7qLcU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 52.3], [54.0, 57.35], [58.0, 76.79], [78.0, 124.71]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 54.83, 46.54, 0.0], "audiomae_on_audioset": [null, null, [["music", 62.51], ["livestock, farm animals, working animals", 5.01], ["bleat", 4.81]], null], "duration": [45.3, 3.35, 18.79, 46.71]} \ No newline at end of file diff --git a/annotations_filtered/eTVHMQb2OyU_filtered.json b/annotations_filtered/eTVHMQb2OyU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad53309242addc3014f4125b7cf285ee0c7aac66 --- /dev/null +++ b/annotations_filtered/eTVHMQb2OyU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.3], [5.0, 5.29], [10.0, 12.26], [15.0, 28.71], [42.0, 43.33], [46.0, 46.53], [48.0, 47.92], [49.0, 53.81], [55.0, 55.32], [62.0, 63.46], [66.0, 68.99], [70.0, 70.82], [74.0, 82.21], [86.0, 91.72], [92.0, 91.89], [92.0, 91.96], [92.0, 94.15], [96.0, 96.9], [98.0, 98.63], [99.0, 98.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 30.25, 30.37, 0.0, 0.0, 0.0, 42.74, 0.0, 0.0, 44.49, 0.0, 86.27, 40.38, 0.0, 0.0, 37.57, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 34.81], ["livestock, farm animals, working animals", 33.98], ["moo", 20.14]], [["livestock, farm animals, working animals", 37.04], ["cattle, bovinae", 30.23], ["moo", 20.8]], null, null, null, [["whale vocalization", 49.3], ["livestock, farm animals, working animals", 15.27], ["moo", 14.22]], null, null, [["radio", 57.78], ["speech", 26.24], ["sidetone", 6.83]], null, null, [["speech", 44.33], ["music", 14.79], ["hum", 5.16]], null, null, [["music", 29.32], ["fart", 12.56], ["foghorn", 8.46]], null, null, null], "duration": [1.3, 0.29, 2.26, 13.71, 1.33, 0.53, -0.08, 4.81, 0.32, 1.46, 2.99, 0.82, 8.21, 5.72, -0.11, -0.04, 2.15, 0.9, 0.63, -0.29]} \ No newline at end of file diff --git a/annotations_filtered/eTeBFTlR0VI_filtered.json b/annotations_filtered/eTeBFTlR0VI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce5d88e1349083d82b6d646398421c4e70e7a784 --- /dev/null +++ b/annotations_filtered/eTeBFTlR0VI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 25.1], [26.0, 32.71], [34.0, 47.95], [48.0, 79.3], [80.0, 91.42], [94.0, 94.69], [98.0, 113.71], [115.0, 116.19], [118.0, 124.66], [126.0, 137.05], [139.0, 142.11], [143.0, 142.94]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [41.76, 39.83, 31.17, 0.0, 64.07, 0.0, 95.37, 0.0, 99.87, 99.9, 99.93, 0.0], "audiomae_on_audioset": [[["whale vocalization", 58.08], ["speech", 13.7], ["music", 11.86]], [["music", 32.98], ["grunt", 29.34], ["scary music", 10.54]], [["music", 45.06], ["buzz", 4.92], ["speech", 3.63]], null, null, null, null, null, null, null, null, null], "duration": [4.1, 6.71, 13.95, 31.3, 11.42, 0.69, 15.71, 1.19, 6.66, 11.05, 3.11, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/eTepvIyKhIo_filtered.json b/annotations_filtered/eTepvIyKhIo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..549e313637fe74765937a54ec6216a1c79dc5ed7 --- /dev/null +++ b/annotations_filtered/eTepvIyKhIo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.26], [6.0, 8.24], [10.0, 20.04], [24.0, 34.77], [36.0, 83.17], [86.0, 88.72], [89.0, 162.87]], "keep_status": [false, false, true, true, false, true, false], "silence_prob": [0.0, 94.22, 42.39, 34.33, 0.0, 35.84, 0.0], "audiomae_on_audioset": [null, null, [["music", 37.07], ["speech", 24.93], ["hum", 5.04]], [["music", 21.04], ["rumble", 14.08], ["sonar", 6.84]], null, [["speech", 30.36], ["sidetone", 25.65], ["music", 13.69]], null], "duration": [1.26, 2.24, 10.04, 10.77, 47.17, 2.72, 73.87]} \ No newline at end of file diff --git a/annotations_filtered/eU4-wIieuWU_filtered.json b/annotations_filtered/eU4-wIieuWU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ade88518da8669469005def5dded8e58cfcc1b3a --- /dev/null +++ b/annotations_filtered/eU4-wIieuWU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.88], [13.0, 13.91], [18.0, 18.86], [20.0, 20.38], [23.0, 23.84], [27.0, 27.01], [33.0, 34.21], [35.0, 35.9], [37.0, 37.22], [40.0, 41.0], [47.0, 47.41], [52.0, 53.67], [56.0, 56.39], [60.0, 60.24], [64.0, 67.8], [72.0, 73.38], [75.0, 76.62], [80.0, 80.7], [85.0, 85.5], [87.0, 87.18], [92.0, 93.36], [100.0, 103.01], [103.0, 104.38], [109.0, 110.22], [114.0, 117.85], [120.0, 120.34], [123.0, 123.26], [125.0, 125.81], [128.0, 128.16], [130.0, 130.79], [133.0, 134.4], [140.0, 140.53], [143.0, 144.05], [148.0, 149.12], [154.0, 155.68], [157.0, 157.96], [159.0, 163.38], [165.0, 165.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.57, 0.0, 0.0, 76.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.59, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.88, 0.91, 0.86, 0.38, 0.84, 0.01, 1.21, 0.9, 0.22, 1.0, 0.41, 1.67, 0.39, 0.24, 3.8, 1.38, 1.62, 0.7, 0.5, 0.18, 1.36, 3.01, 1.38, 1.22, 3.85, 0.34, 0.26, 0.81, 0.16, 0.79, 1.4, 0.53, 1.05, 1.12, 1.68, 0.96, 4.38, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/eUNWIKp6nR4_filtered.json b/annotations_filtered/eUNWIKp6nR4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92e07c9c06075e3655c52a8d17dceb42e84ddd39 --- /dev/null +++ b/annotations_filtered/eUNWIKp6nR4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 21.64], [34.0, 34.77], [39.0, 40.74], [47.0, 56.13], [57.0, 62.26], [66.0, 67.98], [76.0, 77.58], [79.0, 79.44], [80.0, 82.14], [84.0, 84.27], [86.0, 87.02], [89.0, 89.7], [93.0, 93.95], [95.0, 98.42], [100.0, 100.62], [102.0, 102.86], [106.0, 106.81], [108.0, 110.05], [111.0, 112.99], [115.0, 116.6], [118.0, 118.69]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.41, 0.0, 0.0, 54.04, 68.67, 0.0, 0.0, 0.0, 71.14, 0.0, 0.0, 0.0, 0.0, 74.76, 0.0, 0.0, 0.0, 98.19, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 45.45], ["crowd", 11.87], ["applause", 11.23]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.64, 0.77, 1.74, 9.13, 5.26, 1.98, 1.58, 0.44, 2.14, 0.27, 1.02, 0.7, 0.95, 3.42, 0.62, 0.86, 0.81, 2.05, 1.99, 1.6, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/eUogxXRPC7E_filtered.json b/annotations_filtered/eUogxXRPC7E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bdee989d55bcaffb73827bfbafebbd41408711bc --- /dev/null +++ b/annotations_filtered/eUogxXRPC7E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.12], [11.0, 10.54], [11.0, 20.19], [27.0, 27.68], [29.0, 30.15], [42.0, 42.92], [45.0, 45.89], [46.0, 46.57], [48.0, 48.03], [52.0, 84.82], [85.0, 86.04], [87.0, 89.06], [90.0, 103.76], [107.0, 111.75]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 99.62, 99.73], "audiomae_on_audioset": [null, null, [["music", 56.68], ["didgeridoo", 8.57], ["cattle, bovinae", 4.55]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.12, -0.46, 9.19, 0.68, 1.15, 0.92, 0.89, 0.57, 0.03, 32.82, 1.04, 2.06, 13.76, 4.75]} \ No newline at end of file diff --git a/annotations_filtered/eVJhlVgr9lM_filtered.json b/annotations_filtered/eVJhlVgr9lM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8eb1b913449a270be5a22f1a3d2daeee9d9e7987 --- /dev/null +++ b/annotations_filtered/eVJhlVgr9lM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 8.92], [10.0, 89.55]], "keep_status": [false, false], "silence_prob": [99.92, 0.0], "audiomae_on_audioset": [null, null], "duration": [7.92, 79.55]} \ No newline at end of file diff --git a/annotations_filtered/eVUsVW87kSk_filtered.json b/annotations_filtered/eVUsVW87kSk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74c9aef2f4ce6ea69a7ee0c7821491c75221a087 --- /dev/null +++ b/annotations_filtered/eVUsVW87kSk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 101.65], [102.0, 122.25], [125.0, 125.58], [127.0, 128.34]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 55.11, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [98.65, 20.25, 0.58, 1.34]} \ No newline at end of file diff --git a/annotations_filtered/eVarVWL4PwA_filtered.json b/annotations_filtered/eVarVWL4PwA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e4798c27c0db1183130e3d0b6349492d7144139 --- /dev/null +++ b/annotations_filtered/eVarVWL4PwA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 32.41], [34.0, 36.64], [37.0, 37.52], [39.0, 40.71], [44.0, 48.47], [50.0, 63.56], [64.0, 70.56], [75.0, 76.57]], "keep_status": [false, false, false, false, false, true, true, false], "silence_prob": [0.0, 73.97, 0.0, 0.0, 70.58, 48.23, 36.35, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 14.14], ["noise", 13.47], ["music", 11.44]], [["gong", 21.48], ["hum", 14.66], ["speech", 11.07]], null], "duration": [0.41, 2.64, 0.52, 1.71, 4.47, 13.56, 6.56, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/eVmYZJQxawo_filtered.json b/annotations_filtered/eVmYZJQxawo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa0d37ad54fb13933612d683eca5a7c536438067 --- /dev/null +++ b/annotations_filtered/eVmYZJQxawo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 28.85], [36.0, 36.53], [37.0, 37.61], [47.0, 48.24], [50.0, 49.77], [51.0, 64.83], [66.0, 88.37], [96.0, 97.04], [98.0, 105.21], [112.0, 118.3], [123.0, 134.76], [136.0, 137.83], [145.0, 146.72], [153.0, 181.8], [187.0, 186.8]], "keep_status": [true, false, false, false, false, true, false, false, true, true, true, false, false, false, false], "silence_prob": [30.72, 0.0, 0.0, 0.0, 0.0, 29.89, 30.21, 0.0, 30.0, 33.3, 32.44, 0.0, 0.0, 29.52, 0.0], "audiomae_on_audioset": [[["music", 43.36], ["speech", 15.65], ["didgeridoo", 8.12]], null, null, null, null, [["music", 39.17], ["breaking", 18.45], ["hum", 5.3]], [["music", 49.69], ["theremin", 27.76], ["musical instrument", 2.8]], null, [["music", 46.68], ["speech", 7.56], ["throbbing", 7.36]], [["music", 46.23], ["foghorn", 8.76], ["didgeridoo", 6.03]], [["music", 25.08], ["moo", 13.72], ["cattle, bovinae", 12.34]], null, null, [["music", 89.22], ["musical instrument", 2.26], ["brass instrument", 1.17]], null], "duration": [25.85, 0.53, 0.61, 1.24, -0.23, 13.83, 22.37, 1.04, 7.21, 6.3, 11.76, 1.83, 1.72, 28.8, -0.2]} \ No newline at end of file diff --git a/annotations_filtered/eVzxDwu506A_filtered.json b/annotations_filtered/eVzxDwu506A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a3dafb2e935dee27bc887101157ea30679c020a --- /dev/null +++ b/annotations_filtered/eVzxDwu506A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.18], [23.0, 23.73], [33.0, 33.98], [35.0, 34.94], [44.0, 47.31], [50.0, 57.86], [58.0, 59.91], [63.0, 62.78], [63.0, 62.83], [65.0, 91.18], [92.0, 94.17], [96.0, 101.17], [104.0, 107.97], [108.0, 110.81], [115.0, 115.65]], "keep_status": [false, false, false, false, true, false, false, false, false, true, true, true, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 28.92, 29.18, 0.0, 0.0, 0.0, 28.89, 44.81, 30.15, 31.07, 44.63, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 50.86], ["horse", 9.33], ["music", 9.21]], [["music", 56.31], ["speech", 14.22], ["smash, crash", 2.84]], null, null, null, [["music", 24.84], ["speech", 19.02], ["livestock, farm animals, working animals", 14.92]], [["throbbing", 16.82], ["noise", 12.4], ["hum", 5.69]], [["breaking", 24.97], ["car alarm", 17.56], ["cattle, bovinae", 11.66]], [["speech", 18.76], ["whack, thwack", 14.26], ["explosion", 7.08]], [["noise", 19.93], ["speech", 13.11], ["sidetone", 10.68]], null], "duration": [0.18, 0.73, 0.98, -0.06, 3.31, 7.86, 1.91, -0.22, -0.17, 26.18, 2.17, 5.17, 3.97, 2.81, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/eWL0obbYYOE_filtered.json b/annotations_filtered/eWL0obbYYOE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a13a5cfbc8224d7ef14bd6b38f807e03b6931a5 --- /dev/null +++ b/annotations_filtered/eWL0obbYYOE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.62], [4.0, 4.92], [6.0, 6.74], [11.0, 10.84], [15.0, 15.38], [16.0, 20.61], [26.0, 26.5], [56.0, 56.67], [61.0, 61.96], [73.0, 74.65], [83.0, 82.98], [84.0, 84.32], [91.0, 93.7], [96.0, 96.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 0.92, 0.74, -0.16, 0.38, 4.61, 0.5, 0.67, 0.96, 1.65, -0.02, 0.32, 2.7, 0.06]} \ No newline at end of file diff --git a/annotations_filtered/eWP8JMcy3O0_filtered.json b/annotations_filtered/eWP8JMcy3O0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cbae7e77b1ef787ee8f9771b237a32a085449a97 --- /dev/null +++ b/annotations_filtered/eWP8JMcy3O0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.71], [7.0, 11.92], [21.0, 20.98], [24.0, 24.09], [28.0, 28.7], [29.0, 31.13], [32.0, 33.22], [38.0, 39.24], [45.0, 45.37], [51.0, 51.65], [53.0, 54.43], [55.0, 55.46], [59.0, 61.96], [63.0, 64.59], [67.0, 68.44], [70.0, 70.6], [77.0, 77.58], [79.0, 79.64], [87.0, 88.5], [96.0, 96.8], [100.0, 100.4], [105.0, 105.54], [109.0, 109.44], [116.0, 116.88], [117.0, 126.84], [131.0, 132.22], [134.0, 134.5], [135.0, 135.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.91, 0.0, 0.0, 0.0, 66.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.22, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["wail, moan", 81.33], ["gasp", 5.07], ["speech", 3.37]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 74.6], ["beatboxing", 12.33], ["music", 3.68]], null, null, null], "duration": [0.71, 4.92, -0.02, 0.09, 0.7, 2.13, 1.22, 1.24, 0.37, 0.65, 1.43, 0.46, 2.96, 1.59, 1.44, 0.6, 0.58, 0.64, 1.5, 0.8, 0.4, 0.54, 0.44, 0.88, 9.84, 1.22, 0.5, 0.04]} \ No newline at end of file diff --git a/annotations_filtered/eWgOjuLg5oY_filtered.json b/annotations_filtered/eWgOjuLg5oY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb60c80e3b7991f78cb58710942c19d90bb39760 --- /dev/null +++ b/annotations_filtered/eWgOjuLg5oY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.97], [16.0, 17.29], [20.0, 25.95], [27.0, 71.51], [73.0, 75.47], [77.0, 78.11], [82.0, 83.0], [85.0, 88.92], [90.0, 93.14], [94.0, 95.2], [96.0, 97.61], [99.0, 98.86], [101.0, 101.51], [102.0, 106.2], [111.0, 110.73], [111.0, 125.2], [127.0, 127.68], [128.0, 127.75], [128.0, 132.24], [135.0, 136.22], [137.0, 138.54], [142.0, 149.22], [151.0, 151.48], [155.0, 154.99], [157.0, 159.09], [160.0, 164.42], [169.0, 179.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 51.02, 0.0, 99.93, 0.0, 0.0, 100.0, 98.99, 0.0, 0.0, 0.0, 0.0, 79.59, 0.0, 59.96, 0.0, 0.0, 99.59, 0.0, 0.0, 97.22, 0.0, 0.0, 99.16, 47.31, 44.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 51.79], ["speech", 11.84], ["theremin", 10.47]], [["music", 79.47], ["theremin", 7.32], ["musical instrument", 2.29]]], "duration": [0.97, 1.29, 5.95, 44.51, 2.47, 1.11, 1.0, 3.92, 3.14, 1.2, 1.61, -0.14, 0.51, 4.2, -0.27, 14.2, 0.68, -0.25, 4.24, 1.22, 1.54, 7.22, 0.48, -0.01, 2.09, 4.42, 10.15]} \ No newline at end of file diff --git a/annotations_filtered/eWirsPiHnA0_filtered.json b/annotations_filtered/eWirsPiHnA0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b583d6545ff00b185a266286da797ff2075457f --- /dev/null +++ b/annotations_filtered/eWirsPiHnA0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 12.51], [14.0, 15.21], [16.0, 16.44], [19.0, 38.5], [41.0, 50.52], [54.0, 58.51], [60.0, 68.32], [69.0, 75.2], [78.0, 78.06], [80.0, 87.96], [91.0, 101.61], [103.0, 106.19], [109.0, 130.5], [131.0, 165.18]], "keep_status": [true, false, false, true, true, false, false, true, false, false, false, false, false, false], "silence_prob": [35.05, 0.0, 0.0, 40.24, 37.45, 97.0, 95.51, 34.25, 0.0, 95.91, 35.59, 66.27, 40.5, 0.0], "audiomae_on_audioset": [[["speech", 15.31], ["explosion", 11.82], ["whack, thwack", 10.96]], null, null, [["speech", 56.14], ["animal", 5.3], ["explosion", 4.13]], [["speech", 58.22], ["gunshot, gunfire", 5.96], ["explosion", 4.55]], null, null, [["music", 39.36], ["speech", 10.25], ["gunshot, gunfire", 7.22]], null, null, [["glass", 40.67], ["breaking", 21.21], ["music", 12.35]], null, [["speech", 68.47], ["music", 11.93], ["explosion", 2.01]], null], "duration": [6.51, 1.21, 0.44, 19.5, 9.52, 4.51, 8.32, 6.2, 0.06, 7.96, 10.61, 3.19, 21.5, 34.18]} \ No newline at end of file diff --git a/annotations_filtered/eWmiv9uIXQk_filtered.json b/annotations_filtered/eWmiv9uIXQk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..964480dc1ee462091207d8334946d80b621104d9 --- /dev/null +++ b/annotations_filtered/eWmiv9uIXQk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 44.27], [47.0, 107.25], [107.0, 110.12]], "keep_status": [false, false, false], "silence_prob": [30.74, 0.0, 30.99], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 60.6], ["cattle, bovinae", 18.75], ["moo", 8.7]], null, [["whale vocalization", 93.69], ["animal", 2.55], ["roaring cats (lions, tigers)", 1.13]]], "duration": [7.27, 60.25, 3.12]} \ No newline at end of file diff --git a/annotations_filtered/eX3czjlDO5w_filtered.json b/annotations_filtered/eX3czjlDO5w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..196c91d4df4d8ac4cccee65867ed4042bab9d75c --- /dev/null +++ b/annotations_filtered/eX3czjlDO5w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.97], [13.0, 13.26], [14.0, 17.81], [20.0, 20.7], [21.0, 22.91], [23.0, 25.08], [25.0, 26.37], [28.0, 30.37], [36.0, 39.77]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.52, 0.0, 0.0, 50.81, 0.0, 41.1, 53.72], "audiomae_on_audioset": [null, null, [["speech", 53.67], ["sidetone", 28.48], ["sine wave", 3.82]], null, null, null, null, [["sidetone", 46.76], ["speech", 34.3], ["sine wave", 5.34]], null], "duration": [-0.03, 0.26, 3.81, 0.7, 1.91, 2.08, 1.37, 2.37, 3.77]} \ No newline at end of file diff --git a/annotations_filtered/eXHdqulNiBs_filtered.json b/annotations_filtered/eXHdqulNiBs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf468c7b41e58220141f460cc511687064d56487 --- /dev/null +++ b/annotations_filtered/eXHdqulNiBs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.32], [19.0, 36.76], [40.0, 46.82], [49.0, 54.26], [55.0, 60.44], [61.0, 89.85], [94.0, 96.35], [102.0, 111.84], [117.0, 137.51]], "keep_status": [false, false, true, true, false, true, false, true, true], "silence_prob": [0.0, 30.38, 29.52, 39.8, 29.74, 30.27, 37.09, 28.48, 32.06], "audiomae_on_audioset": [null, [["music", 82.97], ["musical instrument", 2.68], ["guitar", 1.53]], [["music", 42.24], ["boing", 10.69], ["speech", 7.68]], [["music", 38.5], ["throbbing", 13.66], ["hum", 10.87]], [["music", 56.26], ["smash, crash", 13.29], ["throbbing", 5.1]], [["speech", 35.17], ["music", 29.26], ["hum", 3.62]], [["music", 70.75], ["throbbing", 5.06], ["hum", 2.69]], [["music", 47.51], ["throbbing", 5.82], ["pulse", 4.5]], [["music", 31.27], ["throbbing", 22.26], ["hum", 13.24]]], "duration": [1.32, 17.76, 6.82, 5.26, 5.44, 28.85, 2.35, 9.84, 20.51]} \ No newline at end of file diff --git a/annotations_filtered/eXVVSJUhDmo_filtered.json b/annotations_filtered/eXVVSJUhDmo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04b8d7e8c9ed5d6ef3ccb934ca73a3d7cc40a2d2 --- /dev/null +++ b/annotations_filtered/eXVVSJUhDmo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.62], [7.0, 8.07], [11.0, 13.98], [16.0, 17.12], [23.0, 23.85], [26.0, 26.45], [27.0, 27.33], [29.0, 29.51], [31.0, 39.43], [46.0, 46.89], [47.0, 47.63], [49.0, 50.79], [54.0, 54.97], [68.0, 68.54], [77.0, 77.33], [78.0, 82.78], [84.0, 89.67], [93.0, 94.42], [95.0, 95.01], [108.0, 108.87], [111.0, 112.38], [114.0, 114.2], [118.0, 118.77], [123.0, 124.75], [129.0, 129.51], [133.0, 133.02], [136.0, 136.8], [137.0, 137.84], [138.0, 138.65], [144.0, 146.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 82.79, 0.0, 0.0, 0.0, 0.0, 0.0, 86.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.62, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 1.07, 2.98, 1.12, 0.85, 0.45, 0.33, 0.51, 8.43, 0.89, 0.63, 1.79, 0.97, 0.54, 0.33, 4.78, 5.67, 1.42, 0.01, 0.87, 1.38, 0.2, 0.77, 1.75, 0.51, 0.02, 0.8, 0.84, 0.65, 2.47]} \ No newline at end of file diff --git a/annotations_filtered/eYJYW_9mFVg_filtered.json b/annotations_filtered/eYJYW_9mFVg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b60a98d1b597d2dff6fe56dce928aec3ba3ab83 --- /dev/null +++ b/annotations_filtered/eYJYW_9mFVg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 10.0], [14.0, 14.25], [19.0, 20.46], [38.0, 38.48], [51.0, 52.73], [54.0, 54.45], [57.0, 59.37], [68.0, 72.59], [73.0, 117.09], [118.0, 118.93], [122.0, 122.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.03, 0.0, 0.0, 0.0, 0.0, 0.0, 98.27, 54.1, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 62.74], ["hum", 7.32], ["clip-clop", 4.48]], null, null, null, null, null, null, null, null, null, null], "duration": [8.0, 0.25, 1.46, 0.48, 1.73, 0.45, 2.37, 4.59, 44.09, 0.93, 0.98]} \ No newline at end of file diff --git a/annotations_filtered/eYMbAHC6RxU_filtered.json b/annotations_filtered/eYMbAHC6RxU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..725fbd5140725da146c8b45f63b8917d317cd023 --- /dev/null +++ b/annotations_filtered/eYMbAHC6RxU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 14.27], [16.0, 17.02], [18.0, 21.68], [24.0, 25.15], [26.0, 27.89], [30.0, 32.37], [33.0, 34.67], [35.0, 36.44], [38.0, 41.49], [43.0, 48.63], [49.0, 49.76], [50.0, 52.02], [53.0, 53.16], [54.0, 60.81], [62.0, 64.05], [65.0, 65.7], [67.0, 69.4], [69.0, 69.79], [70.0, 75.05], [77.0, 78.75], [81.0, 80.99], [81.0, 83.17], [85.0, 85.95], [88.0, 89.26], [90.0, 94.78], [96.0, 96.38], [98.0, 103.44], [105.0, 111.55], [115.0, 115.47], [116.0, 117.68], [120.0, 122.59], [125.0, 126.39], [127.0, 131.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 89.54, 99.59, 0.0, 100.0, 0.0, 99.98, 100.0, 0.0, 91.47, 0.0, 95.64, 0.0, 0.0, 73.51, 0.0, 0.0, 100.0, 0.0, 98.36, 100.0, 0.0, 0.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.27, 1.02, 3.68, 1.15, 1.89, 2.37, 1.67, 1.44, 3.49, 5.63, 0.76, 2.02, 0.16, 6.81, 2.05, 0.7, 2.4, 0.79, 5.05, 1.75, -0.01, 2.17, 0.95, 1.26, 4.78, 0.38, 5.44, 6.55, 0.47, 1.68, 2.59, 1.39, 4.45]} \ No newline at end of file diff --git a/annotations_filtered/eYrt5n8DA2M_filtered.json b/annotations_filtered/eYrt5n8DA2M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3fb5c7952009c3696674c94d8b7d6f91e61e0f65 --- /dev/null +++ b/annotations_filtered/eYrt5n8DA2M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.05], [8.0, 13.09], [13.0, 15.08], [16.0, 16.38], [17.0, 17.95], [21.0, 21.83], [23.0, 30.52], [31.0, 34.13], [36.0, 36.9], [37.0, 39.55], [40.0, 41.15], [42.0, 43.11], [44.0, 43.78], [45.0, 106.02], [108.0, 119.43], [120.0, 124.63], [125.0, 141.22], [142.0, 146.87], [147.0, 158.21], [159.0, 161.5], [162.0, 172.12], [173.0, 175.42]], "keep_status": [false, true, true, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false, true, false, false, false], "silence_prob": [100.0, 43.13, 37.57, 0.0, 0.0, 0.0, 89.54, 34.19, 0.0, 79.94, 0.0, 0.0, 0.0, 0.0, 30.1, 99.97, 38.46, 100.0, 29.68, 43.66, 28.06, 30.86], "audiomae_on_audioset": [null, [["sidetone", 27.96], ["sine wave", 17.31], ["dial tone", 13.82]], [["sidetone", 32.88], ["speech", 19.7], ["busy signal", 9.67]], null, null, null, null, [["speech", 41.96], ["animal", 10.32], ["domestic animals, pets", 8.12]], null, null, null, null, null, null, [["music", 12.12], ["rumble", 11.8], ["sonar", 3.79]], null, [["whale vocalization", 12.72], ["sidetone", 11.94], ["boing", 8.95]], null, [["speech", 26.51], ["burst, pop", 8.12], ["beep, bleep", 7.06]], [["sidetone", 57.63], ["hum", 11.21], ["speech", 4.96]], [["speech", 61.63], ["screaming", 8.58], ["burst, pop", 5.8]], [["moo", 35.69], ["cattle, bovinae", 30.78], ["speech", 8.69]]], "duration": [4.05, 5.09, 2.08, 0.38, 0.95, 0.83, 7.52, 3.13, 0.9, 2.55, 1.15, 1.11, -0.22, 61.02, 11.43, 4.63, 16.22, 4.87, 11.21, 2.5, 10.12, 2.42]} \ No newline at end of file diff --git a/annotations_filtered/eYx5m_iT-1U_filtered.json b/annotations_filtered/eYx5m_iT-1U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1c6d75554ea98631aee9e7efc0edf2550b7468a --- /dev/null +++ b/annotations_filtered/eYx5m_iT-1U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.21], [12.0, 12.18], [14.0, 14.66], [15.0, 16.17], [19.0, 19.47], [22.0, 23.23], [25.0, 25.14], [27.0, 30.01], [32.0, 33.72], [35.0, 37.88], [43.0, 43.78], [45.0, 44.95], [46.0, 46.21], [48.0, 50.11], [51.0, 51.34], [53.0, 53.52], [54.0, 65.13], [68.0, 93.46], [95.0, 99.74], [103.0, 106.27], [108.0, 108.06], [113.0, 118.0]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 0.0, 36.67, 0.0, 0.0, 0.0, 44.23, 0.0, 0.0, 31.93, 34.34, 39.27, 44.32, 0.0, 71.87], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["grunt", 27.31], ["whack, thwack", 11.43], ["speech", 7.18]], null, null, null, [["music", 26.39], ["electronic music", 5.92], ["ambient music", 4.41]], null, null, [["speech", 38.26], ["music", 31.18], ["whack, thwack", 7.77]], [["music", 51.09], ["fart", 12.85], ["boing", 9.19]], [["music", 26.11], ["speech", 23.76], ["fart", 13.82]], [["noise", 45.89], ["burping, eructation", 12.01], ["speech", 9.58]], null, null], "duration": [0.21, 0.18, 0.66, 1.17, 0.47, 1.23, 0.14, 3.01, 1.72, 2.88, 0.78, -0.05, 0.21, 2.11, 0.34, 0.52, 11.13, 25.46, 4.74, 3.27, 0.06, 5.0]} \ No newline at end of file diff --git a/annotations_filtered/eZ64IFqMQuQ_filtered.json b/annotations_filtered/eZ64IFqMQuQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96986b9e393f063441353856fc3fe10ce5a4e8d9 --- /dev/null +++ b/annotations_filtered/eZ64IFqMQuQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.52], [18.0, 19.41], [23.0, 23.79], [27.0, 28.31], [38.0, 38.6], [40.0, 41.32], [50.0, 52.12], [54.0, 54.68], [56.0, 56.84], [58.0, 58.67], [61.0, 62.24], [65.0, 65.55], [69.0, 69.89], [73.0, 73.89], [75.0, 76.47], [80.0, 80.37], [89.0, 89.04], [92.0, 92.97], [97.0, 97.6], [106.0, 107.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.52, 1.41, 0.79, 1.31, 0.6, 1.32, 2.12, 0.68, 0.84, 0.67, 1.24, 0.55, 0.89, 0.89, 1.47, 0.37, 0.04, 0.97, 0.6, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/eZWHAM2EG3o_filtered.json b/annotations_filtered/eZWHAM2EG3o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17f0b7d59c4754644f4f1d3030c3c5939c016fc8 --- /dev/null +++ b/annotations_filtered/eZWHAM2EG3o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.92], [10.0, 10.52]], "keep_status": [false, false], "silence_prob": [66.39, 0.0], "audiomae_on_audioset": [null, null], "duration": [4.92, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/eZXgYKx0aQI_filtered.json b/annotations_filtered/eZXgYKx0aQI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0bd4d570b293e092b54cee585a008a1c212e25bd --- /dev/null +++ b/annotations_filtered/eZXgYKx0aQI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.95], [3.0, 4.77], [7.0, 9.61], [17.0, 17.74], [18.0, 19.26], [22.0, 23.09], [27.0, 27.48], [31.0, 31.11], [34.0, 34.37], [45.0, 45.35], [51.0, 53.33], [56.0, 56.25], [64.0, 64.1], [68.0, 68.94], [75.0, 75.27], [80.0, 80.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 93.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.95, 1.77, 2.61, 0.74, 1.26, 1.09, 0.48, 0.11, 0.37, 0.35, 2.33, 0.25, 0.1, 0.94, 0.27, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/eZc3GMgzwyk_filtered.json b/annotations_filtered/eZc3GMgzwyk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..680948c6c43ad180ebb660d0df87b8163ed643a5 --- /dev/null +++ b/annotations_filtered/eZc3GMgzwyk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 16.51], [31.0, 35.58], [40.0, 50.9], [51.0, 51.92], [53.0, 60.44], [65.0, 77.21], [78.0, 78.98], [85.0, 85.5], [87.0, 87.96], [89.0, 90.12], [90.0, 92.16], [93.0, 93.02]], "keep_status": [true, true, true, false, true, true, false, false, false, false, false, false], "silence_prob": [33.0, 32.88, 33.0, 0.0, 32.82, 32.73, 0.0, 0.0, 0.0, 0.0, 50.21, 0.0], "audiomae_on_audioset": [[["music", 22.26], ["synthesizer", 15.56], ["buzz", 9.36]], [["music", 18.16], ["speech", 11.42], ["fly, housefly", 5.09]], [["music", 51.93], ["cacophony", 4.37], ["speech", 3.42]], null, [["music", 26.43], ["vehicle", 18.6], ["speech", 8.04]], [["music", 29.26], ["cattle, bovinae", 9.61], ["moo", 8.75]], null, null, null, null, null, null], "duration": [10.51, 4.58, 10.9, 0.92, 7.44, 12.21, 0.98, 0.5, 0.96, 1.12, 2.16, 0.02]} \ No newline at end of file diff --git a/annotations_filtered/eZp6EmVqq5o_filtered.json b/annotations_filtered/eZp6EmVqq5o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..849230fd26b7eec71118ca281072b4dffc12bf77 --- /dev/null +++ b/annotations_filtered/eZp6EmVqq5o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.3], [4.0, 5.54], [8.0, 9.15], [11.0, 61.5], [66.0, 67.66], [71.0, 71.54], [76.0, 76.89], [87.0, 87.34], [90.0, 90.88], [94.0, 96.36], [99.0, 99.54], [100.0, 100.84], [105.0, 105.26], [108.0, 107.94], [114.0, 114.47], [116.0, 117.8], [118.0, 120.06], [122.0, 123.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.34, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.3, 1.54, 1.15, 50.5, 1.66, 0.54, 0.89, 0.34, 0.88, 2.36, 0.54, 0.84, 0.26, -0.06, 0.47, 1.8, 2.06, 1.65]} \ No newline at end of file diff --git a/annotations_filtered/eZtQn-GAemQ_filtered.json b/annotations_filtered/eZtQn-GAemQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79d152d6a4affb89658db3dfb5ddbc3bdf4bdd1a --- /dev/null +++ b/annotations_filtered/eZtQn-GAemQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.45], [5.0, 6.18], [7.0, 8.06], [9.0, 9.86], [21.0, 29.49], [30.0, 32.16], [33.0, 33.15], [34.0, 34.48], [35.0, 39.39], [40.0, 40.37], [41.0, 44.22], [45.0, 50.04], [51.0, 55.14], [56.0, 56.3], [60.0, 61.6], [62.0, 64.4], [65.0, 66.06], [67.0, 67.1], [68.0, 68.98], [69.0, 69.52], [72.0, 75.36], [76.0, 77.19], [78.0, 78.78], [85.0, 85.89], [92.0, 92.18], [94.0, 94.71], [103.0, 103.4], [105.0, 105.6], [109.0, 111.65], [113.0, 114.08], [118.0, 121.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 70.58, 100.0, 0.0, 0.0, 100.0, 0.0, 100.0, 100.0, 100.0, 0.0, 0.0, 96.77, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 1.18, 1.06, 0.86, 8.49, 2.16, 0.15, 0.48, 4.39, 0.37, 3.22, 5.04, 4.14, 0.3, 1.6, 2.4, 1.06, 0.1, 0.98, 0.52, 3.36, 1.19, 0.78, 0.89, 0.18, 0.71, 0.4, 0.6, 2.65, 1.08, 3.04]} \ No newline at end of file diff --git a/annotations_filtered/e_S58iPZYu8_filtered.json b/annotations_filtered/e_S58iPZYu8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd7266a6ecbc78b61b11249ef27207663f579b64 --- /dev/null +++ b/annotations_filtered/e_S58iPZYu8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 9.91], [19.0, 20.01], [23.0, 23.26], [28.0, 28.7], [31.0, 36.0], [48.0, 48.68], [49.0, 63.15], [67.0, 70.33], [71.0, 71.86], [73.0, 115.8], [117.0, 118.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 50.46, 0.0, 53.84, 55.18, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.09, 1.01, 0.26, 0.7, 5.0, 0.68, 14.15, 3.33, 0.86, 42.8, 1.96]} \ No newline at end of file diff --git a/annotations_filtered/ealJoNJuKnY_filtered.json b/annotations_filtered/ealJoNJuKnY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc87d009b7ec0bc6c6ad724db4b249505680581c --- /dev/null +++ b/annotations_filtered/ealJoNJuKnY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.71], [7.0, 8.36], [9.0, 10.0], [12.0, 16.34], [17.0, 17.91], [35.0, 36.39], [37.0, 37.88], [40.0, 41.45], [45.0, 45.23], [51.0, 50.77], [52.0, 53.91], [60.0, 60.89], [69.0, 71.34], [79.0, 80.13], [81.0, 81.78], [89.0, 89.9], [93.0, 95.17], [96.0, 97.21], [98.0, 100.99], [102.0, 105.63], [108.0, 112.13], [112.0, 115.32], [117.0, 119.62], [121.0, 124.02], [125.0, 126.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.36, 0.0, 0.0, 0.0, 43.2, 0.0, 49.18, 100.0, 98.19, 61.97, 99.05, 63.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 21.81], ["hum", 21.74], ["mechanisms", 15.87]], null, null, null, [["speech", 34.86], ["music", 18.73], ["telephone", 4.79]], null, [["speech", 56.02], ["echo", 23.0], ["reverberation", 3.21]], null, null, null, null, null, null], "duration": [1.71, 1.36, 1.0, 4.34, 0.91, 1.39, 0.88, 1.45, 0.23, -0.23, 1.91, 0.89, 2.34, 1.13, 0.78, 0.9, 2.17, 1.21, 2.99, 3.63, 4.13, 3.32, 2.62, 3.02, 1.23]} \ No newline at end of file diff --git a/annotations_filtered/eb46yXP211w_filtered.json b/annotations_filtered/eb46yXP211w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f21bef4b7fd97b46929a14e6cd5fd9a4826bfe90 --- /dev/null +++ b/annotations_filtered/eb46yXP211w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.48], [14.0, 34.72], [38.0, 39.45], [40.0, 41.47], [42.0, 42.77], [43.0, 43.92], [46.0, 46.92], [51.0, 52.24], [54.0, 56.46], [58.0, 57.72], [58.0, 59.46], [76.0, 76.32], [84.0, 85.72], [90.0, 90.96], [91.0, 91.71], [100.0, 99.87], [102.0, 102.69], [106.0, 110.89], [114.0, 114.2], [118.0, 118.93], [125.0, 127.36], [129.0, 129.61], [130.0, 132.63], [135.0, 137.59], [139.0, 139.7], [145.0, 145.91], [152.0, 152.61], [154.0, 153.96], [165.0, 165.82]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [58.47, 48.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.54, 0.0, 0.0, 67.63, 0.0, 60.98, 40.43, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 56.7], ["hum", 4.04], ["fly, housefly", 3.54]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 31.82], ["burping, eructation", 31.82], ["speech", 11.87]], null, null, null, null, null, [["stomach rumble", 63.72], ["noise", 9.22], ["whale vocalization", 3.06]], null, null, null, null, null], "duration": [2.48, 20.72, 1.45, 1.47, 0.77, 0.92, 0.92, 1.24, 2.46, -0.28, 1.46, 0.32, 1.72, 0.96, 0.71, -0.13, 0.69, 4.89, 0.2, 0.93, 2.36, 0.61, 2.63, 2.59, 0.7, 0.91, 0.61, -0.04, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/ebHQ50ZRvM4_filtered.json b/annotations_filtered/ebHQ50ZRvM4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97f100b0d2d324821d12f0ac98cdec8e8a7eb722 --- /dev/null +++ b/annotations_filtered/ebHQ50ZRvM4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.71], [10.0, 10.54], [15.0, 17.49], [19.0, 41.27], [43.0, 44.19], [47.0, 47.44], [50.0, 50.97], [52.0, 51.75], [52.0, 51.87], [55.0, 54.95], [57.0, 95.17], [96.0, 97.56], [98.0, 101.61], [102.0, 107.47], [111.0, 112.9], [115.0, 115.7], [116.0, 118.83], [121.0, 125.69], [127.0, 128.14], [129.0, 130.42], [132.0, 149.94]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 47.43, 39.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.31, 47.62, 0.0, 0.0, 51.23, 52.62, 0.0, 0.0, 62.89], "audiomae_on_audioset": [null, null, [["music", 68.7], ["guitar", 7.66], ["musical instrument", 6.12]], [["music", 55.3], ["livestock, farm animals, working animals", 6.46], ["sheep", 6.12]], null, null, null, null, null, null, null, null, null, [["music", 50.44], ["speech", 23.44], ["synthesizer", 1.5]], null, null, null, null, null, null, null], "duration": [0.71, 0.54, 2.49, 22.27, 1.19, 0.44, 0.97, -0.25, -0.13, -0.05, 38.17, 1.56, 3.61, 5.47, 1.9, 0.7, 2.83, 4.69, 1.14, 1.42, 17.94]} \ No newline at end of file diff --git a/annotations_filtered/ebj_l5icPPg_filtered.json b/annotations_filtered/ebj_l5icPPg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6fc9aa748d5fff1c830666c636603ed2bb31d14 --- /dev/null +++ b/annotations_filtered/ebj_l5icPPg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.28], [19.0, 21.69], [22.0, 22.54], [30.0, 30.57], [33.0, 33.81], [39.0, 39.34], [41.0, 41.34], [42.0, 44.85], [57.0, 57.03], [57.0, 57.28], [60.0, 65.52], [69.0, 69.82], [72.0, 73.48], [75.0, 74.78], [76.0, 76.96], [78.0, 80.16], [81.0, 87.56], [88.0, 87.96], [88.0, 93.77], [95.0, 95.45], [96.0, 96.38], [98.0, 98.68], [107.0, 108.97], [111.0, 111.47]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.48, 0.0, 0.0, 0.0, 0.0, 0.0, 48.02, 0.0, 0.0, 63.1, 0.0, 0.0, 0.0, 0.0, 99.91, 99.71, 0.0, 79.24, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 52.11], ["didgeridoo", 6.55], ["sonar", 6.26]], null, null, null, null, null, [["creak", 28.34], ["whale vocalization", 14.73], ["theremin", 10.87]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.28, 2.69, 0.54, 0.57, 0.81, 0.34, 0.34, 2.85, 0.03, 0.28, 5.52, 0.82, 1.48, -0.22, 0.96, 2.16, 6.56, -0.04, 5.77, 0.45, 0.38, 0.68, 1.97, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/ebkY0u1-NKk_filtered.json b/annotations_filtered/ebkY0u1-NKk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8bca25d2594ab280702db763835f0bf82c2779da --- /dev/null +++ b/annotations_filtered/ebkY0u1-NKk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.34], [15.0, 21.1], [26.0, 26.1], [27.0, 28.76], [31.0, 32.97], [34.0, 34.8], [36.0, 36.21], [38.0, 38.37], [40.0, 46.5], [48.0, 49.38], [50.0, 51.19], [52.0, 52.1], [53.0, 53.72], [55.0, 56.05], [57.0, 57.84], [59.0, 59.64], [63.0, 63.78], [68.0, 67.93], [68.0, 70.19], [71.0, 72.59], [76.0, 76.2], [78.0, 78.85], [82.0, 82.32], [85.0, 85.77], [96.0, 101.82], [102.0, 102.9], [105.0, 105.92], [107.0, 110.71], [111.0, 112.63], [114.0, 114.59], [120.0, 124.65]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 48.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.74, 0.0, 0.0, 0.0, 0.0, 0.0, 30.07, 0.0, 0.0, 39.86, 0.0, 0.0, 47.9], "audiomae_on_audioset": [null, [["hum", 40.81], ["throbbing", 15.34], ["radio", 7.47]], null, null, null, null, null, null, [["speech", 70.53], ["echo", 5.65], ["wail, moan", 5.51]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 57.45], ["fart", 11.46], ["whack, thwack", 5.39]], null, null, [["sidetone", 44.18], ["speech", 30.67], ["radio", 14.96]], null, null, [["hum", 19.34], ["fart", 11.96], ["speech", 7.94]]], "duration": [0.34, 6.1, 0.1, 1.76, 1.97, 0.8, 0.21, 0.37, 6.5, 1.38, 1.19, 0.1, 0.72, 1.05, 0.84, 0.64, 0.78, -0.07, 2.19, 1.59, 0.2, 0.85, 0.32, 0.77, 5.82, 0.9, 0.92, 3.71, 1.63, 0.59, 4.65]} \ No newline at end of file diff --git a/annotations_filtered/ec9h1IjltJg_filtered.json b/annotations_filtered/ec9h1IjltJg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..666014ec76183e8ffe5e8af842593e986c5313d8 --- /dev/null +++ b/annotations_filtered/ec9h1IjltJg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 16.34], [22.0, 30.28], [31.0, 98.93], [102.0, 102.46], [103.0, 104.67], [105.0, 107.42], [109.0, 109.66], [111.0, 116.78], [118.0, 119.47], [121.0, 123.79], [124.0, 127.14], [128.0, 129.1], [131.0, 131.41]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.22, 41.22, 0.0, 0.0, 0.0, 87.74, 0.0, 99.59, 0.0, 99.62, 55.74, 0.0, 0.0], "audiomae_on_audioset": [[["music", 48.37], ["singing bowl", 15.42], ["speech", 10.14]], [["music", 37.2], ["hum", 14.41], ["mains hum", 9.79]], null, null, null, null, null, null, null, null, null, null, null], "duration": [13.34, 8.28, 67.93, 0.46, 1.67, 2.42, 0.66, 5.78, 1.47, 2.79, 3.14, 1.1, 0.41]} \ No newline at end of file diff --git a/annotations_filtered/ecWhXP2jM28_filtered.json b/annotations_filtered/ecWhXP2jM28_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/ecWhXP2jM28_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/eclUi6kVFcM_filtered.json b/annotations_filtered/eclUi6kVFcM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abc7ea596200b2baf4cfcfa1e546a11e9fbc7b2b --- /dev/null +++ b/annotations_filtered/eclUi6kVFcM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.75], [10.0, 11.69], [30.0, 33.47], [36.0, 41.15], [43.0, 46.58], [56.0, 57.15], [61.0, 61.89], [64.0, 64.72], [78.0, 83.61], [84.0, 84.32], [86.0, 86.44], [89.0, 89.14], [93.0, 93.39], [94.0, 95.01], [96.0, 96.57], [98.0, 98.47], [100.0, 100.84], [107.0, 106.88], [114.0, 114.94], [115.0, 116.31], [117.0, 123.26], [130.0, 130.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 39.33, 37.95, 39.37, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.07, 0.0], "audiomae_on_audioset": [null, null, [["music", 64.18], ["chorus effect", 9.98], ["effects unit", 4.24]], [["music", 80.75], ["singing", 1.75], ["country", 1.26]], [["music", 76.22], ["middle eastern music", 2.14], ["musical instrument", 1.9]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.75, 1.69, 3.47, 5.15, 3.58, 1.15, 0.89, 0.72, 5.61, 0.32, 0.44, 0.14, 0.39, 1.01, 0.57, 0.47, 0.84, -0.12, 0.94, 1.31, 6.26, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/ecmDPqCP8ms_filtered.json b/annotations_filtered/ecmDPqCP8ms_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..648f49308d26ed08d815634200c336f6f7b47e9d --- /dev/null +++ b/annotations_filtered/ecmDPqCP8ms_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.38], [16.0, 17.07], [18.0, 18.39], [19.0, 20.88], [22.0, 23.95], [25.0, 26.74], [27.0, 29.79], [30.0, 31.77], [32.0, 33.93], [37.0, 39.5], [41.0, 42.23], [46.0, 46.58], [48.0, 49.74], [52.0, 51.83], [54.0, 54.97], [57.0, 57.59], [59.0, 59.04], [61.0, 71.59], [77.0, 78.83], [80.0, 82.04], [86.0, 87.93], [88.0, 92.85], [93.0, 95.69], [96.0, 99.82], [101.0, 103.32], [106.0, 106.84], [107.0, 108.53], [112.0, 111.75], [114.0, 115.64], [119.0, 119.57], [125.0, 124.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.22, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.96, 0.0, 99.78, 0.0, 99.31, 98.01, 99.92, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.38, 1.07, 0.39, 1.88, 1.95, 1.74, 2.79, 1.77, 1.93, 2.5, 1.23, 0.58, 1.74, -0.17, 0.97, 0.59, 0.04, 10.59, 1.83, 2.04, 1.93, 4.85, 2.69, 3.82, 2.32, 0.84, 1.53, -0.25, 1.64, 0.57, -0.15]} \ No newline at end of file diff --git a/annotations_filtered/ecmRksfy--I_filtered.json b/annotations_filtered/ecmRksfy--I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09476f188ace1b56f5fa2a3ed3b4681cdc836842 --- /dev/null +++ b/annotations_filtered/ecmRksfy--I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 24.48], [51.0, 51.39]], "keep_status": [true, false], "silence_prob": [46.94, 0.0], "audiomae_on_audioset": [[["frog", 28.9], ["music", 17.19], ["croak", 6.11]], null], "duration": [2.48, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/ecsPydUbYGM_filtered.json b/annotations_filtered/ecsPydUbYGM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f80d7ab54eb4df10064f63bddf30483a65bf817 --- /dev/null +++ b/annotations_filtered/ecsPydUbYGM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.51], [15.0, 16.33], [18.0, 19.68], [20.0, 21.47], [27.0, 41.84], [46.0, 49.27], [50.0, 50.94], [54.0, 67.76], [72.0, 76.28], [77.0, 78.43], [79.0, 81.16], [82.0, 90.05], [91.0, 91.76], [96.0, 98.25], [101.0, 115.1], [115.0, 124.75], [126.0, 127.6]], "keep_status": [true, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [44.96, 0.0, 0.0, 0.0, 62.78, 58.81, 0.0, 40.59, 41.98, 0.0, 33.53, 43.08, 0.0, 39.21, 55.89, 48.19, 0.0], "audiomae_on_audioset": [[["hum", 43.28], ["mains hum", 13.75], ["throbbing", 8.2]], null, null, null, null, null, null, [["music", 32.42], ["speech", 19.84], ["theremin", 19.74]], [["hum", 19.4], ["speech", 18.19], ["mains hum", 14.93]], null, [["speech", 41.62], ["music", 16.44], ["theremin", 9.31]], [["music", 48.21], ["theremin", 16.7], ["singing bowl", 7.24]], null, [["theremin", 48.38], ["music", 25.21], ["musical instrument", 3.63]], null, [["speech", 47.32], ["hum", 19.12], ["mains hum", 8.87]], null], "duration": [3.51, 1.33, 1.68, 1.47, 14.84, 3.27, 0.94, 13.76, 4.28, 1.43, 2.16, 8.05, 0.76, 2.25, 14.1, 9.75, 1.6]} \ No newline at end of file diff --git a/annotations_filtered/edBNDiSwnlg_filtered.json b/annotations_filtered/edBNDiSwnlg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7a16ff55913a768c580361406abffa52472c311 --- /dev/null +++ b/annotations_filtered/edBNDiSwnlg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 42.58], [43.0, 43.33], [44.0, 46.16], [53.0, 98.27], [100.0, 100.84], [102.0, 145.23]], "keep_status": [true, false, true, false, false, false], "silence_prob": [30.77, 0.0, 35.56, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 22.91], ["music", 13.83], ["animal", 13.09]], null, [["speech", 34.21], ["music", 20.53], ["hum", 11.53]], null, null, null], "duration": [17.58, 0.33, 2.16, 45.27, 0.84, 43.23]} \ No newline at end of file diff --git a/annotations_filtered/edHmOaS0lRU_filtered.json b/annotations_filtered/edHmOaS0lRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c119e136408e6906cf79375a9198122a98e8e112 --- /dev/null +++ b/annotations_filtered/edHmOaS0lRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.99], [12.0, 35.48], [41.0, 61.43], [65.0, 77.33], [81.0, 81.67], [83.0, 93.43], [96.0, 95.82], [97.0, 99.47], [102.0, 126.86], [129.0, 134.89], [137.0, 158.62], [160.0, 159.63]], "keep_status": [true, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [28.74, 28.9, 29.57, 30.19, 0.0, 29.66, 0.0, 30.53, 29.37, 29.8, 29.65, 0.0], "audiomae_on_audioset": [[["speech", 27.97], ["explosion", 15.54], ["burst, pop", 13.17]], [["music", 29.9], ["cacophony", 10.32], ["explosion", 10.18]], [["music", 47.88], ["smash, crash", 8.98], ["clang", 6.64]], [["music", 67.72], ["speech", 18.13], ["gunshot, gunfire", 2.28]], null, [["machine gun", 28.65], ["speech", 26.78], ["music", 19.87]], null, [["music", 65.01], ["throbbing", 8.76], ["trance music", 3.52]], [["music", 83.11], ["smash, crash", 2.2], ["cacophony", 1.97]], [["music", 63.24], ["speech", 17.65], ["throbbing", 4.84]], [["music", 47.91], ["speech", 34.04], ["breaking", 2.05]], null], "duration": [5.99, 23.48, 20.43, 12.33, 0.67, 10.43, -0.18, 2.47, 24.86, 5.89, 21.62, -0.37]} \ No newline at end of file diff --git a/annotations_filtered/edQy5jBxhV8_filtered.json b/annotations_filtered/edQy5jBxhV8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49cccc5fd2e0b09430e14bee90fec8d68ebf743a --- /dev/null +++ b/annotations_filtered/edQy5jBxhV8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.47], [8.0, 9.12], [14.0, 14.59], [17.0, 18.77], [20.0, 20.01], [26.0, 28.41], [29.0, 30.06], [34.0, 34.55], [35.0, 35.67], [39.0, 44.68], [45.0, 45.47], [46.0, 47.17], [48.0, 55.05], [57.0, 58.87], [61.0, 65.85], [67.0, 72.08], [73.0, 73.16], [74.0, 74.71], [75.0, 75.81], [76.0, 80.18], [81.0, 84.69], [92.0, 95.91], [97.0, 97.77], [99.0, 101.14], [102.0, 106.91], [108.0, 108.26], [114.0, 114.96], [116.0, 116.26], [119.0, 122.74], [124.0, 127.89], [128.0, 129.59], [133.0, 135.57], [138.0, 138.67], [143.0, 144.29], [145.0, 145.22], [146.0, 146.89], [148.0, 149.03], [154.0, 153.93], [156.0, 159.7], [168.0, 167.88], [171.0, 174.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 80.82, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 100.0, 68.02, 0.0, 0.0, 0.0, 98.66, 76.2, 100.0, 0.0, 99.97, 98.66, 0.0, 0.0, 0.0, 100.0, 87.55, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.37, 0.0, 62.47], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 1.12, 0.59, 1.77, 0.01, 2.41, 1.06, 0.55, 0.67, 5.68, 0.47, 1.17, 7.05, 1.87, 4.85, 5.08, 0.16, 0.71, 0.81, 4.18, 3.69, 3.91, 0.77, 2.14, 4.91, 0.26, 0.96, 0.26, 3.74, 3.89, 1.59, 2.57, 0.67, 1.29, 0.22, 0.89, 1.03, -0.07, 3.7, -0.12, 3.18]} \ No newline at end of file diff --git a/annotations_filtered/edX09NFZ3oc_filtered.json b/annotations_filtered/edX09NFZ3oc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d30d0160bfb8e0089d9956258b9fc7e52f205f2d --- /dev/null +++ b/annotations_filtered/edX09NFZ3oc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.5], [8.0, 8.92], [9.0, 13.69], [23.0, 23.9], [35.0, 47.56], [51.0, 51.46], [54.0, 54.51], [57.0, 57.38], [58.0, 58.83], [61.0, 61.03], [64.0, 63.71], [67.0, 67.42], [69.0, 69.85], [72.0, 72.96], [78.0, 78.19], [84.0, 84.59], [92.0, 93.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.73, 0.0, 82.97, 0.0, 59.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.5, 0.92, 4.69, 0.9, 12.56, 0.46, 0.51, 0.38, 0.83, 0.03, -0.29, 0.42, 0.85, 0.96, 0.19, 0.59, 1.92]} \ No newline at end of file diff --git a/annotations_filtered/edaHyeIxzcI_filtered.json b/annotations_filtered/edaHyeIxzcI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12c1143b2b2782f7534150f0bc8759a5138d72b6 --- /dev/null +++ b/annotations_filtered/edaHyeIxzcI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 33.03], [35.0, 52.41], [87.0, 93.61], [98.0, 106.59], [108.0, 130.13], [131.0, 131.89]], "keep_status": [true, true, false, false, true, false], "silence_prob": [28.77, 28.5, 28.49, 28.67, 28.72, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 23.73], ["moo", 16.47], ["livestock, farm animals, working animals", 10.87]], [["sidetone", 30.71], ["speech", 12.96], ["music", 8.55]], [["cattle, bovinae", 37.13], ["moo", 31.01], ["livestock, farm animals, working animals", 30.37]], [["livestock, farm animals, working animals", 52.48], ["cattle, bovinae", 29.5], ["moo", 14.9]], [["music", 19.75], ["speech", 11.15], ["hum", 8.0]], null], "duration": [2.03, 17.41, 6.61, 8.59, 22.13, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/edgiUq5ymRE_filtered.json b/annotations_filtered/edgiUq5ymRE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d123f0c5a89756f51281793b694ab2c102a0f7f6 --- /dev/null +++ b/annotations_filtered/edgiUq5ymRE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 11.97], [17.0, 19.11], [22.0, 22.15], [23.0, 26.38], [28.0, 29.1], [30.0, 30.01], [31.0, 35.63], [41.0, 42.13], [46.0, 49.37], [50.0, 58.85], [59.0, 65.15], [67.0, 72.05], [75.0, 75.76], [78.0, 78.46], [80.0, 81.28], [83.0, 85.7], [86.0, 87.67], [89.0, 89.18], [90.0, 95.08], [97.0, 98.66], [101.0, 103.91], [105.0, 106.79], [108.0, 109.39], [110.0, 113.53], [116.0, 120.33], [121.0, 125.14], [126.0, 136.44], [137.0, 140.16], [141.0, 146.1], [147.0, 150.72], [152.0, 152.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [93.91, 97.11, 0.0, 99.99, 0.0, 0.0, 99.59, 0.0, 99.97, 81.89, 99.84, 99.48, 0.0, 0.0, 0.0, 90.08, 0.0, 0.0, 98.51, 0.0, 99.71, 0.0, 0.0, 99.78, 89.72, 99.98, 100.0, 99.56, 94.22, 48.52, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 50.28], ["speech", 14.03], ["throbbing", 2.56]], null], "duration": [9.97, 2.11, 0.15, 3.38, 1.1, 0.01, 4.63, 1.13, 3.37, 8.85, 6.15, 5.05, 0.76, 0.46, 1.28, 2.7, 1.67, 0.18, 5.08, 1.66, 2.91, 1.79, 1.39, 3.53, 4.33, 4.14, 10.44, 3.16, 5.1, 3.72, 0.81]} \ No newline at end of file diff --git a/annotations_filtered/edhJGqAjG7s_filtered.json b/annotations_filtered/edhJGqAjG7s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2d9997db706aca3e96db6c0b11d5af303248d1b --- /dev/null +++ b/annotations_filtered/edhJGqAjG7s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.01], [8.0, 12.31], [13.0, 51.22], [57.0, 62.85], [64.0, 64.08], [66.0, 66.53], [69.0, 68.89], [70.0, 71.47], [72.0, 75.81], [77.0, 82.9], [84.0, 85.5], [93.0, 94.86], [96.0, 96.04], [96.0, 98.88], [100.0, 102.37], [103.0, 104.63], [106.0, 107.2]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [33.63, 29.83, 0.0, 35.74, 0.0, 0.0, 0.0, 0.0, 58.22, 76.37, 0.0, 0.0, 0.0, 45.05, 59.24, 0.0, 0.0], "audiomae_on_audioset": [[["music", 65.87], ["musical instrument", 6.78], ["speech", 3.82]], [["mains hum", 31.88], ["hum", 28.72], ["music", 13.64]], null, [["hum", 40.61], ["music", 16.84], ["throbbing", 9.73]], null, null, null, null, null, null, null, null, null, [["music", 34.79], ["speech", 24.44], ["hum", 5.28]], null, null, null], "duration": [4.01, 4.31, 38.22, 5.85, 0.08, 0.53, -0.11, 1.47, 3.81, 5.9, 1.5, 1.86, 0.04, 2.88, 2.37, 1.63, 1.2]} \ No newline at end of file diff --git a/annotations_filtered/eeGuOguh33o_filtered.json b/annotations_filtered/eeGuOguh33o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e5e6b2a89441bc11a02c6ee52eec980e422337fa --- /dev/null +++ b/annotations_filtered/eeGuOguh33o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 12.04], [15.0, 15.38], [16.0, 16.51], [18.0, 17.9], [19.0, 20.07], [29.0, 29.57], [33.0, 32.8], [33.0, 33.52], [38.0, 37.76], [39.0, 39.75], [43.0, 43.71], [48.0, 53.7], [62.0, 62.82], [67.0, 68.07], [71.0, 73.4], [77.0, 77.03], [77.0, 77.72], [79.0, 79.52], [83.0, 83.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [36.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.09, 0.0, 0.0, 44.78, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 43.28], ["hum", 16.31], ["throbbing", 11.77]], null, null, null, null, null, null, null, null, null, null, [["speech", 70.14], ["music", 9.85], ["hum", 2.83]], null, null, [["speech", 18.96], ["owl", 6.16], ["hoot", 5.72]], null, null, null, null], "duration": [11.04, 0.38, 0.51, -0.1, 1.07, 0.57, -0.2, 0.52, -0.24, 0.75, 0.71, 5.7, 0.82, 1.07, 2.4, 0.03, 0.72, 0.52, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/eeR4VQyoLdc_filtered.json b/annotations_filtered/eeR4VQyoLdc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c59ea60065a10c1dc0f2af3e363911756f29432 --- /dev/null +++ b/annotations_filtered/eeR4VQyoLdc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 50.18], [51.0, 59.61], [60.0, 60.32], [81.0, 81.26], [98.0, 100.06], [101.0, 102.19], [104.0, 105.38], [106.0, 107.25], [110.0, 110.93], [114.0, 115.94], [122.0, 123.18], [127.0, 129.2], [130.0, 132.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 34.28, 0.0, 0.0, 57.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.0, 37.82], "audiomae_on_audioset": [null, [["music", 31.41], ["hum", 30.6], ["mains hum", 11.49]], null, null, null, null, null, null, null, null, null, [["music", 36.64], ["hum", 12.44], ["mains hum", 7.03]], [["mains hum", 20.81], ["hum", 18.83], ["bee, wasp, etc.", 17.18]]], "duration": [31.18, 8.61, 0.32, 0.26, 2.06, 1.19, 1.38, 1.25, 0.93, 1.94, 1.18, 2.2, 2.43]} \ No newline at end of file diff --git a/annotations_filtered/eeWPnGsY-Xc_filtered.json b/annotations_filtered/eeWPnGsY-Xc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..664b6e4bb3769c6ea34bcdd937dc02b42c5a3ff1 --- /dev/null +++ b/annotations_filtered/eeWPnGsY-Xc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.17], [6.0, 6.66], [8.0, 8.77], [10.0, 10.62], [12.0, 12.46], [13.0, 13.49], [15.0, 15.75], [17.0, 16.75], [18.0, 18.03], [22.0, 22.08], [25.0, 25.05], [27.0, 27.46], [29.0, 29.24], [32.0, 31.95], [35.0, 35.07], [38.0, 38.96], [40.0, 40.15], [41.0, 41.34], [42.0, 42.75], [47.0, 47.87], [51.0, 51.24], [52.0, 52.2], [56.0, 57.59], [60.0, 61.37], [63.0, 65.13], [67.0, 67.53], [70.0, 70.39], [71.0, 71.59], [75.0, 75.19], [76.0, 75.78], [80.0, 80.76], [83.0, 84.15], [87.0, 87.64], [89.0, 90.51], [94.0, 93.95], [95.0, 95.08], [97.0, 97.73], [99.0, 99.55], [101.0, 101.39], [104.0, 104.52], [108.0, 108.18], [110.0, 110.46], [113.0, 113.54], [115.0, 115.52], [117.0, 117.88], [120.0, 135.38], [136.0, 136.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [58.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.75, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 42.77], ["music", 26.28], ["mains hum", 13.99]], null], "duration": [2.17, 0.66, 0.77, 0.62, 0.46, 0.49, 0.75, -0.25, 0.03, 0.08, 0.05, 0.46, 0.24, -0.05, 0.07, 0.96, 0.15, 0.34, 0.75, 0.87, 0.24, 0.2, 1.59, 1.37, 2.13, 0.53, 0.39, 0.59, 0.19, -0.22, 0.76, 1.15, 0.64, 1.51, -0.05, 0.08, 0.73, 0.55, 0.39, 0.52, 0.18, 0.46, 0.54, 0.52, 0.88, 15.38, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/eeXePDLKsmU_filtered.json b/annotations_filtered/eeXePDLKsmU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe0e385728ff87c2bfe2d43c7a847814a107ae86 --- /dev/null +++ b/annotations_filtered/eeXePDLKsmU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.69], [7.0, 7.77], [8.0, 9.22], [10.0, 11.65], [13.0, 13.31], [14.0, 15.08], [22.0, 22.28], [26.0, 26.76], [29.0, 29.88], [33.0, 34.03], [37.0, 38.13], [38.0, 39.21], [43.0, 44.32], [45.0, 45.39], [46.0, 48.52], [51.0, 51.92], [54.0, 54.63], [55.0, 55.38], [60.0, 59.81], [63.0, 64.0], [65.0, 65.58], [66.0, 66.56], [70.0, 71.04], [72.0, 75.36], [79.0, 79.73], [86.0, 87.35], [89.0, 89.19], [94.0, 94.61], [99.0, 99.13], [100.0, 100.95], [101.0, 101.82], [102.0, 103.42], [106.0, 106.78], [108.0, 108.95], [110.0, 111.23], [112.0, 112.85], [114.0, 116.07], [117.0, 118.56], [122.0, 122.44], [124.0, 126.08], [126.0, 127.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.33, 0.0, 0.0, 84.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.69, 0.77, 1.22, 1.65, 0.31, 1.08, 0.28, 0.76, 0.88, 1.03, 1.13, 1.21, 1.32, 0.39, 2.52, 0.92, 0.63, 0.38, -0.19, 1.0, 0.58, 0.56, 1.04, 3.36, 0.73, 1.35, 0.19, 0.61, 0.13, 0.95, 0.82, 1.42, 0.78, 0.95, 1.23, 0.85, 2.07, 1.56, 0.44, 2.08, 1.09]} \ No newline at end of file diff --git a/annotations_filtered/eensusNo-jE_filtered.json b/annotations_filtered/eensusNo-jE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89df60b366b9bc1f5798131d2306e48f52cc0919 --- /dev/null +++ b/annotations_filtered/eensusNo-jE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.77], [6.0, 10.47], [12.0, 11.96], [28.0, 29.19], [33.0, 33.57], [34.0, 34.77], [39.0, 38.96], [43.0, 43.85], [46.0, 46.47], [65.0, 69.21], [69.0, 70.43], [72.0, 78.04], [81.0, 80.77], [86.0, 91.05], [92.0, 93.53], [94.0, 96.26], [99.0, 101.41], [103.0, 103.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 72.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 76.04, 0.0, 99.98, 0.0, 85.17, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.77, 4.47, -0.04, 1.19, 0.57, 0.77, -0.04, 0.85, 0.47, 4.21, 1.43, 6.04, -0.23, 5.05, 1.53, 2.26, 2.41, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/ef77ViM-f14_filtered.json b/annotations_filtered/ef77ViM-f14_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d916581b13bcaf0d80ee3b5a2dc5c387d25dd437 --- /dev/null +++ b/annotations_filtered/ef77ViM-f14_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.15], [21.0, 21.78], [26.0, 28.02], [40.0, 41.23], [42.0, 45.99], [54.0, 55.53], [64.0, 67.73], [69.0, 70.24], [71.0, 71.98], [73.0, 77.92], [79.0, 82.65], [96.0, 97.07], [110.0, 110.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.04, 0.0, 96.77, 0.0, 33.03, 0.0, 0.0, 37.54, 85.35, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 60.41], ["sidetone", 25.99], ["dial tone", 2.65]], null, null, [["speech", 72.65], ["sidetone", 16.09], ["telephone", 3.85]], null, null, null], "duration": [1.15, 0.78, 2.02, 1.23, 3.99, 1.53, 3.73, 1.24, 0.98, 4.92, 3.65, 1.07, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/ef7rQniaz5c_filtered.json b/annotations_filtered/ef7rQniaz5c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ff6f1d59e20e3b78024f237ab2e563223ee7879 --- /dev/null +++ b/annotations_filtered/ef7rQniaz5c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.24], [2.0, 3.64], [6.0, 6.47], [11.0, 12.72], [15.0, 16.34], [22.0, 22.23], [25.0, 26.42], [28.0, 31.13], [32.0, 33.56], [34.0, 34.74], [37.0, 39.77], [41.0, 45.99], [46.0, 50.25], [53.0, 56.59], [58.0, 59.56], [62.0, 62.8], [64.0, 64.98], [66.0, 68.4], [69.0, 70.14], [72.0, 79.27], [80.0, 83.1], [84.0, 86.66], [88.0, 99.32], [101.0, 115.86], [117.0, 122.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.13, 0.0, 0.0, 84.8, 99.98, 83.52, 96.29, 0.0, 0.0, 0.0, 73.82, 0.0, 99.97, 100.0, 77.03, 95.91, 83.7, 74.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, 1.64, 0.47, 1.72, 1.34, 0.23, 1.42, 3.13, 1.56, 0.74, 2.77, 4.99, 4.25, 3.59, 1.56, 0.8, 0.98, 2.4, 1.14, 7.27, 3.1, 2.66, 11.32, 14.86, 5.94]} \ No newline at end of file diff --git a/annotations_filtered/efNMnSL6Wlg_filtered.json b/annotations_filtered/efNMnSL6Wlg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..429ef5648c56dc4b5f64d6c743ab6f632428a3a6 --- /dev/null +++ b/annotations_filtered/efNMnSL6Wlg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.5], [4.0, 6.72], [7.0, 10.66], [11.0, 17.66], [18.0, 18.99], [20.0, 21.56], [23.0, 24.19], [31.0, 34.48], [36.0, 38.13], [39.0, 40.81], [43.0, 46.08], [47.0, 47.49], [49.0, 55.07], [56.0, 64.72], [69.0, 73.82], [74.0, 77.25], [79.0, 82.02], [85.0, 87.1], [88.0, 88.42], [89.0, 91.1], [91.0, 95.44], [97.0, 98.74], [102.0, 104.84], [106.0, 109.93], [114.0, 118.05], [120.0, 122.62], [124.0, 125.49], [127.0, 132.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 100.0, 99.94, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 100.0, 0.0, 100.0, 100.0, 100.0, 100.0, 100.0, 100.0, 0.0, 100.0, 99.98, 0.0, 100.0, 100.0, 100.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.5, 2.72, 3.66, 6.66, 0.99, 1.56, 1.19, 3.48, 2.13, 1.81, 3.08, 0.49, 6.07, 8.72, 4.82, 3.25, 3.02, 2.1, 0.42, 2.1, 4.44, 1.74, 2.84, 3.93, 4.05, 2.62, 1.49, 5.63]} \ No newline at end of file diff --git a/annotations_filtered/efkuXTpfxhc_filtered.json b/annotations_filtered/efkuXTpfxhc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b43e67bc40dc2dc788b11c5f89012637efde9c85 --- /dev/null +++ b/annotations_filtered/efkuXTpfxhc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.81], [13.0, 14.5], [18.0, 18.52], [22.0, 22.28], [24.0, 25.44], [26.0, 26.79], [31.0, 31.45], [40.0, 42.16], [43.0, 43.87], [45.0, 49.28], [54.0, 58.09], [59.0, 61.03], [63.0, 69.43], [70.0, 91.89], [92.0, 103.01], [105.0, 108.09], [111.0, 112.56], [116.0, 116.19], [118.0, 121.83], [122.0, 124.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.92, 0.0, 82.25, 57.81, 75.55, 87.37, 47.94, 40.09, 99.26, 0.0, 0.0, 82.07, 39.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 60.18], ["radio", 8.42], ["music", 3.84]], null, null, null, null, null, [["music", 46.55], ["effects unit", 5.9], ["mains hum", 4.71]], [["music", 60.63], ["effects unit", 11.34], ["guitar", 4.68]], null, null, null, null, [["music", 39.07], ["fart", 12.6], ["speech", 6.43]]], "duration": [1.81, 1.5, 0.52, 0.28, 1.44, 0.79, 0.45, 2.16, 0.87, 4.28, 4.09, 2.03, 6.43, 21.89, 11.01, 3.09, 1.56, 0.19, 3.83, 2.68]} \ No newline at end of file diff --git a/annotations_filtered/efqBAU-lT5Q_filtered.json b/annotations_filtered/efqBAU-lT5Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19225fea3baacd4dec12cacd07ea489be2aec3e9 --- /dev/null +++ b/annotations_filtered/efqBAU-lT5Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.23], [8.0, 7.97], [9.0, 10.67], [13.0, 13.27], [14.0, 30.38], [32.0, 38.28], [40.0, 41.47], [48.0, 49.6], [57.0, 58.78], [69.0, 70.16], [76.0, 77.26]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 45.14, 42.74, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 58.05], ["hum", 10.9], ["mains hum", 4.89]], [["speech", 42.89], ["hum", 15.0], ["mains hum", 8.14]], null, null, null, null, null], "duration": [0.23, -0.03, 1.67, 0.27, 16.38, 6.28, 1.47, 1.6, 1.78, 1.16, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/eg8WzaSrZpg_filtered.json b/annotations_filtered/eg8WzaSrZpg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c73494e2604208ba2f71549068033224a83e61b3 --- /dev/null +++ b/annotations_filtered/eg8WzaSrZpg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 39.95], [43.0, 84.23], [88.0, 101.44], [104.0, 105.58], [112.0, 113.56], [114.0, 117.15], [118.0, 117.98]], "keep_status": [false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 29.95, 0.0, 0.0, 29.89, 0.0], "audiomae_on_audioset": [null, null, [["music", 68.42], ["throbbing", 2.78], ["hum", 2.65]], null, null, [["hum", 21.25], ["throbbing", 21.17], ["music", 19.66]], null], "duration": [-0.05, 41.23, 13.44, 1.58, 1.56, 3.15, -0.02]} \ No newline at end of file diff --git a/annotations_filtered/egB-SG97EcI_filtered.json b/annotations_filtered/egB-SG97EcI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a1b487628f3f9932486111e7594c88083a567fe --- /dev/null +++ b/annotations_filtered/egB-SG97EcI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 4.55], [21.0, 20.87], [28.0, 28.61], [36.0, 36.53], [37.0, 41.86], [45.0, 45.57], [46.0, 55.11], [56.0, 56.15], [62.0, 73.82], [75.0, 75.25], [79.0, 80.37], [81.0, 82.43], [84.0, 83.83], [84.0, 85.48], [89.0, 90.05], [93.0, 93.55], [95.0, 95.66], [97.0, 98.76], [99.0, 100.4], [102.0, 106.0], [107.0, 108.23], [109.0, 109.51], [117.0, 118.4], [119.0, 121.54], [124.0, 123.63], [125.0, 126.86], [129.0, 129.96], [132.0, 132.02], [133.0, 135.65], [138.0, 139.33], [140.0, 142.91], [149.0, 150.04], [152.0, 152.54], [154.0, 155.55], [156.0, 156.57], [158.0, 158.57], [160.0, 160.32], [161.0, 161.32], [162.0, 171.36], [173.0, 173.96], [175.0, 175.32], [176.0, 181.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [81.17, 0.0, 0.0, 0.0, 84.43, 0.0, 66.88, 0.0, 68.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.28, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 96.54, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.72, 0.0, 0.0, 39.63], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["explosion", 38.59], ["burst, pop", 15.24], ["speech", 8.26]]], "duration": [4.55, -0.13, 0.61, 0.53, 4.86, 0.57, 9.11, 0.15, 11.82, 0.25, 1.37, 1.43, -0.17, 1.48, 1.05, 0.55, 0.66, 1.76, 1.4, 4.0, 1.23, 0.51, 1.4, 2.54, -0.37, 1.86, 0.96, 0.02, 2.65, 1.33, 2.91, 1.04, 0.54, 1.55, 0.57, 0.57, 0.32, 0.32, 9.36, 0.96, 0.32, 5.77]} \ No newline at end of file diff --git a/annotations_filtered/egTtyS-PlRM_filtered.json b/annotations_filtered/egTtyS-PlRM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d49cef1f9fd2ca47a404f2496c3b216c523432fe --- /dev/null +++ b/annotations_filtered/egTtyS-PlRM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.25], [12.0, 13.2], [15.0, 15.87], [18.0, 19.26], [21.0, 27.65], [32.0, 32.21], [40.0, 58.24], [60.0, 61.91], [64.0, 68.27], [71.0, 71.04], [71.0, 71.1], [85.0, 85.58], [91.0, 90.68], [91.0, 98.12], [104.0, 119.23], [122.0, 122.28], [126.0, 127.63], [128.0, 129.3], [131.0, 132.71], [135.0, 137.74], [139.0, 140.48], [154.0, 153.93], [166.0, 173.23]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [44.15, 0.0, 0.0, 0.0, 45.05, 0.0, 33.08, 0.0, 38.95, 0.0, 0.0, 0.0, 0.0, 34.84, 32.14, 0.0, 0.0, 0.0, 0.0, 81.53, 0.0, 0.0, 35.57], "audiomae_on_audioset": [[["music", 57.83], ["synthesizer", 7.37], ["musical instrument", 3.73]], null, null, null, [["music", 54.69], ["hum", 10.07], ["mains hum", 7.16]], null, [["music", 45.72], ["hum", 16.16], ["speech", 10.32]], null, [["music", 30.09], ["synthesizer", 10.75], ["speech", 6.3]], null, null, null, null, [["speech", 37.1], ["music", 21.23], ["fart", 5.73]], [["music", 53.74], ["speech", 12.29], ["didgeridoo", 8.46]], null, null, null, null, null, null, null, [["mains hum", 52.76], ["hum", 18.66], ["noise", 9.55]]], "duration": [2.25, 1.2, 0.87, 1.26, 6.65, 0.21, 18.24, 1.91, 4.27, 0.04, 0.1, 0.58, -0.32, 7.12, 15.23, 0.28, 1.63, 1.3, 1.71, 2.74, 1.48, -0.07, 7.23]} \ No newline at end of file diff --git a/annotations_filtered/egrmjjy2Pgo_filtered.json b/annotations_filtered/egrmjjy2Pgo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f7e009b58b72d25b2c839c0f99f0b458ebdfc22 --- /dev/null +++ b/annotations_filtered/egrmjjy2Pgo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 26.62], [28.0, 28.46], [30.0, 30.5], [31.0, 37.32], [38.0, 38.08], [39.0, 39.26], [40.0, 41.2], [42.0, 42.8], [44.0, 44.98], [46.0, 46.03], [48.0, 51.19], [52.0, 53.03], [54.0, 54.62], [58.0, 58.89], [60.0, 61.33], [63.0, 64.2], [66.0, 67.31], [68.0, 70.56], [71.0, 70.93], [72.0, 72.77], [74.0, 74.82], [78.0, 80.2], [81.0, 82.63], [83.0, 84.47], [85.0, 86.31], [87.0, 88.87], [90.0, 91.93], [95.0, 95.76], [97.0, 97.31], [100.0, 102.79], [107.0, 109.22]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [36.74, 0.0, 0.0, 50.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.87, 0.0, 0.0, 0.0, 68.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 47.94], "audiomae_on_audioset": [[["music", 40.09], ["speech", 25.03], ["didgeridoo", 3.51]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 21.73], ["speech", 10.4], ["musical instrument", 7.43]]], "duration": [10.62, 0.46, 0.5, 6.32, 0.08, 0.26, 1.2, 0.8, 0.98, 0.03, 3.19, 1.03, 0.62, 0.89, 1.33, 1.2, 1.31, 2.56, -0.07, 0.77, 0.82, 2.2, 1.63, 1.47, 1.31, 1.87, 1.93, 0.76, 0.31, 2.79, 2.22]} \ No newline at end of file diff --git a/annotations_filtered/egwR6gS9UMM_filtered.json b/annotations_filtered/egwR6gS9UMM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/egwR6gS9UMM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/eh3TXsx8B40_filtered.json b/annotations_filtered/eh3TXsx8B40_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41feaefdb1516a7bd8d503064b5be22eeb339acb --- /dev/null +++ b/annotations_filtered/eh3TXsx8B40_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.59], [14.0, 19.77], [23.0, 24.16], [27.0, 27.8], [33.0, 34.65], [38.0, 38.8], [43.0, 43.04], [49.0, 50.52], [58.0, 59.09], [70.0, 85.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [74.6, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["cheering", 32.55], ["crowd", 32.32], ["music", 9.93]]], "duration": [4.59, 5.77, 1.16, 0.8, 1.65, 0.8, 0.04, 1.52, 1.09, 15.13]} \ No newline at end of file diff --git a/annotations_filtered/ehNNyfvhcto_filtered.json b/annotations_filtered/ehNNyfvhcto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b30e97a39881728fccb1e6268d43699b7da3df76 --- /dev/null +++ b/annotations_filtered/ehNNyfvhcto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.2], [13.0, 14.67], [17.0, 48.74], [52.0, 52.27], [53.0, 54.78], [63.0, 64.49], [68.0, 68.64], [76.0, 77.25], [83.0, 83.37], [91.0, 92.3]], "keep_status": [true, false, false, false, false, false, false, false, false, false], "silence_prob": [31.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 31.11], ["music", 18.79], ["breaking", 8.72]], null, null, null, null, null, null, null, null, null], "duration": [4.2, 1.67, 31.74, 0.27, 1.78, 1.49, 0.64, 1.25, 0.37, 1.3]} \ No newline at end of file diff --git a/annotations_filtered/ehdAEyAGBEc_filtered.json b/annotations_filtered/ehdAEyAGBEc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f79f49cddc4ab96f69cf2c1315b0ca4ff8227741 --- /dev/null +++ b/annotations_filtered/ehdAEyAGBEc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.96], [5.0, 7.06], [7.0, 10.0], [11.0, 13.26], [14.0, 15.8], [16.0, 19.57], [21.0, 21.24], [25.0, 26.79], [30.0, 31.5], [33.0, 33.76], [34.0, 34.74], [35.0, 36.9], [38.0, 38.01], [38.0, 41.44], [43.0, 47.46], [49.0, 50.45], [52.0, 56.03], [57.0, 63.98], [65.0, 66.65], [68.0, 68.61], [70.0, 73.84], [75.0, 77.73], [78.0, 80.89], [82.0, 95.66], [99.0, 99.03], [101.0, 104.11], [105.0, 106.2], [107.0, 108.51], [111.0, 112.55], [113.0, 115.37], [116.0, 118.76], [120.0, 121.51], [122.0, 124.65], [126.0, 127.13], [128.0, 129.74]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 45.72, 41.93, 99.26, 0.0, 85.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.91, 99.99, 0.0, 78.72, 92.15, 0.0, 0.0, 100.0, 100.0, 55.81, 49.59, 0.0, 82.25, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 63.85, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 58.41], ["sine wave", 7.2], ["sidetone", 4.9]], [["speech", 57.37], ["stomach rumble", 5.86], ["synthesizer", 4.61]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.92], ["stomach rumble", 6.2], ["hum", 4.29]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.96, 2.06, 3.0, 2.26, 1.8, 3.57, 0.24, 1.79, 1.5, 0.76, 0.74, 1.9, 0.01, 3.44, 4.46, 1.45, 4.03, 6.98, 1.65, 0.61, 3.84, 2.73, 2.89, 13.66, 0.03, 3.11, 1.2, 1.51, 1.55, 2.37, 2.76, 1.51, 2.65, 1.13, 1.74]} \ No newline at end of file diff --git a/annotations_filtered/ei1tTWCrHqc_filtered.json b/annotations_filtered/ei1tTWCrHqc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca8a978cae23485837e4023d245f3ffd15cf6092 --- /dev/null +++ b/annotations_filtered/ei1tTWCrHqc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.6], [14.0, 16.41], [17.0, 17.63], [19.0, 18.93], [26.0, 26.65], [29.0, 28.85], [30.0, 29.88], [30.0, 31.02], [38.0, 37.98], [40.0, 46.16], [47.0, 48.12], [54.0, 54.4], [60.0, 60.39], [66.0, 76.98], [77.0, 79.37]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 99.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.47, 0.0, 0.0, 0.0, 37.19, 98.27], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["explosion", 19.19], ["burst, pop", 17.39], ["speech", 10.64]], null, null, null, [["music", 50.27], ["echo", 8.09], ["speech", 5.93]], null], "duration": [1.6, 2.41, 0.63, -0.07, 0.65, -0.15, -0.12, 1.02, -0.02, 6.16, 1.12, 0.4, 0.39, 10.98, 2.37]} \ No newline at end of file diff --git a/annotations_filtered/ei2dYpiS-Us_filtered.json b/annotations_filtered/ei2dYpiS-Us_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02d945fa935cec195142335de907641e9af1f13e --- /dev/null +++ b/annotations_filtered/ei2dYpiS-Us_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.56], [9.0, 9.14], [10.0, 10.49], [11.0, 12.01], [16.0, 16.63], [19.0, 20.19], [20.0, 20.8], [22.0, 23.11], [25.0, 28.09], [31.0, 56.49], [57.0, 59.81], [65.0, 70.73], [71.0, 70.93], [71.0, 76.0], [80.0, 80.3], [84.0, 84.27], [86.0, 88.4], [93.0, 95.72], [97.0, 97.6]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.68, 34.93, 85.54, 38.25, 0.0, 42.93, 0.0, 0.0, 42.19, 34.93, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 29.57], ["mains hum", 20.35], ["hum", 13.82]], [["hum", 45.32], ["mains hum", 20.79], ["music", 12.22]], null, [["music", 23.63], ["speech", 11.28], ["fly, housefly", 11.13]], null, [["music", 36.05], ["throbbing", 32.96], ["hum", 9.77]], null, null, [["music", 58.92], ["throbbing", 11.42], ["didgeridoo", 6.13]], [["music", 43.34], ["speech", 8.0], ["throbbing", 6.78]], null], "duration": [0.56, 0.14, 0.49, 1.01, 0.63, 1.19, 0.8, 1.11, 3.09, 25.49, 2.81, 5.73, -0.07, 5.0, 0.3, 0.27, 2.4, 2.72, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/eiKSmbxn4UY_filtered.json b/annotations_filtered/eiKSmbxn4UY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb714e9406fa0a8f4de1d37f2ee67c34825de0ed --- /dev/null +++ b/annotations_filtered/eiKSmbxn4UY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.02], [7.0, 7.13], [15.0, 18.0], [23.0, 23.13], [25.0, 25.69], [26.0, 30.64], [32.0, 32.56], [35.0, 34.94], [40.0, 41.1], [44.0, 44.69], [49.0, 51.33], [55.0, 56.93], [64.0, 68.0], [73.0, 73.62], [83.0, 85.9], [87.0, 86.98], [91.0, 92.4], [94.0, 94.2], [102.0, 102.37], [108.0, 108.9], [110.0, 111.6], [120.0, 121.69], [129.0, 128.7], [132.0, 139.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 75.55, 0.0, 0.0, 54.17, 0.0, 0.0, 0.0, 0.0, 78.38, 0.0, 33.21, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.72], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.73], ["grunt", 29.63], ["cattle, bovinae", 7.2]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.02, 0.13, 3.0, 0.13, 0.69, 4.64, 0.56, -0.06, 1.1, 0.69, 2.33, 1.93, 4.0, 0.62, 2.9, -0.02, 1.4, 0.2, 0.37, 0.9, 1.6, 1.69, -0.3, 7.83]} \ No newline at end of file diff --git a/annotations_filtered/eiLeBJUf1iE_filtered.json b/annotations_filtered/eiLeBJUf1iE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec2d2de23e8d999fcc0de91b43371cbcf6c4ba8d --- /dev/null +++ b/annotations_filtered/eiLeBJUf1iE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.02], [18.0, 19.79], [20.0, 20.7], [23.0, 23.26], [24.0, 29.94], [36.0, 37.22], [41.0, 41.4], [43.0, 43.01], [49.0, 54.33], [55.0, 55.38], [58.0, 57.96], [59.0, 61.65], [64.0, 65.21], [66.0, 90.39], [91.0, 128.38]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [69.2, 0.0, 0.0, 0.0, 36.55, 0.0, 0.0, 0.0, 35.46, 0.0, 0.0, 44.18, 0.0, 36.4, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 60.87], ["speech", 5.52], ["boing", 3.59]], null, null, null, [["music", 76.57], ["speech", 2.73], ["boing", 2.17]], null, null, [["music", 82.52], ["musical instrument", 2.98], ["guitar", 2.32]], null, [["music", 79.21], ["swing music", 2.39], ["funny music", 2.07]], null], "duration": [4.02, 1.79, 0.7, 0.26, 5.94, 1.22, 0.4, 0.01, 5.33, 0.38, -0.04, 2.65, 1.21, 24.39, 37.38]} \ No newline at end of file diff --git a/annotations_filtered/eiQD0Wk6Ekg_filtered.json b/annotations_filtered/eiQD0Wk6Ekg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd61ac23fef950fbfb90f9b260095750c2e1a2b2 --- /dev/null +++ b/annotations_filtered/eiQD0Wk6Ekg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.71], [5.0, 5.32], [6.0, 8.9], [13.0, 22.45], [24.0, 70.33], [71.0, 74.58], [75.0, 74.61], [75.0, 78.66], [79.0, 81.5]], "keep_status": [false, false, true, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 31.17, 31.4, 0.0, 34.53, 0.0, 54.1, 89.36], "audiomae_on_audioset": [null, null, [["music", 44.03], ["smash, crash", 8.47], ["speech", 3.24]], [["speech", 59.5], ["buzz", 4.95], ["machine gun", 3.18]], null, [["frog", 24.71], ["sidetone", 16.19], ["croak", 7.53]], null, null, null], "duration": [0.71, 0.32, 2.9, 9.45, 46.33, 3.58, -0.39, 3.66, 2.5]} \ No newline at end of file diff --git a/annotations_filtered/ej6dxNrh3Dc_filtered.json b/annotations_filtered/ej6dxNrh3Dc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86bf05e34deae8043a9ce554be2834697fe9b26e --- /dev/null +++ b/annotations_filtered/ej6dxNrh3Dc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 16.12], [22.0, 28.12], [29.0, 29.42], [31.0, 31.6], [32.0, 34.11], [38.0, 39.02], [39.0, 39.7], [40.0, 40.61], [44.0, 44.85], [50.0, 55.9], [59.0, 59.14], [61.0, 61.18], [64.0, 65.43], [73.0, 73.13], [74.0, 74.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [71.57, 40.01, 0.0, 0.0, 78.21, 0.0, 0.0, 0.0, 0.0, 92.31, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 66.6], ["inside, small room", 4.46], ["hum", 2.74]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.12, 6.12, 0.42, 0.6, 2.11, 1.02, 0.7, 0.61, 0.85, 5.9, 0.14, 0.18, 1.43, 0.13, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/ejD-W0F0hr8_filtered.json b/annotations_filtered/ejD-W0F0hr8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ecea21fc728383a77c7fc0264d3306dde7df817f --- /dev/null +++ b/annotations_filtered/ejD-W0F0hr8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.81], [23.0, 23.82], [24.0, 30.21], [31.0, 41.18], [44.0, 45.5], [47.0, 47.31], [48.0, 48.36], [49.0, 49.71], [51.0, 72.08], [73.0, 73.65], [74.0, 74.26], [79.0, 84.91], [86.0, 87.91], [89.0, 90.81], [92.0, 121.61], [122.0, 122.76], [125.0, 126.18], [127.0, 130.81], [133.0, 141.4], [146.0, 147.18], [147.0, 159.78]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 37.27, 94.81, 0.0, 0.0, 0.0, 0.0, 66.63, 0.0, 0.0, 78.04, 0.0, 0.0, 67.0, 0.0, 0.0, 46.36, 41.16, 0.0, 38.93], "audiomae_on_audioset": [null, null, [["speech", 25.52], ["fart", 9.46], ["throbbing", 7.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.36], ["theremin", 12.87], ["hum", 10.68]], [["music", 72.26], ["hum", 5.67], ["synthesizer", 4.0]], null, [["music", 56.53], ["speech", 32.29], ["fart", 1.56]]], "duration": [0.81, 0.82, 6.21, 10.18, 1.5, 0.31, 0.36, 0.71, 21.08, 0.65, 0.26, 5.91, 1.91, 1.81, 29.61, 0.76, 1.18, 3.81, 8.4, 1.18, 12.78]} \ No newline at end of file diff --git a/annotations_filtered/ejUWeYTslb0_filtered.json b/annotations_filtered/ejUWeYTslb0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c95f9a46e7efaa285fa5abadef6be385d1d0932 --- /dev/null +++ b/annotations_filtered/ejUWeYTslb0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.63], [5.0, 6.08], [8.0, 10.88], [28.0, 31.94], [33.0, 33.72], [41.0, 44.36], [47.0, 47.51], [49.0, 50.13], [53.0, 53.79], [55.0, 55.98], [62.0, 62.53], [65.0, 66.18], [71.0, 71.32], [73.0, 73.62], [78.0, 79.89], [81.0, 81.43], [82.0, 82.44], [84.0, 85.89], [92.0, 92.28], [95.0, 96.35], [100.0, 101.71], [103.0, 103.54], [105.0, 105.0], [106.0, 107.27], [113.0, 117.71], [122.0, 123.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [61.77, 0.0, 46.68, 69.07, 0.0, 94.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.81, 0.0], "audiomae_on_audioset": [null, null, [["speech", 46.86], ["sidetone", 24.62], ["dial tone", 8.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.63, 1.08, 2.88, 3.94, 0.72, 3.36, 0.51, 1.13, 0.79, 0.98, 0.53, 1.18, 0.32, 0.62, 1.89, 0.43, 0.44, 1.89, 0.28, 1.35, 1.71, 0.54, 0.0, 1.27, 4.71, 1.35]} \ No newline at end of file diff --git a/annotations_filtered/ek0jTQAdN8Y_filtered.json b/annotations_filtered/ek0jTQAdN8Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1bed3388e1d61ba283898087eb611cc99b17f5cb --- /dev/null +++ b/annotations_filtered/ek0jTQAdN8Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.78], [3.0, 4.09], [4.0, 5.78], [9.0, 8.94], [9.0, 10.35], [11.0, 12.07], [15.0, 17.14], [18.0, 18.37], [19.0, 19.94], [22.0, 24.93], [25.0, 27.09], [30.0, 30.94], [32.0, 32.91], [36.0, 37.49], [43.0, 43.39], [44.0, 50.48], [56.0, 58.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.64, 0.0, 0.0, 99.56, 91.98, 0.0, 0.0, 0.0, 0.0, 46.9, 38.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 30.77], ["music", 17.8], ["mains hum", 15.61]], [["hum", 39.08], ["mains hum", 22.27], ["throbbing", 7.13]]], "duration": [0.78, 1.09, 1.78, -0.06, 1.35, 1.07, 2.14, 0.37, 0.94, 2.93, 2.09, 0.94, 0.91, 1.49, 0.39, 6.48, 2.19]} \ No newline at end of file diff --git a/annotations_filtered/ekSSp-zvdgk_filtered.json b/annotations_filtered/ekSSp-zvdgk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad12f9dffd27adf73d0b01bbc97f2ec2e794c421 --- /dev/null +++ b/annotations_filtered/ekSSp-zvdgk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.88], [18.0, 18.01], [24.0, 23.85], [25.0, 28.78], [30.0, 30.37], [32.0, 50.31], [52.0, 115.15], [121.0, 120.93], [123.0, 130.59], [132.0, 132.68]], "keep_status": [false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 41.56, 0.0, 32.92, 0.0, 0.0, 47.16, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 47.94], ["sidetone", 17.01], ["radio", 15.26]], null, [["music", 32.94], ["throbbing", 28.05], ["hum", 22.12]], null, null, [["music", 28.64], ["didgeridoo", 22.21], ["speech", 10.65]], null], "duration": [1.88, 0.01, -0.15, 3.78, 0.37, 18.31, 63.15, -0.07, 7.59, 0.68]} \ No newline at end of file diff --git a/annotations_filtered/ekqjBZdbYJU_filtered.json b/annotations_filtered/ekqjBZdbYJU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fa45ede8110f320a477217b5a275e2da3cf1260 --- /dev/null +++ b/annotations_filtered/ekqjBZdbYJU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.13], [8.0, 9.26], [10.0, 11.84], [13.0, 15.16], [16.0, 17.41], [19.0, 26.25], [27.0, 35.87], [37.0, 37.99], [39.0, 40.53], [41.0, 57.65], [59.0, 70.51], [71.0, 80.2], [84.0, 83.86], [96.0, 97.78], [98.0, 101.75], [103.0, 105.48], [106.0, 106.56], [107.0, 107.62], [109.0, 109.43], [110.0, 110.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 60.89, 0.0, 50.86, 84.43, 0.0, 0.0, 91.81, 65.67, 30.66, 0.0, 0.0, 49.31, 58.64, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["explosion", 15.77], ["rumble", 12.29], ["whack, thwack", 11.87]], null, null, [["speech", 67.49], ["grunt", 5.43], ["animal", 4.31]], null, null, null, null, null], "duration": [0.13, 1.26, 1.84, 2.16, 1.41, 7.25, 8.87, 0.99, 1.53, 16.65, 11.51, 9.2, -0.14, 1.78, 3.75, 2.48, 0.56, 0.62, 0.43, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/elcYyXvJF7U_filtered.json b/annotations_filtered/elcYyXvJF7U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36d4d1cc5034a882e46cd49274ddb691e90a4907 --- /dev/null +++ b/annotations_filtered/elcYyXvJF7U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.62], [12.0, 146.35]], "keep_status": [false, false], "silence_prob": [32.0, 0.0], "audiomae_on_audioset": [[["speech", 38.25], ["music", 29.52], ["sonar", 7.81]], null], "duration": [5.62, 134.35]} \ No newline at end of file diff --git a/annotations_filtered/elmk8Hsbw_0_filtered.json b/annotations_filtered/elmk8Hsbw_0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f5154bd215bbeb0f8ce5cbc90dbeff9571e1543 --- /dev/null +++ b/annotations_filtered/elmk8Hsbw_0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.98], [7.0, 7.18], [10.0, 10.12], [16.0, 15.97], [17.0, 17.56], [18.0, 19.85], [20.0, 21.07], [23.0, 24.54], [27.0, 27.78], [29.0, 29.35], [39.0, 39.75], [41.0, 41.89], [43.0, 43.68], [45.0, 46.16], [49.0, 51.8], [54.0, 55.21], [58.0, 58.7], [59.0, 60.03], [60.0, 60.12], [60.0, 60.49], [66.0, 72.05], [83.0, 84.25], [89.0, 88.8], [90.0, 89.99], [90.0, 91.02], [92.0, 93.9], [95.0, 95.55], [97.0, 101.44], [103.0, 105.73], [106.0, 107.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.47, 0.0, 0.0, 0.0, 0.0, 0.0, 30.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.37, 55.11, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 51.72], ["electronic music", 8.41], ["hum", 4.47]], null, null, null, null, null, [["speech", 37.92], ["music", 27.14], ["fly, housefly", 3.63]], null, null, null, null, null, null, null, null, null], "duration": [0.98, 0.18, 0.12, -0.03, 0.56, 1.85, 1.07, 1.54, 0.78, 0.35, 0.75, 0.89, 0.68, 1.16, 2.8, 1.21, 0.7, 1.03, 0.12, 0.49, 6.05, 1.25, -0.2, -0.01, 1.02, 1.9, 0.55, 4.44, 2.73, 1.62]} \ No newline at end of file diff --git a/annotations_filtered/elpUGB9Ap1Y_filtered.json b/annotations_filtered/elpUGB9Ap1Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..532448da6a841820dade7ba5b34395fb6d2e91db --- /dev/null +++ b/annotations_filtered/elpUGB9Ap1Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.6], [10.0, 10.54], [12.0, 27.13], [35.0, 48.61], [51.0, 65.87], [70.0, 78.33], [78.0, 85.67], [92.0, 97.12], [100.0, 100.16]], "keep_status": [false, false, false, true, true, true, true, false, false], "silence_prob": [0.0, 0.0, 29.4, 29.56, 29.8, 29.77, 29.74, 30.71, 0.0], "audiomae_on_audioset": [null, null, [["music", 35.1], ["hum", 19.61], ["throbbing", 15.62]], [["speech", 43.8], ["music", 12.18], ["aircraft", 9.61]], [["vehicle", 19.66], ["music", 18.64], ["aircraft", 5.31]], [["music", 40.67], ["insect", 10.26], ["fly, housefly", 10.24]], [["speech", 39.79], ["music", 18.17], ["vehicle", 7.72]], [["music", 73.18], ["throbbing", 8.33], ["hum", 3.84]], null], "duration": [1.6, 0.54, 15.13, 13.61, 14.87, 8.33, 7.67, 5.12, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/elwNOiCaRIs_filtered.json b/annotations_filtered/elwNOiCaRIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3db5c4da7d5205c8862962e2d0585980df0a2d68 --- /dev/null +++ b/annotations_filtered/elwNOiCaRIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 117.56]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [110.56]} \ No newline at end of file diff --git a/annotations_filtered/em7EcaXPJF8_filtered.json b/annotations_filtered/em7EcaXPJF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6fa9978a7916a59fdb5abc8a64750022b519cf23 --- /dev/null +++ b/annotations_filtered/em7EcaXPJF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 24.38], [25.0, 25.69], [27.0, 27.65], [29.0, 29.08], [31.0, 34.67]], "keep_status": [false, false, false, false, false], "silence_prob": [68.41, 0.0, 0.0, 0.0, 61.37], "audiomae_on_audioset": [null, null, null, null, null], "duration": [24.38, 0.69, 0.65, 0.08, 3.67]} \ No newline at end of file diff --git a/annotations_filtered/em9lziI07M4_filtered.json b/annotations_filtered/em9lziI07M4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b756ab977f3698f3c49f64a3702ac7b48cb6cd8 --- /dev/null +++ b/annotations_filtered/em9lziI07M4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 43.98], [46.0, 65.45], [70.0, 108.75], [112.0, 127.2], [136.0, 136.54], [158.0, 162.23], [163.0, 179.69]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [0.0, 30.84, 0.0, 31.99, 0.0, 74.29, 30.53], "audiomae_on_audioset": [null, [["music", 67.11], ["electronic music", 3.01], ["throbbing", 2.21]], null, [["music", 68.48], ["sampler", 3.12], ["electronic music", 2.87]], null, null, [["animal", 35.71], ["whale vocalization", 8.55], ["howl", 7.25]]], "duration": [31.98, 19.45, 38.75, 15.2, 0.54, 4.23, 16.69]} \ No newline at end of file diff --git a/annotations_filtered/emVaK5MoPBg_filtered.json b/annotations_filtered/emVaK5MoPBg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8097995b890224225b20a8d36c784459a7f0f701 --- /dev/null +++ b/annotations_filtered/emVaK5MoPBg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 12.82], [15.0, 15.87], [24.0, 24.11], [25.0, 25.14], [26.0, 26.38], [27.0, 27.31], [28.0, 28.19], [33.0, 33.64], [35.0, 34.96], [36.0, 36.09], [37.0, 37.08], [38.0, 38.16], [39.0, 38.91], [41.0, 41.27], [42.0, 42.23], [47.0, 47.88], [48.0, 48.84], [49.0, 49.77], [50.0, 50.92], [51.0, 51.9], [67.0, 68.39], [80.0, 80.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [81.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.82, 0.87, 0.11, 0.14, 0.38, 0.31, 0.19, 0.64, -0.04, 0.09, 0.08, 0.16, -0.09, 0.27, 0.23, 0.88, 0.84, 0.77, 0.92, 0.9, 1.39, 0.15]} \ No newline at end of file diff --git a/annotations_filtered/emW6TopzEe0_filtered.json b/annotations_filtered/emW6TopzEe0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e89fe85603804aaf46cd86767928c9c4271c93e --- /dev/null +++ b/annotations_filtered/emW6TopzEe0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[123.0, 130.55], [134.0, 152.17]], "keep_status": [true, false], "silence_prob": [34.75, 30.32], "audiomae_on_audioset": [[["music", 25.31], ["animal", 9.03], ["breaking", 7.16]], [["music", 54.02], ["speech", 14.7], ["throbbing", 7.68]]], "duration": [7.55, 18.17]} \ No newline at end of file diff --git a/annotations_filtered/emW6qKMxIUU_filtered.json b/annotations_filtered/emW6qKMxIUU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3e059e1eb140a948c33c92dea8f7e8799379e6c --- /dev/null +++ b/annotations_filtered/emW6qKMxIUU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 88.94], [90.0, 99.0]], "keep_status": [false, false], "silence_prob": [0.0, 28.98], "audiomae_on_audioset": [null, [["music", 59.45], ["throbbing", 15.23], ["hum", 4.91]]], "duration": [58.94, 9.0]} \ No newline at end of file diff --git a/annotations_filtered/emnU7uOpYtk_filtered.json b/annotations_filtered/emnU7uOpYtk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..173c3493e8daf67fecb4330a768cf8186745fa52 --- /dev/null +++ b/annotations_filtered/emnU7uOpYtk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.86], [9.0, 9.68], [10.0, 10.99], [13.0, 13.71], [33.0, 33.83], [49.0, 54.73], [61.0, 62.67], [78.0, 80.42], [84.0, 84.25], [90.0, 91.76], [95.0, 97.01], [98.0, 99.37], [101.0, 102.0], [122.0, 122.74], [126.0, 126.42], [132.0, 132.78], [138.0, 138.48], [150.0, 151.38], [168.0, 169.69], [171.0, 172.44], [174.0, 174.77], [175.0, 175.61]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 37.1, 0.0, 99.99, 0.0, 0.0, 82.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 30.45], ["explosion", 16.28], ["music", 9.87]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.86, 0.68, 0.99, 0.71, 0.83, 5.73, 1.67, 2.42, 0.25, 1.76, 2.01, 1.37, 1.0, 0.74, 0.42, 0.78, 0.48, 1.38, 1.69, 1.44, 0.77, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/enG1CfTbT08_filtered.json b/annotations_filtered/enG1CfTbT08_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60f025edf198c02a83119d173ea3b611ed361236 --- /dev/null +++ b/annotations_filtered/enG1CfTbT08_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[61.0, 100.26], [103.0, 103.86], [107.0, 119.67], [121.0, 123.92], [125.0, 126.3], [128.0, 130.28], [132.0, 134.18]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 44.46, 79.24, 0.0, 76.37, 82.43], "audiomae_on_audioset": [null, null, [["sidetone", 19.67], ["busy signal", 18.54], ["speech", 11.85]], null, null, null, null], "duration": [39.26, 0.86, 12.67, 2.92, 1.3, 2.28, 2.18]} \ No newline at end of file diff --git a/annotations_filtered/enJJeOqHbqE_filtered.json b/annotations_filtered/enJJeOqHbqE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18bb908b78b0abb12dd46430238ef96c9949540c --- /dev/null +++ b/annotations_filtered/enJJeOqHbqE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.05], [7.0, 6.78], [7.0, 8.18], [10.0, 11.72], [16.0, 16.02], [17.0, 17.22], [22.0, 23.21], [31.0, 32.66], [34.0, 33.61], [34.0, 33.66], [35.0, 35.56], [36.0, 49.54], [51.0, 57.48], [67.0, 69.33], [82.0, 83.44], [88.0, 88.67], [91.0, 91.59], [97.0, 103.08], [106.0, 107.2], [108.0, 137.37], [138.0, 138.45], [140.0, 139.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.8, 30.28, 48.74, 0.0, 0.0, 0.0, 32.09, 0.0, 33.24, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 68.03], ["speech", 16.62], ["boing", 1.29]], [["music", 51.77], ["speech", 31.22], ["boing", 2.33]], [["frog", 27.35], ["cattle, bovinae", 11.02], ["animal", 9.67]], null, null, null, [["music", 80.67], ["musical instrument", 4.28], ["didgeridoo", 1.98]], null, [["music", 76.24], ["speech", 7.05], ["didgeridoo", 2.96]], null, null], "duration": [1.05, -0.22, 1.18, 1.72, 0.02, 0.22, 1.21, 1.66, -0.39, -0.34, 0.56, 13.54, 6.48, 2.33, 1.44, 0.67, 0.59, 6.08, 1.2, 29.37, 0.45, -0.25]} \ No newline at end of file diff --git a/annotations_filtered/enLijb7P9tg_filtered.json b/annotations_filtered/enLijb7P9tg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5a03b36f9ac236d87d45ee035b741a626597006 --- /dev/null +++ b/annotations_filtered/enLijb7P9tg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.08], [4.0, 5.97], [7.0, 8.48], [10.0, 11.16], [18.0, 18.94], [21.0, 22.05], [23.0, 23.38], [24.0, 24.73], [26.0, 26.35], [29.0, 29.24], [30.0, 32.12], [34.0, 34.96], [37.0, 38.06], [40.0, 40.91], [42.0, 46.68], [49.0, 50.21], [54.0, 55.95], [60.0, 61.99], [63.0, 63.9], [65.0, 66.8], [68.0, 68.0], [75.0, 74.7], [76.0, 77.3], [80.0, 80.86], [82.0, 86.91], [89.0, 90.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0, 87.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.08, 1.97, 1.48, 1.16, 0.94, 1.05, 0.38, 0.73, 0.35, 0.24, 2.12, 0.96, 1.06, 0.91, 4.68, 1.21, 1.95, 1.99, 0.9, 1.8, 0.0, -0.3, 1.3, 0.86, 4.91, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/enNm82zd1Ho_filtered.json b/annotations_filtered/enNm82zd1Ho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e966248680d9d83b65499b6159ee86346b29b852 --- /dev/null +++ b/annotations_filtered/enNm82zd1Ho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.52], [7.0, 25.56], [29.0, 31.36], [33.0, 39.99], [41.0, 42.04], [45.0, 45.55], [46.0, 76.4], [79.0, 79.54], [81.0, 104.43], [105.0, 111.91], [112.0, 114.51], [116.0, 117.07], [118.0, 119.7], [121.0, 123.13], [125.0, 128.01], [129.0, 129.3], [131.0, 130.62], [134.0, 134.01], [137.0, 137.27], [138.0, 139.87], [141.0, 143.43], [144.0, 146.23], [151.0, 173.06], [174.0, 174.31], [176.0, 175.96]], "keep_status": [false, true, false, true, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 28.9, 29.12, 29.57, 0.0, 0.0, 0.0, 0.0, 29.76, 33.15, 36.16, 0.0, 0.0, 38.19, 40.88, 0.0, 0.0, 0.0, 0.0, 0.0, 63.42, 55.53, 29.55, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 33.23], ["music", 15.14], ["fart", 12.14]], [["music", 60.44], ["hum", 9.36], ["throbbing", 7.53]], [["music", 25.2], ["throbbing", 20.44], ["hum", 16.93]], null, null, null, null, [["music", 53.14], ["buzz", 13.32], ["mains hum", 10.25]], [["speech", 59.5], ["music", 10.73], ["synthesizer", 3.71]], [["speech", 21.48], ["mains hum", 14.95], ["music", 13.8]], null, null, [["music", 30.52], ["electronic music", 11.21], ["hum", 4.62]], [["music", 17.75], ["speech", 12.97], ["mains hum", 9.34]], null, null, null, null, null, null, null, [["music", 54.9], ["speech", 16.39], ["groan", 10.3]], null, null], "duration": [-0.48, 18.56, 2.36, 6.99, 1.04, 0.55, 30.4, 0.54, 23.43, 6.91, 2.51, 1.07, 1.7, 2.13, 3.01, 0.3, -0.38, 0.01, 0.27, 1.87, 2.43, 2.23, 22.06, 0.31, -0.04]} \ No newline at end of file diff --git a/annotations_filtered/ena0xfW0_Lo_filtered.json b/annotations_filtered/ena0xfW0_Lo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0982f63c1fac5f8b068d4bd4c7112cc99f7b5c8b --- /dev/null +++ b/annotations_filtered/ena0xfW0_Lo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 33.91], [37.0, 47.56], [50.0, 51.73], [56.0, 102.3], [105.0, 105.73], [108.0, 127.85]], "keep_status": [false, true, false, false, false, false], "silence_prob": [30.65, 30.84, 0.0, 0.0, 0.0, 31.66], "audiomae_on_audioset": [[["cattle, bovinae", 43.75], ["livestock, farm animals, working animals", 25.03], ["moo", 16.91]], [["artillery fire", 32.39], ["speech", 17.36], ["gunshot, gunfire", 14.36]], null, null, null, [["whale vocalization", 42.36], ["livestock, farm animals, working animals", 22.6], ["animal", 7.94]]], "duration": [18.91, 10.56, 1.73, 46.3, 0.73, 19.85]} \ No newline at end of file diff --git a/annotations_filtered/engSFG20kaA_filtered.json b/annotations_filtered/engSFG20kaA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6314f7d226a00bcd2e8dd4bf4f20c03c615a326 --- /dev/null +++ b/annotations_filtered/engSFG20kaA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.4], [20.0, 38.69], [45.0, 45.17], [48.0, 86.73], [91.0, 90.75], [93.0, 150.72], [152.0, 152.27]], "keep_status": [false, true, false, false, false, false, false], "silence_prob": [0.0, 35.74, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 40.25], ["hum", 15.71], ["throbbing", 7.89]], null, null, null, null, null], "duration": [0.4, 18.69, 0.17, 38.73, -0.25, 57.72, 0.27]} \ No newline at end of file diff --git a/annotations_filtered/eo6MfN5Lcws_filtered.json b/annotations_filtered/eo6MfN5Lcws_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76fea9a1651d314ddfe9a42722d5fc514b54c4bc --- /dev/null +++ b/annotations_filtered/eo6MfN5Lcws_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 12.85], [13.0, 22.23], [22.0, 22.45], [23.0, 43.73], [46.0, 67.81], [70.0, 70.5], [71.0, 80.86], [82.0, 85.85], [87.0, 99.69], [106.0, 106.0], [107.0, 106.93], [109.0, 120.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 82.79, 0.0, 77.2, 35.98, 0.0, 32.67, 100.0, 100.0, 0.0, 0.0, 63.42], "audiomae_on_audioset": [null, null, null, null, [["music", 60.88], ["theremin", 8.47], ["musical instrument", 3.23]], null, [["shofar", 46.4], ["wind instrument, woodwind instrument", 31.18], ["mosquito", 12.44]], null, null, null, null, null], "duration": [-0.15, 9.23, 0.45, 20.73, 21.81, 0.5, 9.86, 3.85, 12.69, 0.0, -0.07, 11.29]} \ No newline at end of file diff --git a/annotations_filtered/eoREjwjeH30_filtered.json b/annotations_filtered/eoREjwjeH30_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c887436f625f56a59c330b116e599b971afcd5d --- /dev/null +++ b/annotations_filtered/eoREjwjeH30_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.97], [5.0, 36.0], [53.0, 53.81], [54.0, 54.58], [55.0, 56.24], [59.0, 59.75], [75.0, 75.68], [78.0, 79.37], [95.0, 96.09], [107.0, 107.5], [108.0, 108.89], [117.0, 130.35], [130.0, 130.38], [130.0, 130.45], [130.0, 130.49], [131.0, 130.52], [131.0, 146.75], [150.0, 164.51], [167.0, 188.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.17, 0.0, 0.0, 0.0, 0.0, 30.63, 31.39, 34.39], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 37.68], ["boing", 6.65], ["livestock, farm animals, working animals", 3.89]], null, null, null, null, [["music", 58.09], ["speech", 15.1], ["boing", 7.88]], [["music", 40.14], ["speech", 19.52], ["groan", 3.61]], [["music", 75.91], ["electronic music", 4.52], ["synthesizer", 2.63]]], "duration": [2.97, 31.0, 0.81, 0.58, 1.24, 0.75, 0.68, 1.37, 1.09, 0.5, 0.89, 13.35, 0.38, 0.45, 0.49, -0.48, 15.75, 14.51, 21.72]} \ No newline at end of file diff --git a/annotations_filtered/eoffuyXUhLs_filtered.json b/annotations_filtered/eoffuyXUhLs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28d925c3f4757a1217fb3f12ce0d3bf1e9de9419 --- /dev/null +++ b/annotations_filtered/eoffuyXUhLs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.48], [8.0, 12.63], [13.0, 12.66], [13.0, 12.7], [13.0, 12.73], [13.0, 12.77], [13.0, 12.8], [13.0, 12.83], [13.0, 12.87], [15.0, 66.61], [69.0, 72.87], [73.0, 76.38], [80.0, 82.98], [84.0, 84.84], [87.0, 88.03], [88.0, 90.07], [92.0, 106.17], [111.0, 135.09], [136.0, 138.43], [139.0, 140.09], [141.0, 147.92], [149.0, 156.47], [157.0, 157.74], [163.0, 163.04]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, true, false, true, false, false, false], "silence_prob": [0.0, 29.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.08, 52.8, 71.0, 0.0, 0.0, 56.86, 42.76, 40.97, 36.89, 0.0, 31.79, 40.66, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 13.92], ["rumble", 11.67], ["hum", 10.97]], null, null, null, null, null, null, null, null, [["music", 13.62], ["singing bowl", 11.92], ["speech", 9.84]], null, null, null, null, null, [["speech", 48.15], ["music", 22.02], ["sonar", 16.62]], [["music", 26.9], ["speech", 19.46], ["electronic music", 8.3]], [["whale vocalization", 41.31], ["music", 13.1], ["hum", 4.93]], null, [["speech", 48.5], ["hum", 14.14], ["music", 7.26]], [["music", 43.73], ["hum", 23.69], ["mains hum", 12.1]], null, null], "duration": [0.48, 4.63, -0.34, -0.3, -0.27, -0.23, -0.2, -0.17, -0.13, 51.61, 3.87, 3.38, 2.98, 0.84, 1.03, 2.07, 14.17, 24.09, 2.43, 1.09, 6.92, 7.47, 0.74, 0.04]} \ No newline at end of file diff --git a/annotations_filtered/eolBcBPpwyE_filtered.json b/annotations_filtered/eolBcBPpwyE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..784a22b70b2fe5dce50565145c559bf89b7bdc35 --- /dev/null +++ b/annotations_filtered/eolBcBPpwyE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.73], [21.0, 27.45], [32.0, 33.03], [34.0, 40.95], [43.0, 44.05], [47.0, 47.17], [52.0, 52.73], [54.0, 55.12]], "keep_status": [true, true, false, false, false, false, false, false], "silence_prob": [33.13, 32.64, 0.0, 29.09, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["whale vocalization", 32.04], ["cattle, bovinae", 19.98], ["moo", 14.05]], [["music", 42.72], ["theremin", 16.57], ["didgeridoo", 8.98]], null, [["music", 86.8], ["electronic music", 2.38], ["musical instrument", 1.01]], null, null, null, null], "duration": [4.73, 6.45, 1.03, 6.95, 1.05, 0.17, 0.73, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/ep-ieEG06qg_filtered.json b/annotations_filtered/ep-ieEG06qg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f59f1470e7b735e7e7fc8833daa5704b1b180cc3 --- /dev/null +++ b/annotations_filtered/ep-ieEG06qg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.91], [7.0, 7.28], [7.0, 7.5], [16.0, 17.22], [18.0, 19.26], [19.0, 20.12], [21.0, 21.42], [30.0, 30.32], [38.0, 39.78], [44.0, 44.1], [45.0, 45.64], [47.0, 47.36], [52.0, 54.09], [57.0, 57.2], [59.0, 59.43], [63.0, 64.72], [71.0, 74.07], [75.0, 75.84], [78.0, 79.05], [82.0, 82.56], [84.0, 84.96], [86.0, 86.43], [90.0, 92.72], [93.0, 95.64], [96.0, 98.29], [103.0, 104.4], [107.0, 111.54], [114.0, 116.16], [117.0, 117.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0, 88.1, 83.52, 99.76, 0.0, 99.99, 99.99, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.91, 0.28, 0.5, 1.22, 1.26, 1.12, 0.42, 0.32, 1.78, 0.1, 0.64, 0.36, 2.09, 0.2, 0.43, 1.72, 3.07, 0.84, 1.05, 0.56, 0.96, 0.43, 2.72, 2.64, 2.29, 1.4, 4.54, 2.16, 0.15]} \ No newline at end of file diff --git a/annotations_filtered/epBGWHCrfr4_filtered.json b/annotations_filtered/epBGWHCrfr4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..092e27501871afc106e8a72a896d2325a74ae7c7 --- /dev/null +++ b/annotations_filtered/epBGWHCrfr4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.05], [5.0, 5.17], [6.0, 12.5], [24.0, 42.38], [44.0, 43.95], [49.0, 50.85], [57.0, 63.71], [65.0, 66.77], [68.0, 68.15], [71.0, 73.25], [83.0, 92.57], [94.0, 94.27], [95.0, 97.8]], "keep_status": [false, false, true, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 31.68, 36.46, 0.0, 0.0, 34.34, 0.0, 0.0, 33.71, 32.35, 0.0, 33.16], "audiomae_on_audioset": [null, null, [["music", 15.93], ["speech", 15.57], ["mains hum", 13.12]], [["mains hum", 33.23], ["hum", 32.61], ["music", 18.54]], null, null, [["cattle, bovinae", 29.5], ["moo", 23.72], ["livestock, farm animals, working animals", 16.1]], null, null, [["speech", 14.95], ["hum", 10.55], ["sidetone", 10.36]], [["music", 47.31], ["throbbing", 14.18], ["hum", 9.55]], null, [["mains hum", 53.32], ["hum", 37.12], ["music", 1.76]]], "duration": [1.05, 0.17, 6.5, 18.38, -0.05, 1.85, 6.71, 1.77, 0.15, 2.25, 9.57, 0.27, 2.8]} \ No newline at end of file diff --git a/annotations_filtered/epHCMiCtt3M_filtered.json b/annotations_filtered/epHCMiCtt3M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9811bd8b8670b89f21db584829c3dfed3b9efaa --- /dev/null +++ b/annotations_filtered/epHCMiCtt3M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.18], [14.0, 14.08], [19.0, 19.08], [22.0, 22.35], [23.0, 24.07], [26.0, 26.49], [38.0, 38.8], [41.0, 42.77], [43.0, 44.22], [54.0, 54.63], [61.0, 61.16], [68.0, 68.93], [75.0, 75.68], [77.0, 78.0], [79.0, 80.01], [81.0, 82.88], [105.0, 106.66], [109.0, 110.59], [113.0, 113.98], [114.0, 117.76]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [42.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.81], "audiomae_on_audioset": [[["music", 50.03], ["synthesizer", 7.32], ["musical instrument", 4.21]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.52], ["didgeridoo", 30.44], ["musical instrument", 3.49]]], "duration": [3.18, 0.08, 0.08, 0.35, 1.07, 0.49, 0.8, 1.77, 1.22, 0.63, 0.16, 0.93, 0.68, 1.0, 1.01, 1.88, 1.66, 1.59, 0.98, 3.76]} \ No newline at end of file diff --git a/annotations_filtered/epupZLvDDts_filtered.json b/annotations_filtered/epupZLvDDts_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f83a107cfefed98c733d12efb32af925ddd4409 --- /dev/null +++ b/annotations_filtered/epupZLvDDts_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.41], [6.0, 7.52], [10.0, 21.12], [22.0, 40.63], [42.0, 43.14], [45.0, 47.01], [49.0, 50.5], [51.0, 55.65], [59.0, 94.53], [95.0, 99.27], [100.0, 101.41], [102.0, 104.14], [106.0, 112.16], [113.0, 128.49], [129.0, 130.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [84.43, 0.0, 53.59, 96.66, 0.0, 100.0, 0.0, 100.0, 0.0, 100.0, 0.0, 100.0, 99.1, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.41, 1.52, 11.12, 18.63, 1.14, 2.01, 1.5, 4.65, 35.53, 4.27, 1.41, 2.14, 6.16, 15.49, 1.98]} \ No newline at end of file diff --git a/annotations_filtered/eq3-F_738gA_filtered.json b/annotations_filtered/eq3-F_738gA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2eee03ef33c0e7635b36944c9cd9578c7eb5add7 --- /dev/null +++ b/annotations_filtered/eq3-F_738gA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.36], [0.0, 0.43], [0.0, 0.5], [3.0, 4.16], [5.0, 6.37], [7.0, 8.14], [11.0, 11.74], [13.0, 14.34], [17.0, 17.56], [28.0, 29.17], [33.0, 33.25], [35.0, 35.18], [37.0, 37.56], [52.0, 53.18], [53.0, 54.73], [56.0, 56.89], [60.0, 61.01], [64.0, 66.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 73.87], ["speech", 3.49], ["synthesizer", 3.2]]], "duration": [0.36, 0.43, 0.5, 1.16, 1.37, 1.14, 0.74, 1.34, 0.56, 1.17, 0.25, 0.18, 0.56, 1.18, 1.73, 0.89, 1.01, 2.02]} \ No newline at end of file diff --git a/annotations_filtered/eq3vD93GgLs_filtered.json b/annotations_filtered/eq3vD93GgLs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11ade6fc935cfefb35aa00789ba9691a6e3eb02f --- /dev/null +++ b/annotations_filtered/eq3vD93GgLs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.49], [12.0, 12.29], [13.0, 13.91], [18.0, 20.39], [21.0, 23.41], [26.0, 26.25], [35.0, 35.75], [38.0, 45.22], [46.0, 46.74], [49.0, 49.69], [52.0, 109.63]], "keep_status": [false, false, false, true, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 40.02, 38.16, 0.0, 0.0, 32.37, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 56.37], ["didgeridoo", 7.36], ["musical instrument", 5.59]], [["music", 45.83], ["hum", 2.54], ["musical instrument", 2.45]], null, null, [["speech", 45.44], ["rumble", 13.62], ["music", 10.65]], null, null, null], "duration": [0.49, 0.29, 0.91, 2.39, 2.41, 0.25, 0.75, 7.22, 0.74, 0.69, 57.63]} \ No newline at end of file diff --git a/annotations_filtered/eq5NSAyQEtI_filtered.json b/annotations_filtered/eq5NSAyQEtI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d4eec7620683f94397fafa913d89b94119b3468 --- /dev/null +++ b/annotations_filtered/eq5NSAyQEtI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.93], [9.0, 8.78], [10.0, 10.45], [12.0, 12.02], [14.0, 14.15], [18.0, 18.6], [21.0, 21.54], [23.0, 26.92], [29.0, 29.73], [30.0, 32.98], [34.0, 38.38], [40.0, 40.64], [44.0, 46.23], [49.0, 50.3], [52.0, 54.36], [56.0, 56.89], [58.0, 69.7], [72.0, 72.86], [74.0, 75.68], [79.0, 80.76], [84.0, 89.48], [93.0, 95.55], [97.0, 102.95], [103.0, 103.45], [103.0, 113.58], [115.0, 119.57], [123.0, 125.12], [127.0, 130.65], [132.0, 133.25], [137.0, 140.21], [143.0, 151.6], [154.0, 160.57], [161.0, 164.0], [167.0, 168.29]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, true, false, true, false, false, false, false, false, true, true, false, false, false, true, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.27, 0.0, 34.12, 34.2, 0.0, 41.81, 0.0, 49.4, 0.0, 33.84, 0.0, 0.0, 0.0, 39.78, 31.0, 29.94, 0.0, 29.93, 30.28, 30.48, 30.42, 0.0, 30.04, 31.18, 32.74, 32.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["burst, pop", 12.12], ["arrow", 11.67], ["gunshot, gunfire", 11.57]], null, [["music", 28.11], ["gong", 16.68], ["speech", 9.25]], [["music", 65.51], ["musical instrument", 6.2], ["guitar", 5.19]], null, [["music", 25.84], ["finger snapping", 18.97], ["synthesizer", 8.51]], null, [["music", 27.29], ["speech", 21.86], ["theremin", 13.14]], null, [["speech", 56.33], ["music", 11.75], ["hum", 10.18]], null, null, null, [["bee, wasp, etc.", 10.26], ["fly, housefly", 7.38], ["noise", 6.99]], [["music", 32.68], ["musical instrument", 10.57], ["speech", 6.84]], [["music", 59.34], ["effects unit", 9.97], ["musical instrument", 6.56]], null, [["music", 61.59], ["musical instrument", 8.87], ["guitar", 4.47]], [["music", 41.59], ["musical instrument", 9.47], ["theremin", 7.93]], [["music", 38.73], ["didgeridoo", 13.18], ["guitar", 7.7]], [["speech", 49.92], ["music", 15.11], ["didgeridoo", 9.9]], null, [["speech", 58.45], ["music", 12.36], ["vehicle", 4.07]], [["music", 70.92], ["speech", 9.41], ["dog", 2.24]], [["speech", 27.3], ["music", 25.27], ["theremin", 6.03]], [["music", 63.4], ["musical instrument", 7.64], ["theremin", 4.11]], null], "duration": [0.93, -0.22, 0.45, 0.02, 0.15, 0.6, 0.54, 3.92, 0.73, 2.98, 4.38, 0.64, 2.23, 1.3, 2.36, 0.89, 11.7, 0.86, 1.68, 1.76, 5.48, 2.55, 5.95, 0.45, 10.58, 4.57, 2.12, 3.65, 1.25, 3.21, 8.6, 6.57, 3.0, 1.29]} \ No newline at end of file diff --git a/annotations_filtered/eqIkFkmb054_filtered.json b/annotations_filtered/eqIkFkmb054_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4eb7df674874c68dd415d44f0b7bcdefbbbc2ea2 --- /dev/null +++ b/annotations_filtered/eqIkFkmb054_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 22.33], [23.0, 27.82], [31.0, 38.23], [39.0, 43.34], [46.0, 48.81], [50.0, 51.7], [53.0, 54.48], [55.0, 55.95], [59.0, 59.93], [60.0, 79.37], [82.0, 100.52], [102.0, 102.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.8, 99.65, 89.36, 99.71, 99.36, 0.0, 0.0, 0.0, 0.0, 97.54, 98.36, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [11.33, 4.82, 7.23, 4.34, 2.81, 1.7, 1.48, 0.95, 0.93, 19.37, 18.52, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/eqdLKw173WI_filtered.json b/annotations_filtered/eqdLKw173WI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4c93b156f3a49493124a71073a3559db5904cda --- /dev/null +++ b/annotations_filtered/eqdLKw173WI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.51], [13.0, 22.98], [26.0, 29.73], [30.0, 30.45], [35.0, 40.17], [40.0, 40.2], [40.0, 40.29], [40.0, 42.18], [43.0, 43.39], [46.0, 46.84], [48.0, 48.46], [52.0, 52.69], [54.0, 55.83], [57.0, 60.69], [64.0, 63.96], [65.0, 66.87], [68.0, 69.57], [72.0, 72.18], [75.0, 77.43], [83.0, 84.18], [85.0, 85.75], [87.0, 100.14], [101.0, 102.84], [105.0, 106.89], [109.0, 110.32], [114.0, 115.97], [117.0, 118.57], [121.0, 122.12]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.55, 34.22, 0.0, 34.25, 0.0, 0.0, 44.26, 0.0, 0.0, 0.0, 0.0, 0.0, 62.58, 0.0, 0.0, 0.0, 0.0, 57.32, 0.0, 0.0, 32.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 61.67], ["throbbing", 10.88], ["hum", 9.89]], [["music", 78.18], ["throbbing", 5.49], ["hum", 3.87]], null, [["throbbing", 36.98], ["music", 36.04], ["hum", 9.81]], null, null, [["music", 39.3], ["throbbing", 19.78], ["hum", 8.76]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 57.29], ["throbbing", 9.03], ["electronic music", 4.77]], null, null, null, null, null, null], "duration": [1.51, 9.98, 3.73, 0.45, 5.17, 0.2, 0.29, 2.18, 0.39, 0.84, 0.46, 0.69, 1.83, 3.69, -0.04, 1.87, 1.57, 0.18, 2.43, 1.18, 0.75, 13.14, 1.84, 1.89, 1.32, 1.97, 1.57, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/eqk4fOK2VU8_filtered.json b/annotations_filtered/eqk4fOK2VU8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5431fc4bd6296c757a97a6056441fb426aa2aab --- /dev/null +++ b/annotations_filtered/eqk4fOK2VU8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.24], [3.0, 3.23], [4.0, 7.25], [8.0, 10.08], [20.0, 23.53], [24.0, 24.71], [26.0, 25.96], [29.0, 29.57], [33.0, 36.39], [37.0, 37.84], [41.0, 50.9], [52.0, 57.5], [66.0, 68.47], [70.0, 70.36], [82.0, 82.32], [83.0, 86.86], [90.0, 109.63], [110.0, 111.15], [111.0, 112.29], [113.0, 117.91], [118.0, 119.15], [120.0, 127.99], [130.0, 132.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 95.37, 81.89, 99.21, 0.0, 0.0, 0.0, 100.0, 0.0, 81.89, 54.83, 100.0, 0.0, 0.0, 97.83, 75.07, 0.0, 0.0, 75.07, 0.0, 94.37, 41.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 87.64], ["inside, small room", 3.15], ["radio", 0.88]]], "duration": [0.24, 0.23, 3.25, 2.08, 3.53, 0.71, -0.04, 0.57, 3.39, 0.84, 9.9, 5.5, 2.47, 0.36, 0.32, 3.86, 19.63, 1.15, 1.29, 4.91, 1.15, 7.99, 2.68]} \ No newline at end of file diff --git a/annotations_filtered/eqv02JDVQ1o_filtered.json b/annotations_filtered/eqv02JDVQ1o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e6717e61f1a856e96c3798f65c3720df24de14f --- /dev/null +++ b/annotations_filtered/eqv02JDVQ1o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.57], [4.0, 4.78], [10.0, 11.1], [13.0, 13.49], [15.0, 15.72], [18.0, 18.69], [20.0, 20.06], [29.0, 38.38], [44.0, 44.63], [49.0, 50.77], [54.0, 53.72], [56.0, 57.21], [59.0, 59.22], [65.0, 65.33], [76.0, 80.38], [83.0, 83.32], [85.0, 85.95], [88.0, 89.23], [94.0, 97.5], [99.0, 99.32], [101.0, 101.95], [102.0, 102.84], [108.0, 109.04], [110.0, 110.29], [113.0, 116.88], [120.0, 120.85], [126.0, 126.52], [139.0, 141.1], [145.0, 145.76], [149.0, 149.34]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 87.74, 0.0, 0.0, 99.95, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["creak", 20.84], ["music", 7.75], ["noise", 6.05]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.57, 0.78, 1.1, 0.49, 0.72, 0.69, 0.06, 9.38, 0.63, 1.77, -0.28, 1.21, 0.22, 0.33, 4.38, 0.32, 0.95, 1.23, 3.5, 0.32, 0.95, 0.84, 1.04, 0.29, 3.88, 0.85, 0.52, 2.1, 0.76, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/er2a5WhYU-4_filtered.json b/annotations_filtered/er2a5WhYU-4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1d915921a86da37bc06013b66a323e4318bff3f --- /dev/null +++ b/annotations_filtered/er2a5WhYU-4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 36.04], [38.0, 45.67], [49.0, 51.12], [53.0, 75.25], [76.0, 76.35], [76.0, 76.77]], "keep_status": [false, true, true, true, false, false], "silence_prob": [0.0, 30.41, 30.35, 29.49, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 36.64], ["throbbing", 13.07], ["synthesizer", 10.69]], [["music", 12.31], ["noise", 11.87], ["synthesizer", 8.39]], [["music", 33.68], ["hum", 10.85], ["throbbing", 9.38]], null, null], "duration": [1.04, 7.67, 2.12, 22.25, 0.35, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/er6wSXJC57U_filtered.json b/annotations_filtered/er6wSXJC57U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..026bf72722b8b1e8ab6197a165725a6818e39736 --- /dev/null +++ b/annotations_filtered/er6wSXJC57U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.93], [10.0, 23.09], [26.0, 35.53], [40.0, 51.95], [52.0, 52.44], [53.0, 110.25], [111.0, 112.02], [115.0, 116.31], [119.0, 119.11], [121.0, 121.31]], "keep_status": [false, true, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 29.86, 29.61, 29.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["animal", 33.8], ["speech", 23.74], ["livestock, farm animals, working animals", 11.1]], [["music", 42.96], ["speech", 12.18], ["didgeridoo", 3.94]], [["music", 18.74], ["animal", 18.58], ["grunt", 6.89]], null, null, null, null, null, null], "duration": [1.93, 13.09, 9.53, 11.95, 0.44, 57.25, 1.02, 1.31, 0.11, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/erE6UlOi3E0_filtered.json b/annotations_filtered/erE6UlOi3E0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39eb21559151c3d8d36a0d6729d25644bd983e9c --- /dev/null +++ b/annotations_filtered/erE6UlOi3E0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 49.77], [52.0, 55.21], [59.0, 62.09], [63.0, 74.19], [75.0, 75.17], [76.0, 99.37], [100.0, 114.15], [117.0, 124.56]], "keep_status": [true, true, true, true, false, false, false, true], "silence_prob": [31.3, 31.33, 32.86, 31.07, 0.0, 31.21, 31.33, 32.56], "audiomae_on_audioset": [[["music", 36.3], ["vehicle", 7.24], ["hum", 7.13]], [["music", 29.47], ["mosquito", 25.06], ["fly, housefly", 7.75]], [["music", 49.56], ["cacophony", 8.77], ["musical instrument", 4.84]], [["music", 36.99], ["speech", 15.96], ["buzz", 8.37]], null, [["music", 46.71], ["buzz", 26.32], ["vehicle", 4.09]], [["mains hum", 40.99], ["hum", 30.25], ["music", 16.36]], [["music", 40.47], ["foghorn", 20.53], ["trombone", 5.31]]], "duration": [11.77, 3.21, 3.09, 11.19, 0.17, 23.37, 14.15, 7.56]} \ No newline at end of file diff --git a/annotations_filtered/erILyrdpSqs_filtered.json b/annotations_filtered/erILyrdpSqs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcdf869452cfaebfb3aed282041cdc2270805817 --- /dev/null +++ b/annotations_filtered/erILyrdpSqs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.84], [5.0, 5.37], [7.0, 7.21], [28.0, 28.76], [55.0, 55.78], [82.0, 82.58], [91.0, 90.75], [95.0, 96.15], [109.0, 109.39], [111.0, 111.33], [131.0, 132.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.84, 0.37, 0.21, 0.76, 0.78, 0.58, -0.25, 1.15, 0.39, 0.33, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/erX0T5r5xbE_filtered.json b/annotations_filtered/erX0T5r5xbE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..420326a8b7270db5e3605a57a1213965a017e4b3 --- /dev/null +++ b/annotations_filtered/erX0T5r5xbE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.36], [25.0, 26.05], [28.0, 28.61], [32.0, 32.9], [39.0, 39.93], [41.0, 47.24], [50.0, 52.86], [55.0, 56.44], [60.0, 61.26], [65.0, 67.56], [73.0, 73.74], [74.0, 74.51], [75.0, 77.68], [84.0, 84.28], [91.0, 91.07], [93.0, 93.55], [94.0, 95.42], [106.0, 106.74], [108.0, 108.4], [113.0, 113.58], [117.0, 116.94], [118.0, 118.96], [120.0, 121.39], [122.0, 122.62], [123.0, 148.17], [150.0, 150.53], [172.0, 172.29], [173.0, 174.19], [182.0, 181.89], [184.0, 184.03], [185.0, 189.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 43.98, 44.87, 0.0, 0.0, 80.82, 0.0, 0.0, 31.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.82, 0.0, 0.0, 0.0, 0.0, 0.0, 99.8], "audiomae_on_audioset": [null, null, null, null, null, [["music", 60.41], ["theremin", 8.72], ["musical instrument", 3.54]], [["speech", 41.85], ["music", 28.97], ["theremin", 4.05]], null, null, null, null, null, [["music", 54.11], ["speech", 13.18], ["didgeridoo", 2.39]], null, null, null, null, null, null, null, null, null, null, null, [["music", 45.58], ["didgeridoo", 18.34], ["wind instrument, woodwind instrument", 7.27]], null, null, null, null, null, null], "duration": [0.36, 1.05, 0.61, 0.9, 0.93, 6.24, 2.86, 1.44, 1.26, 2.56, 0.74, 0.51, 2.68, 0.28, 0.07, 0.55, 1.42, 0.74, 0.4, 0.58, -0.06, 0.96, 1.39, 0.62, 25.17, 0.53, 0.29, 1.19, -0.11, 0.03, 4.7]} \ No newline at end of file diff --git a/annotations_filtered/ermD7PGA3Do_filtered.json b/annotations_filtered/ermD7PGA3Do_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe2cc183c35d6693968293239969b99d693db97e --- /dev/null +++ b/annotations_filtered/ermD7PGA3Do_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 28.39], [32.0, 51.48], [53.0, 53.96], [57.0, 59.54], [64.0, 64.39], [66.0, 68.13], [69.0, 70.02], [71.0, 73.2], [80.0, 82.76], [84.0, 95.94], [97.0, 100.26], [103.0, 104.73], [111.0, 112.65], [114.0, 115.15], [119.0, 119.38], [120.0, 156.9], [158.0, 158.06], [159.0, 159.63], [162.0, 164.91], [166.0, 172.83]], "keep_status": [true, true, false, true, false, false, false, true, true, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [31.84, 30.2, 0.0, 33.46, 0.0, 31.71, 0.0, 31.86, 32.78, 28.89, 31.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 70.58], "audiomae_on_audioset": [[["music", 14.26], ["hum", 11.14], ["car", 10.5]], [["rumble", 50.81], ["hum", 9.7], ["speech", 8.91]], null, [["hum", 26.98], ["music", 11.52], ["sonar", 8.63]], null, [["hum", 51.98], ["mains hum", 10.76], ["throbbing", 8.26]], null, [["hum", 47.71], ["throbbing", 7.25], ["chirp tone", 6.42]], [["hum", 37.31], ["rumble", 12.6], ["throbbing", 10.94]], [["speech", 42.34], ["hum", 17.54], ["rumble", 6.79]], [["whale vocalization", 26.31], ["hum", 24.91], ["chirp tone", 8.82]], null, null, null, null, null, null, null, null, null], "duration": [11.39, 19.48, 0.96, 2.54, 0.39, 2.13, 1.02, 2.2, 2.76, 11.94, 3.26, 1.73, 1.65, 1.15, 0.38, 36.9, 0.06, 0.63, 2.91, 6.83]} \ No newline at end of file diff --git a/annotations_filtered/ersxqFwDkWA_filtered.json b/annotations_filtered/ersxqFwDkWA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5779a67a80033c904575ad1598734524ce2e1047 --- /dev/null +++ b/annotations_filtered/ersxqFwDkWA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.69], [13.0, 21.46], [25.0, 32.98], [34.0, 34.25], [35.0, 36.34], [37.0, 68.15], [72.0, 120.34], [122.0, 122.13], [124.0, 139.13], [143.0, 148.1]], "keep_status": [false, true, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 33.79, 42.76, 0.0, 0.0, 0.0, 0.0, 0.0, 31.78, 36.45], "audiomae_on_audioset": [null, [["vehicle", 13.62], ["synthesizer", 10.33], ["music", 7.94]], [["music", 76.37], ["timpani", 3.58], ["musical instrument", 3.25]], null, null, null, null, null, [["music", 53.52], ["hum", 9.49], ["theremin", 3.15]], [["music", 44.05], ["synthesizer", 17.87], ["ambient music", 8.91]]], "duration": [1.69, 8.46, 7.98, 0.25, 1.34, 31.15, 48.34, 0.13, 15.13, 5.1]} \ No newline at end of file diff --git a/annotations_filtered/es83ejXi5wg_filtered.json b/annotations_filtered/es83ejXi5wg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ede15f5566c590fabce773d9f750c5ce0abf50ea --- /dev/null +++ b/annotations_filtered/es83ejXi5wg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 9.34], [11.0, 12.01], [12.0, 18.98], [21.0, 21.95], [23.0, 24.17], [25.0, 26.2], [27.0, 39.45], [41.0, 45.96], [48.0, 51.41], [52.0, 66.58], [68.0, 70.24], [73.0, 73.09], [75.0, 75.9], [77.0, 77.8], [79.0, 80.11], [82.0, 92.42], [97.0, 100.75], [103.0, 111.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [90.78, 0.0, 99.05, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 100.0, 90.08, 0.0, 0.0, 0.0, 0.0, 44.87, 99.71, 72.16], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 32.5], ["music", 16.14], ["animal", 6.96]], null, null], "duration": [7.34, 1.01, 6.98, 0.95, 1.17, 1.2, 12.45, 4.96, 3.41, 14.58, 2.24, 0.09, 0.9, 0.8, 1.11, 10.42, 3.75, 8.87]} \ No newline at end of file diff --git a/annotations_filtered/esFVrrZCvwA_filtered.json b/annotations_filtered/esFVrrZCvwA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bba2b4f607837f2ddebe859e1bae44828568e6a3 --- /dev/null +++ b/annotations_filtered/esFVrrZCvwA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 30.5], [36.0, 35.87]], "keep_status": [true, false], "silence_prob": [28.98, 0.0], "audiomae_on_audioset": [[["music", 62.49], ["car", 3.49], ["motorcycle", 3.02]], null], "duration": [11.5, -0.13]} \ No newline at end of file diff --git a/annotations_filtered/esHXIrYgSzo_filtered.json b/annotations_filtered/esHXIrYgSzo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c141caf36e438d41f7c982510e58f8475c762575 --- /dev/null +++ b/annotations_filtered/esHXIrYgSzo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.42], [4.0, 5.34], [7.0, 15.84], [23.0, 23.18], [29.0, 30.5], [32.0, 33.13], [34.0, 34.3], [36.0, 36.49], [38.0, 40.02], [45.0, 45.33], [52.0, 52.95], [69.0, 69.74], [72.0, 71.91], [75.0, 75.39], [80.0, 81.36], [83.0, 83.62], [85.0, 86.91], [94.0, 94.31], [98.0, 98.39], [101.0, 105.51], [132.0, 131.87], [138.0, 138.11], [140.0, 140.48], [143.0, 154.8]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [30.7, 0.0, 31.72, 0.0, 0.0, 0.0, 0.0, 0.0, 35.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.06, 0.0, 0.0, 0.0, 30.37], "audiomae_on_audioset": [[["music", 49.71], ["musical instrument", 3.24], ["crowd", 2.69]], null, [["music", 80.81], ["christmas music", 1.47], ["lullaby", 1.41]], null, null, null, null, null, [["music", 11.78], ["hum", 5.76], ["crowd", 5.36]], null, null, null, null, null, null, null, null, null, null, [["music", 37.37], ["fly, housefly", 10.5], ["buzz", 6.03]], null, null, null, [["music", 85.8], ["quack", 2.76], ["middle eastern music", 1.87]]], "duration": [2.42, 1.34, 8.84, 0.18, 1.5, 1.13, 0.3, 0.49, 2.02, 0.33, 0.95, 0.74, -0.09, 0.39, 1.36, 0.62, 1.91, 0.31, 0.39, 4.51, -0.13, 0.11, 0.48, 11.8]} \ No newline at end of file diff --git a/annotations_filtered/esHt1mAYF-g_filtered.json b/annotations_filtered/esHt1mAYF-g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9ad74608b233a8652f3fa4bb21c7f61bc5f1c96 --- /dev/null +++ b/annotations_filtered/esHt1mAYF-g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 47.16], [53.0, 54.16], [55.0, 57.43], [109.0, 113.39], [120.0, 120.93]], "keep_status": [true, false, true, true, false], "silence_prob": [33.38, 0.0, 31.05, 33.34, 0.0], "audiomae_on_audioset": [[["speech", 51.32], ["whack, thwack", 10.26], ["boing", 6.85]], null, [["thunk", 12.05], ["breaking", 8.78], ["whack, thwack", 8.72]], [["speech", 33.27], ["whack, thwack", 12.56], ["music", 11.66]], null], "duration": [5.16, 1.16, 2.43, 4.39, 0.93]} \ No newline at end of file diff --git a/annotations_filtered/esJNnh-d2E0_filtered.json b/annotations_filtered/esJNnh-d2E0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76fda857b2f86e357e17b2d55bfedc9506244533 --- /dev/null +++ b/annotations_filtered/esJNnh-d2E0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.91], [14.0, 14.07], [17.0, 16.9], [21.0, 22.64], [29.0, 30.96], [32.0, 33.81], [35.0, 37.17], [38.0, 40.76], [42.0, 47.53], [49.0, 54.23], [55.0, 59.12], [60.0, 70.12], [71.0, 88.43], [90.0, 90.69], [93.0, 118.71], [119.0, 120.04], [120.0, 123.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.37, 0.0, 0.0, 0.0, 0.0, 0.0, 98.01, 98.93, 99.95, 93.13, 96.77, 94.95, 84.98, 0.0, 66.15, 0.0, 57.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.91, 0.07, -0.1, 1.64, 1.96, 1.81, 2.17, 2.76, 5.53, 5.23, 4.12, 10.12, 17.43, 0.69, 25.71, 1.04, 3.31]} \ No newline at end of file diff --git a/annotations_filtered/esQgzR6gTjw_filtered.json b/annotations_filtered/esQgzR6gTjw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..98947f4b9280a1bac8892533c37602f07b65cbe4 --- /dev/null +++ b/annotations_filtered/esQgzR6gTjw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [8.0, 8.8], [15.0, 18.5], [20.0, 21.46], [25.0, 25.41], [26.0, 28.32], [33.0, 33.64], [39.0, 39.8], [43.0, 44.85], [46.0, 50.7], [52.0, 53.3], [56.0, 59.75], [62.0, 63.61], [66.0, 67.91], [69.0, 69.7], [71.0, 74.09], [77.0, 79.34], [80.0, 88.05], [91.0, 93.65], [95.0, 96.13], [102.0, 106.39], [108.0, 122.86]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 78.04, 0.0, 0.0, 47.23, 0.0, 0.0, 0.0, 36.69, 0.0, 73.82, 0.0, 0.0, 0.0, 79.76, 71.87, 62.27, 52.98, 0.0, 61.77, 56.93], "audiomae_on_audioset": [null, null, null, null, null, [["fly, housefly", 37.22], ["mosquito", 16.34], ["insect", 16.06]], null, null, null, [["hum", 16.68], ["speech", 16.07], ["sidetone", 14.34]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 0.8, 3.5, 1.46, 0.41, 2.32, 0.64, 0.8, 1.85, 4.7, 1.3, 3.75, 1.61, 1.91, 0.7, 3.09, 2.34, 8.05, 2.65, 1.13, 4.39, 14.86]} \ No newline at end of file diff --git a/annotations_filtered/esXVSyflpDU_filtered.json b/annotations_filtered/esXVSyflpDU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95e5237a4e30cc404568005cf4b135d001f11c68 --- /dev/null +++ b/annotations_filtered/esXVSyflpDU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.34], [8.0, 8.4], [13.0, 14.37], [15.0, 18.47], [22.0, 22.38], [25.0, 25.46], [30.0, 30.79], [39.0, 39.5], [76.0, 76.05], [82.0, 82.53], [90.0, 90.31], [126.0, 126.74]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 43.39], ["trombone", 8.61], ["brass instrument", 8.03]], null, null, null, null, null, null, null, null], "duration": [0.34, 0.4, 1.37, 3.47, 0.38, 0.46, 0.79, 0.5, 0.05, 0.53, 0.31, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/esg4w4b2xvc_filtered.json b/annotations_filtered/esg4w4b2xvc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edf89ec225afe5aa1dba351b3ee82f53d496f763 --- /dev/null +++ b/annotations_filtered/esg4w4b2xvc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.59], [6.0, 12.12], [15.0, 15.45], [18.0, 18.05], [19.0, 19.72], [25.0, 29.39], [31.0, 31.6], [37.0, 37.86], [39.0, 40.53], [43.0, 52.39], [57.0, 56.69], [64.0, 68.81], [69.0, 70.17], [74.0, 80.37], [85.0, 86.68], [91.0, 95.71], [100.0, 100.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 35.84, 0.0, 0.0, 0.0, 86.82, 0.0, 0.0, 0.0, 30.43, 0.0, 44.69, 0.0, 30.38, 0.0, 34.55, 0.0], "audiomae_on_audioset": [null, [["speech", 47.22], ["music", 28.73], ["sidetone", 10.83]], null, null, null, null, null, null, null, [["music", 52.01], ["throbbing", 28.43], ["hum", 8.1]], null, [["hum", 16.12], ["throbbing", 14.32], ["music", 11.77]], null, [["music", 61.65], ["squish", 13.47], ["drip", 5.16]], null, [["music", 47.05], ["throbbing", 34.56], ["hum", 6.02]], null], "duration": [1.59, 6.12, 0.45, 0.05, 0.72, 4.39, 0.6, 0.86, 1.53, 9.39, -0.31, 4.81, 1.17, 6.37, 1.68, 4.71, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/esrBtSFDlEU_filtered.json b/annotations_filtered/esrBtSFDlEU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb5a1eb06bb270dca185e2e4aa8118209a5e5e60 --- /dev/null +++ b/annotations_filtered/esrBtSFDlEU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.2], [21.0, 30.25], [32.0, 33.05], [39.0, 40.44], [42.0, 42.43], [44.0, 44.12], [44.0, 45.06], [47.0, 47.24], [48.0, 49.72], [50.0, 52.32], [54.0, 55.31], [60.0, 62.16], [63.0, 64.57], [67.0, 68.89], [69.0, 69.45], [71.0, 72.98], [78.0, 79.07], [88.0, 88.96], [97.0, 97.16], [98.0, 97.9], [102.0, 108.28], [110.0, 114.69], [118.0, 118.13]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 84.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.39, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.5, 29.32, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 58.01], ["music", 6.12], ["sidetone", 5.18]], null, null, null, null, null, null, null, null, null, null, [["music", 52.49], ["speech", 20.34], ["didgeridoo", 7.72]], [["didgeridoo", 65.31], ["music", 16.32], ["speech", 4.42]], null], "duration": [1.2, 9.25, 1.05, 1.44, 0.43, 0.12, 1.06, 0.24, 1.72, 2.32, 1.31, 2.16, 1.57, 1.89, 0.45, 1.98, 1.07, 0.96, 0.16, -0.1, 6.28, 4.69, 0.13]} \ No newline at end of file diff --git a/annotations_filtered/etixMqUt8Ak_filtered.json b/annotations_filtered/etixMqUt8Ak_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b53914c4eea26aa5e301dc92d1d3a30822740db --- /dev/null +++ b/annotations_filtered/etixMqUt8Ak_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.33], [11.0, 11.42], [15.0, 18.62], [38.0, 47.66], [71.0, 71.47]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 0.0, 60.89, 37.55, 0.0], "audiomae_on_audioset": [null, null, null, [["cattle, bovinae", 24.82], ["snicker", 20.73], ["livestock, farm animals, working animals", 14.4]], null], "duration": [0.33, 0.42, 3.62, 9.66, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/etyH2OUxVuQ_filtered.json b/annotations_filtered/etyH2OUxVuQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1892facf26f562bca80b8b895b6a642d55204ba0 --- /dev/null +++ b/annotations_filtered/etyH2OUxVuQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.13], [9.0, 8.95], [14.0, 15.13], [19.0, 19.53], [22.0, 22.23], [24.0, 23.99], [26.0, 26.97], [37.0, 37.72], [49.0, 49.28], [54.0, 54.41], [56.0, 56.44], [58.0, 59.09], [66.0, 66.41], [74.0, 74.07], [76.0, 76.77], [79.0, 79.54], [84.0, 84.82], [88.0, 88.21], [89.0, 89.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.13, -0.05, 1.13, 0.53, 0.23, -0.01, 0.97, 0.72, 0.28, 0.41, 0.44, 1.09, 0.41, 0.07, 0.77, 0.54, 0.82, 0.21, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/eu-afVml4MM_filtered.json b/annotations_filtered/eu-afVml4MM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0710983210447978d212b63d6df1a5e926fe915 --- /dev/null +++ b/annotations_filtered/eu-afVml4MM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 40.26], [41.0, 43.95], [48.0, 53.86], [55.0, 55.86], [59.0, 59.54], [64.0, 64.52], [67.0, 67.27], [69.0, 69.38], [74.0, 74.01], [75.0, 75.95], [79.0, 82.09], [82.0, 96.38], [97.0, 97.63], [112.0, 112.46], [117.0, 116.58], [118.0, 119.04], [121.0, 122.01], [122.0, 123.52], [124.0, 125.29], [126.0, 126.67], [129.0, 129.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.93, 66.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.06, 35.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 48.37], ["moo", 37.57], ["livestock, farm animals, working animals", 6.73]], [["speech", 43.31], ["explosion", 28.3], ["burst, pop", 5.97]], null, null, null, null, null, null, null, null, null], "duration": [0.26, 2.95, 5.86, 0.86, 0.54, 0.52, 0.27, 0.38, 0.01, 0.95, 3.09, 14.38, 0.63, 0.46, -0.42, 1.04, 1.01, 1.52, 1.29, 0.67, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/euCWQcrBwPY_filtered.json b/annotations_filtered/euCWQcrBwPY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3dd2d70514a95a785f67baee44b5e583ab09d92 --- /dev/null +++ b/annotations_filtered/euCWQcrBwPY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.49], [14.0, 14.23], [15.0, 15.38], [16.0, 16.56], [17.0, 131.3]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.49, 0.23, 0.38, 0.56, 114.3]} \ No newline at end of file diff --git a/annotations_filtered/euJyO4E3FzE_filtered.json b/annotations_filtered/euJyO4E3FzE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86922ba6d099510a8f44aec19fbb24c841af243f --- /dev/null +++ b/annotations_filtered/euJyO4E3FzE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.42], [8.0, 9.39], [11.0, 12.02], [31.0, 34.13], [35.0, 42.77], [47.0, 48.42], [51.0, 50.97], [53.0, 53.2], [58.0, 82.93], [84.0, 85.51], [89.0, 90.86], [91.0, 90.9], [91.0, 93.5], [99.0, 111.45], [114.0, 124.07], [124.0, 130.64], [131.0, 139.24]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, false, true, true, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 33.36, 45.11, 0.0, 0.0, 0.0, 30.85, 0.0, 0.0, 0.0, 31.27, 31.67, 31.66, 31.11, 31.13], "audiomae_on_audioset": [null, null, null, [["music", 46.61], ["didgeridoo", 16.39], ["speech", 12.84]], [["fly, housefly", 22.1], ["speech", 10.09], ["hum", 9.85]], null, null, null, [["music", 18.7], ["hum", 14.18], ["mains hum", 11.04]], null, null, null, [["music", 25.54], ["throbbing", 21.62], ["hum", 9.42]], [["music", 23.32], ["hum", 17.75], ["speech", 6.72]], [["vehicle", 22.12], ["speech", 8.49], ["car", 7.19]], [["cattle, bovinae", 41.98], ["livestock, farm animals, working animals", 29.57], ["moo", 22.31]], [["music", 27.82], ["speech", 11.5], ["whack, thwack", 7.72]]], "duration": [0.42, 1.39, 1.02, 3.13, 7.77, 1.42, -0.03, 0.2, 24.93, 1.51, 1.86, -0.1, 2.5, 12.45, 10.07, 6.64, 8.24]} \ No newline at end of file diff --git a/annotations_filtered/euffalJGKn4_filtered.json b/annotations_filtered/euffalJGKn4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee82d5fce1267f27a52848afff21c93ffa8524dc --- /dev/null +++ b/annotations_filtered/euffalJGKn4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.55], [16.0, 16.82], [18.0, 18.05], [21.0, 22.44], [24.0, 23.95], [35.0, 35.85], [41.0, 40.8], [44.0, 69.92], [86.0, 87.45], [89.0, 95.5], [97.0, 114.62], [115.0, 116.18], [124.0, 125.66], [126.0, 127.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.43, 0.0, 99.87, 76.04, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 73.69], ["hum", 3.46], ["speech", 2.25]], null, null, null, null, null, null], "duration": [1.55, 0.82, 0.05, 1.44, -0.05, 0.85, -0.2, 25.92, 1.45, 6.5, 17.62, 1.18, 1.66, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/eug4wbPSykc_filtered.json b/annotations_filtered/eug4wbPSykc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e671d639f4fc68e89026999c2f70fd9c4ef06f9 --- /dev/null +++ b/annotations_filtered/eug4wbPSykc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[65.0, 68.34], [70.0, 72.86], [73.0, 75.27], [76.0, 85.24], [86.0, 88.77], [90.0, 123.5], [124.0, 123.92]], "keep_status": [false, false, false, false, true, false, false], "silence_prob": [85.72, 54.04, 54.56, 52.92, 40.41, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["hum", 23.16], ["music", 15.73], ["mains hum", 11.63]], null, null], "duration": [3.34, 2.86, 2.27, 9.24, 2.77, 33.5, -0.08]} \ No newline at end of file diff --git a/annotations_filtered/euorMDBYxrk_filtered.json b/annotations_filtered/euorMDBYxrk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..065f1beddd90d45c25ef3d3a3b27cfd932dc2130 --- /dev/null +++ b/annotations_filtered/euorMDBYxrk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.57], [8.0, 9.39], [17.0, 18.42], [20.0, 21.49], [24.0, 24.78], [32.0, 33.22], [41.0, 42.85], [44.0, 46.47], [47.0, 47.88], [86.0, 87.59], [88.0, 89.31], [91.0, 92.16], [101.0, 101.14], [102.0, 102.37], [104.0, 105.38], [111.0, 111.69], [113.0, 114.18], [114.0, 115.75], [116.0, 126.25], [128.0, 127.9], [130.0, 131.72], [139.0, 139.73], [141.0, 141.98], [150.0, 150.33], [152.0, 152.14], [176.0, 177.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [58.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.57, 1.39, 1.42, 1.49, 0.78, 1.22, 1.85, 2.47, 0.88, 1.59, 1.31, 1.16, 0.14, 0.37, 1.38, 0.69, 1.18, 1.75, 10.25, -0.1, 1.72, 0.73, 0.98, 0.33, 0.14, 1.65]} \ No newline at end of file diff --git a/annotations_filtered/euvUARojiiI_filtered.json b/annotations_filtered/euvUARojiiI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d88fa06eb18dcc4154f9658ef3a9b12ed4a4848 --- /dev/null +++ b/annotations_filtered/euvUARojiiI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.71], [14.0, 15.79], [17.0, 18.18], [19.0, 20.6], [21.0, 22.92], [25.0, 25.98], [26.0, 28.81], [29.0, 53.35], [56.0, 57.75], [61.0, 63.91], [64.0, 76.62], [78.0, 80.05], [80.0, 101.49], [105.0, 106.27], [110.0, 122.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.01, 98.8, 0.0, 95.91, 40.62, 55.11, 37.49, 0.0, 30.71], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 36.18], ["speech", 23.28], ["hum", 9.17]], null, [["music", 37.05], ["speech", 21.52], ["didgeridoo", 14.3]], null, [["music", 15.02], ["outside, rural or natural", 12.9], ["speech", 9.97]]], "duration": [1.71, 1.79, 1.18, 1.6, 1.92, 0.98, 2.81, 24.35, 1.75, 2.91, 12.62, 2.05, 21.49, 1.27, 12.49]} \ No newline at end of file diff --git a/annotations_filtered/ev-4cz3hlr0_filtered.json b/annotations_filtered/ev-4cz3hlr0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18219cf8d29420790fc23980bc7ec5fbd0d6a2ec --- /dev/null +++ b/annotations_filtered/ev-4cz3hlr0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.44], [7.0, 8.01], [10.0, 10.93], [12.0, 22.05], [23.0, 25.03], [26.0, 27.85], [30.0, 32.05], [34.0, 35.38], [37.0, 37.72], [41.0, 42.31], [48.0, 48.81], [52.0, 53.1], [54.0, 59.54], [61.0, 63.22], [65.0, 65.4], [67.0, 69.96], [72.0, 85.36], [87.0, 87.32]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [35.05, 0.0, 0.0, 93.13, 99.52, 0.0, 78.21, 0.0, 0.0, 0.0, 0.0, 0.0, 62.17, 43.4, 0.0, 51.18, 45.88, 0.0], "audiomae_on_audioset": [[["hum", 19.79], ["music", 8.76], ["insect", 8.22]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 31.35], ["speech", 17.01], ["hum", 9.19]], null, null, [["hum", 44.46], ["music", 15.7], ["mains hum", 14.05]], null], "duration": [3.44, 1.01, 0.93, 10.05, 2.03, 1.85, 2.05, 1.38, 0.72, 1.31, 0.81, 1.1, 5.54, 2.22, 0.4, 2.96, 13.36, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/ev7an6-CYpc_filtered.json b/annotations_filtered/ev7an6-CYpc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32564a8e410f8d8d364364c0560192e31eec05d3 --- /dev/null +++ b/annotations_filtered/ev7an6-CYpc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 15.63], [16.0, 26.54], [29.0, 30.37], [33.0, 36.48], [36.0, 37.03], [38.0, 38.52], [40.0, 40.96], [43.0, 47.28], [48.0, 48.78], [50.0, 62.61], [66.0, 75.29], [78.0, 79.19], [79.0, 80.55], [81.0, 83.07], [85.0, 85.38], [87.0, 86.68], [91.0, 92.25], [96.0, 98.24], [101.0, 103.5], [106.0, 108.33], [109.0, 110.1], [114.0, 114.34], [118.0, 127.53], [130.0, 130.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [87.19, 64.86, 0.0, 56.03, 0.0, 0.0, 0.0, 59.68, 0.0, 37.66, 82.79, 0.0, 0.0, 91.13, 0.0, 0.0, 0.0, 77.03, 87.0, 94.66, 0.0, 0.0, 35.59, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 48.3], ["speech", 28.38], ["flute", 3.88]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.71], ["synthesizer", 7.03], ["throbbing", 5.69]], null], "duration": [4.63, 10.54, 1.37, 3.48, 1.03, 0.52, 0.96, 4.28, 0.78, 12.61, 9.29, 1.19, 1.55, 2.07, 0.38, -0.32, 1.25, 2.24, 2.5, 2.33, 1.1, 0.34, 9.53, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/evJPzjgv-2s_filtered.json b/annotations_filtered/evJPzjgv-2s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea0c341e0073cf4a677f90cbc6cf074f61ed1ee7 --- /dev/null +++ b/annotations_filtered/evJPzjgv-2s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[75.0, 75.71], [76.0, 83.08], [85.0, 87.88], [89.0, 91.77], [95.0, 98.63], [102.0, 110.93], [117.0, 120.78], [123.0, 123.35], [124.0, 124.51]], "keep_status": [false, true, true, false, true, false, true, false, false], "silence_prob": [0.0, 31.37, 30.42, 30.72, 30.44, 30.4, 31.24, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 26.3], ["motorcycle", 17.75], ["vehicle", 6.36]], [["music", 51.21], ["cacophony", 10.96], ["boing", 4.47]], [["music", 66.43], ["electronic music", 3.75], ["didgeridoo", 3.32]], [["music", 52.42], ["throbbing", 5.59], ["hum", 4.39]], [["music", 65.69], ["throbbing", 3.51], ["foghorn", 1.75]], [["music", 38.6], ["speech", 14.08], ["throbbing", 8.93]], null, null], "duration": [0.71, 7.08, 2.88, 2.77, 3.63, 8.93, 3.78, 0.35, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/evM3k7ep4wo_filtered.json b/annotations_filtered/evM3k7ep4wo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6590105c7ad45caff2998a6ebf8d57c54e856088 --- /dev/null +++ b/annotations_filtered/evM3k7ep4wo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 82.56], [85.0, 128.16], [132.0, 145.34]], "keep_status": [false, false, true], "silence_prob": [0.0, 0.0, 28.82], "audiomae_on_audioset": [null, null, [["speech", 27.61], ["music", 22.1], ["buzz", 9.26]]], "duration": [77.56, 43.16, 13.34]} \ No newline at end of file diff --git a/annotations_filtered/evQcKvkQCl0_filtered.json b/annotations_filtered/evQcKvkQCl0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9d370b9acf92f398ae9d97305f097e1f42f1a9d --- /dev/null +++ b/annotations_filtered/evQcKvkQCl0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.17], [3.0, 3.59], [5.0, 5.46], [8.0, 8.92], [16.0, 15.75], [43.0, 44.1], [51.0, 50.9], [53.0, 53.06], [53.0, 53.35], [55.0, 55.0], [63.0, 63.39], [82.0, 82.11], [82.0, 90.15], [91.0, 91.91], [99.0, 100.92], [102.0, 102.57], [104.0, 106.73], [110.0, 110.59], [118.0, 137.57], [140.0, 149.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.19, 0.0, 0.0, 0.0, 97.0, 0.0, 34.52, 29.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 57.68], ["thump, thud", 7.35], ["reverberation", 4.77]], null, null, null, null, null, [["speech", 31.69], ["music", 15.61], ["whack, thwack", 5.22]], [["music", 78.63], ["didgeridoo", 3.11], ["electronic music", 2.88]]], "duration": [1.17, 0.59, 0.46, 0.92, -0.25, 1.1, -0.1, 0.06, 0.35, 0.0, 0.39, 0.11, 8.15, 0.91, 1.92, 0.57, 2.73, 0.59, 19.57, 9.89]} \ No newline at end of file diff --git a/annotations_filtered/evWlSySuiII_filtered.json b/annotations_filtered/evWlSySuiII_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aba13f90e01084406062e60df276cd4bc606c824 --- /dev/null +++ b/annotations_filtered/evWlSySuiII_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 7.43], [9.0, 9.96], [24.0, 24.71], [25.0, 27.14], [30.0, 31.31], [33.0, 33.08], [35.0, 38.64], [42.0, 57.92], [58.0, 57.99], [59.0, 59.73], [61.0, 62.18], [63.0, 63.95], [65.0, 65.67], [67.0, 68.0], [75.0, 75.34], [78.0, 78.56], [81.0, 82.04]], "keep_status": [false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [50.61, 0.0, 0.0, 37.89, 0.0, 0.0, 38.19, 33.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["sheep", 19.31], ["bleat", 16.9], ["whale vocalization", 15.81]], null, null, [["speech", 49.21], ["vehicle", 7.19], ["rumble", 6.81]], [["music", 42.83], ["speech", 9.14], ["didgeridoo", 4.17]], null, null, null, null, null, null, null, null, null], "duration": [6.43, 0.96, 0.71, 2.14, 1.31, 0.08, 3.64, 15.92, -0.01, 0.73, 1.18, 0.95, 0.67, 1.0, 0.34, 0.56, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/eveUzWmTxl4_filtered.json b/annotations_filtered/eveUzWmTxl4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f89b908fb6c91eb2dd7aea1a0959e2312bfc90c --- /dev/null +++ b/annotations_filtered/eveUzWmTxl4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.18], [6.0, 9.15], [11.0, 13.15], [15.0, 24.02], [28.0, 29.02], [30.0, 30.4], [43.0, 50.28], [52.0, 73.9], [75.0, 78.12], [78.0, 78.54], [80.0, 81.11], [93.0, 93.5], [102.0, 102.76], [116.0, 117.14], [118.0, 118.17], [125.0, 125.63], [129.0, 130.08]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 99.85, 38.45, 0.0, 0.0, 31.94, 90.08, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 60.37], ["sidetone", 4.09], ["sine wave", 3.15]], null, null, [["clang", 13.94], ["hammer", 12.37], ["whack, thwack", 8.49]], null, null, null, null, null, null, null, null, null, null], "duration": [1.18, 3.15, 2.15, 9.02, 1.02, 0.4, 7.28, 21.9, 3.12, 0.54, 1.11, 0.5, 0.76, 1.14, 0.17, 0.63, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/evo1frlMjHQ_filtered.json b/annotations_filtered/evo1frlMjHQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55fc6a73d116fb68cb459c9c497d3dc14e4dbc03 --- /dev/null +++ b/annotations_filtered/evo1frlMjHQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.64], [3.0, 3.5], [5.0, 5.41], [6.0, 31.19], [33.0, 43.93], [45.0, 50.63], [52.0, 79.64], [80.0, 82.59], [83.0, 83.94], [85.0, 86.1], [87.0, 87.93], [88.0, 88.75], [89.0, 91.4], [94.0, 96.42], [98.0, 98.95], [99.0, 100.48], [101.0, 108.67]], "keep_status": [false, false, false, true, true, false, false, true, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.65, 38.09, 42.88, 31.19, 46.68, 0.0, 0.0, 0.0, 0.0, 56.93, 30.98, 0.0, 0.0, 36.41], "audiomae_on_audioset": [null, null, null, [["music", 25.97], ["synthesizer", 20.45], ["hum", 9.41]], [["synthesizer", 19.57], ["mains hum", 19.57], ["music", 17.83]], [["music", 57.27], ["ambient music", 9.44], ["theremin", 6.52]], [["music", 49.98], ["gong", 20.62], ["ambient music", 10.81]], [["didgeridoo", 21.79], ["sidetone", 21.06], ["busy signal", 17.0]], null, null, null, null, null, [["music", 38.11], ["thunk", 17.0], ["theremin", 5.56]], null, null, [["speech", 48.53], ["music", 29.02], ["musical instrument", 6.04]]], "duration": [0.64, 0.5, 0.41, 25.19, 10.93, 5.63, 27.64, 2.59, 0.94, 1.1, 0.93, 0.75, 2.4, 2.42, 0.95, 1.48, 7.67]} \ No newline at end of file diff --git a/annotations_filtered/ewEreSjPyC4_filtered.json b/annotations_filtered/ewEreSjPyC4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5617b56fabc8a321d147fa26f6914c71bec29449 --- /dev/null +++ b/annotations_filtered/ewEreSjPyC4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.74], [21.0, 22.0], [23.0, 23.97], [25.0, 26.38], [27.0, 36.27], [39.0, 39.06], [40.0, 41.89], [43.0, 47.7], [48.0, 49.45], [51.0, 74.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.74, 1.0, 0.97, 1.38, 9.27, 0.06, 1.89, 4.7, 1.45, 23.06]} \ No newline at end of file diff --git a/annotations_filtered/ewVwSrVSKS4_filtered.json b/annotations_filtered/ewVwSrVSKS4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9543a52791495f3dadc0f42023377147d14931bf --- /dev/null +++ b/annotations_filtered/ewVwSrVSKS4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.91], [5.0, 8.41], [11.0, 11.3], [14.0, 15.16], [15.0, 15.57], [18.0, 18.25], [22.0, 22.2], [29.0, 30.54], [31.0, 31.77], [33.0, 36.58], [37.0, 37.54], [40.0, 41.35], [44.0, 45.0], [46.0, 48.07], [50.0, 50.75], [52.0, 55.29], [56.0, 58.5], [61.0, 62.19], [64.0, 65.91], [67.0, 69.06], [70.0, 72.35], [79.0, 80.57], [82.0, 82.7], [84.0, 85.46], [86.0, 87.54], [99.0, 99.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.91, 3.41, 0.3, 1.16, 0.57, 0.25, 0.2, 1.54, 0.77, 3.58, 0.54, 1.35, 1.0, 2.07, 0.75, 3.29, 2.5, 1.19, 1.91, 2.06, 2.35, 1.57, 0.7, 1.46, 1.54, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/ewbUaMvCaYg_filtered.json b/annotations_filtered/ewbUaMvCaYg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd7d10210c485a037c05c67b6200f46a37b6ae0e --- /dev/null +++ b/annotations_filtered/ewbUaMvCaYg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 72.67]], "keep_status": [false], "silence_prob": [35.39], "audiomae_on_audioset": [[["speech", 61.85], ["breaking", 8.67], ["groan", 7.34]]], "duration": [25.67]} \ No newline at end of file diff --git a/annotations_filtered/ewiNzru8Kek_filtered.json b/annotations_filtered/ewiNzru8Kek_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..027878543ab42a34e42227b63bea12b595de78f5 --- /dev/null +++ b/annotations_filtered/ewiNzru8Kek_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.98], [7.0, 9.8], [10.0, 10.2], [11.0, 11.85], [14.0, 15.15], [16.0, 16.6], [20.0, 19.94], [20.0, 32.95], [33.0, 33.3], [34.0, 39.18], [41.0, 42.2], [45.0, 62.29], [69.0, 73.41], [77.0, 79.96], [84.0, 89.33], [94.0, 97.61], [98.0, 98.59], [101.0, 103.6], [104.0, 106.56], [108.0, 126.03], [127.0, 127.99], [130.0, 131.85], [134.0, 134.87], [135.0, 137.79], [139.0, 140.9]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, true, true, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 83.34, 0.0, 0.0, 0.0, 0.0, 0.0, 30.26, 0.0, 32.34, 0.0, 31.59, 29.99, 36.35, 29.19, 49.27, 0.0, 29.72, 31.56, 31.38, 0.0, 0.0, 0.0, 72.9, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 63.56], ["whale vocalization", 20.39], ["music", 2.44]], null, [["speech", 47.82], ["boing", 12.44], ["hum", 5.79]], null, [["music", 50.5], ["speech", 14.63], ["didgeridoo", 9.11]], [["mains hum", 40.12], ["hum", 17.59], ["electric shaver, electric razor", 10.13]], [["whale vocalization", 61.01], ["roar", 4.72], ["sound effect", 3.31]], [["hum", 26.72], ["music", 10.61], ["mains hum", 8.02]], [["speech", 50.74], ["cough", 20.71], ["music", 3.64]], null, [["music", 30.12], ["speech", 19.01], ["cattle, bovinae", 11.5]], [["cattle, bovinae", 29.78], ["moo", 18.46], ["livestock, farm animals, working animals", 16.83]], [["speech", 48.08], ["music", 19.28], ["didgeridoo", 8.5]], null, null, null, null, null], "duration": [-0.02, 2.8, 0.2, 0.85, 1.15, 0.6, -0.06, 12.95, 0.3, 5.18, 1.2, 17.29, 4.41, 2.96, 5.33, 3.61, 0.59, 2.6, 2.56, 18.03, 0.99, 1.85, 0.87, 2.79, 1.9]} \ No newline at end of file diff --git a/annotations_filtered/ewkroL1cP_Q_filtered.json b/annotations_filtered/ewkroL1cP_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cdf6dfe13d68374b6abef54d629f9d26370de0d8 --- /dev/null +++ b/annotations_filtered/ewkroL1cP_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.53], [11.0, 11.87], [15.0, 15.55], [17.0, 20.17], [22.0, 22.33], [26.0, 27.9], [29.0, 29.76], [32.0, 32.59], [43.0, 43.43], [47.0, 48.05], [56.0, 60.56], [61.0, 66.65], [69.0, 70.38], [73.0, 83.52], [84.0, 84.43], [86.0, 100.41], [106.0, 106.69], [113.0, 114.79], [117.0, 117.14], [118.0, 118.45], [123.0, 125.66], [127.0, 130.54], [132.0, 133.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.77, 70.58, 0.0, 87.19, 0.0, 45.82, 0.0, 0.0, 0.0, 0.0, 96.54, 42.02, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 80.76], ["busy signal", 5.84], ["dial tone", 2.46]], null, null, null, null, null, null, null, null, null, null, null, [["radio", 37.46], ["music", 8.83], ["telephone", 5.8]], null, null, null, null, null, [["fart", 56.33], ["hum", 11.07], ["heart sounds, heartbeat", 4.05]], null], "duration": [0.53, 0.87, 0.55, 3.17, 0.33, 1.9, 0.76, 0.59, 0.43, 1.05, 4.56, 5.65, 1.38, 10.52, 0.43, 14.41, 0.69, 1.79, 0.14, 0.45, 2.66, 3.54, 1.15]} \ No newline at end of file diff --git a/annotations_filtered/ewvHk1nM5u0_filtered.json b/annotations_filtered/ewvHk1nM5u0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4748475694fcba6cda25610cc0c05cab155f2a05 --- /dev/null +++ b/annotations_filtered/ewvHk1nM5u0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.39], [9.0, 9.88], [13.0, 13.53], [31.0, 31.82], [39.0, 38.97], [40.0, 40.76], [41.0, 42.43], [46.0, 46.9], [48.0, 49.94], [53.0, 53.72], [55.0, 56.12], [65.0, 66.02], [66.0, 67.41], [73.0, 74.68], [80.0, 80.25], [81.0, 81.09], [83.0, 83.47], [84.0, 83.98], [87.0, 86.71], [87.0, 87.74], [89.0, 90.26], [95.0, 94.81], [95.0, 94.85], [99.0, 99.54], [107.0, 119.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.18], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 77.81], ["musical instrument", 4.8], ["guitar", 4.64]]], "duration": [0.39, 0.88, 0.53, 0.82, -0.03, 0.76, 1.43, 0.9, 1.94, 0.72, 1.12, 1.02, 1.41, 1.68, 0.25, 0.09, 0.47, -0.02, -0.29, 0.74, 1.26, -0.19, -0.15, 0.54, 12.52]} \ No newline at end of file diff --git a/annotations_filtered/ewwKExvkqXQ_filtered.json b/annotations_filtered/ewwKExvkqXQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2cb436c81483f68b567f3ae5ac4dd54f24f4d3b6 --- /dev/null +++ b/annotations_filtered/ewwKExvkqXQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 12.65], [13.0, 15.4], [16.0, 16.29], [29.0, 41.74], [49.0, 48.96], [51.0, 50.85], [56.0, 56.84], [57.0, 57.87], [65.0, 66.18], [68.0, 69.04], [70.0, 71.31], [72.0, 72.64], [73.0, 78.71], [79.0, 80.33], [84.0, 90.54], [91.0, 91.79], [95.0, 97.34], [99.0, 99.2], [101.0, 102.56], [103.0, 104.45], [106.0, 107.27], [109.0, 110.13], [111.0, 111.84], [113.0, 126.5], [127.0, 126.54], [127.0, 126.57], [127.0, 126.6], [127.0, 126.64], [127.0, 126.67], [127.0, 126.71], [127.0, 126.74], [130.0, 130.64], [133.0, 134.96], [136.0, 137.37], [139.0, 139.75], [141.0, 141.57], [144.0, 145.77], [146.0, 147.72], [148.0, 147.75], [148.0, 147.78], [148.0, 147.82], [148.0, 147.85], [152.0, 152.58], [158.0, 158.73], [159.0, 160.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.25, 0.0, 39.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.04, 0.0, 37.42, 0.0, 35.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 90.5], ["horse", 2.22], ["clip-clop", 1.25]], null, [["speech", 55.22], ["music", 10.43], ["radio", 5.78]], null, null, null, null, null, null, null, null, null, null, [["speech", 25.66], ["music", 12.52], ["radio", 9.74]], null, [["speech", 80.44], ["boing", 2.97], ["sidetone", 2.85]], null, null, null, null, null, null, [["speech", 37.8], ["radio", 28.11], ["fart", 2.71]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.35, 2.4, 0.29, 12.74, -0.04, -0.15, 0.84, 0.87, 1.18, 1.04, 1.31, 0.64, 5.71, 1.33, 6.54, 0.79, 2.34, 0.2, 1.56, 1.45, 1.27, 1.13, 0.84, 13.5, -0.46, -0.43, -0.4, -0.36, -0.33, -0.29, -0.26, 0.64, 1.96, 1.37, 0.75, 0.57, 1.77, 1.72, -0.25, -0.22, -0.18, -0.15, 0.58, 0.73, 1.35]} \ No newline at end of file diff --git a/annotations_filtered/ex65__9m7f0_filtered.json b/annotations_filtered/ex65__9m7f0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f59abee04a0f251376e2c772d456698a42127d78 --- /dev/null +++ b/annotations_filtered/ex65__9m7f0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.75], [7.0, 11.5], [12.0, 15.48], [18.0, 20.44], [22.0, 25.19], [27.0, 45.39], [47.0, 50.26], [51.0, 53.38], [61.0, 60.83], [61.0, 62.41], [66.0, 66.7], [67.0, 70.41], [71.0, 72.74], [74.0, 74.83], [76.0, 77.52], [81.0, 84.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.93, 89.72, 82.79, 99.92, 98.66, 99.98, 99.88, 0.0, 0.0, 0.0, 83.52, 0.0, 0.0, 0.0, 99.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.75, 4.5, 3.48, 2.44, 3.19, 18.39, 3.26, 2.38, -0.17, 1.41, 0.7, 3.41, 1.74, 0.83, 1.52, 3.97]} \ No newline at end of file diff --git a/annotations_filtered/ex6X6rXcXKQ_filtered.json b/annotations_filtered/ex6X6rXcXKQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca66496d5d454c2d5e3ca9eff0fcc4069ef69e2b --- /dev/null +++ b/annotations_filtered/ex6X6rXcXKQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.72], [9.0, 23.62], [24.0, 24.26], [26.0, 44.05], [46.0, 51.16], [52.0, 74.24], [79.0, 79.54], [81.0, 82.32]], "keep_status": [false, true, false, true, true, true, false, false], "silence_prob": [0.0, 30.61, 0.0, 30.86, 31.1, 30.85, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 36.94], ["vehicle", 8.74], ["siren", 8.15]], null, [["speech", 21.99], ["vehicle", 19.08], ["siren", 17.58]], [["music", 54.69], ["hum", 4.29], ["mains hum", 4.23]], [["music", 43.37], ["vehicle", 10.19], ["skidding", 7.49]], null, null], "duration": [0.72, 14.62, 0.26, 18.05, 5.16, 22.24, 0.54, 1.32]} \ No newline at end of file diff --git a/annotations_filtered/exCuIisMWl0_filtered.json b/annotations_filtered/exCuIisMWl0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fcca5eebf945aab5c7d407327d029624ac6c78e4 --- /dev/null +++ b/annotations_filtered/exCuIisMWl0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.91], [7.0, 8.8], [11.0, 17.02], [19.0, 20.06], [20.0, 20.8], [21.0, 22.71], [24.0, 29.44], [31.0, 32.53], [34.0, 34.92], [35.0, 40.53], [43.0, 48.52], [50.0, 50.75], [51.0, 52.44], [55.0, 56.66], [58.0, 59.53], [61.0, 65.74], [66.0, 68.81], [71.0, 70.98], [71.0, 71.74], [73.0, 74.43], [76.0, 78.27], [78.0, 81.89], [83.0, 83.4], [85.0, 86.05], [86.0, 86.76], [87.0, 87.67], [88.0, 91.0], [92.0, 92.79], [94.0, 93.72], [95.0, 103.52], [104.0, 118.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.98, 0.0, 100.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 100.0, 99.95, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 100.0, 99.21, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.91, 1.8, 6.02, 1.06, 0.8, 1.71, 5.44, 1.53, 0.92, 5.53, 5.52, 0.75, 1.44, 1.66, 1.53, 4.74, 2.81, -0.02, 0.74, 1.43, 2.27, 3.89, 0.4, 1.05, 0.76, 0.67, 3.0, 0.79, -0.28, 8.52, 14.5]} \ No newline at end of file diff --git a/annotations_filtered/exE414Mp-gA_filtered.json b/annotations_filtered/exE414Mp-gA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..024a0c781c63f6617c777bdd77b87290c7a00e17 --- /dev/null +++ b/annotations_filtered/exE414Mp-gA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.23], [11.0, 18.45], [23.0, 76.99], [79.0, 81.73], [82.0, 81.77], [82.0, 81.8], [82.0, 96.94]], "keep_status": [false, false, false, true, false, false, true], "silence_prob": [0.0, 30.7, 0.0, 31.11, 0.0, 0.0, 29.76], "audiomae_on_audioset": [null, [["music", 61.49], ["theremin", 14.0], ["throbbing", 4.75]], null, [["speech", 21.95], ["mains hum", 17.49], ["music", 10.07]], null, null, [["music", 42.38], ["speech", 14.26], ["synthesizer", 7.23]]], "duration": [1.23, 7.45, 53.99, 2.73, -0.23, -0.2, 14.94]} \ No newline at end of file diff --git a/annotations_filtered/exFv7Srgwpk_filtered.json b/annotations_filtered/exFv7Srgwpk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75bb211d956f0be33cec4e0c0e151cdfe8c51da3 --- /dev/null +++ b/annotations_filtered/exFv7Srgwpk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.5], [11.0, 11.75], [16.0, 15.75], [18.0, 19.4], [25.0, 26.22], [28.0, 28.98], [30.0, 32.93], [46.0, 55.76], [56.0, 60.4], [67.0, 76.94], [81.0, 82.63], [83.0, 84.2], [86.0, 89.46], [94.0, 124.44]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.5, 37.52, 93.76, 54.3, 0.0, 0.0, 96.04, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 26.13], ["mains hum", 24.48], ["throbbing", 9.54]], [["music", 27.18], ["wind instrument, woodwind instrument", 17.36], ["speech", 11.41]], null, null, null, null, null, null], "duration": [1.5, 0.75, -0.25, 1.4, 1.22, 0.98, 2.93, 9.76, 4.4, 9.94, 1.63, 1.2, 3.46, 30.44]} \ No newline at end of file diff --git a/annotations_filtered/exIGslwFcMI_filtered.json b/annotations_filtered/exIGslwFcMI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1dc686df5bbf4fa36a59672a79123f716cd87d9f --- /dev/null +++ b/annotations_filtered/exIGslwFcMI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.99], [2.0, 3.32], [20.0, 21.0], [38.0, 42.06], [46.0, 46.41], [49.0, 50.82], [52.0, 53.6], [56.0, 63.9], [66.0, 66.92], [68.0, 78.14], [79.0, 79.17], [81.0, 82.56], [84.0, 84.57], [90.0, 90.27]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 45.72, 0.0, 0.0, 0.0, 67.51, 0.0, 74.6, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["synthesizer", 20.17], ["didgeridoo", 14.74], ["music", 10.72]], null, null, null, null, null, null, null, null, null, null], "duration": [-0.01, 1.32, 1.0, 4.06, 0.41, 1.82, 1.6, 7.9, 0.92, 10.14, 0.17, 1.56, 0.57, 0.27]} \ No newline at end of file diff --git a/annotations_filtered/exObFY-sHQw_filtered.json b/annotations_filtered/exObFY-sHQw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f83cf40a2e9a5a63acfd52a2ce3204c79b1d69c --- /dev/null +++ b/annotations_filtered/exObFY-sHQw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [3.0, 4.75], [12.0, 12.61], [15.0, 16.26], [18.0, 19.6], [23.0, 24.0], [26.0, 28.7], [36.0, 37.88], [41.0, 42.4], [47.0, 47.16], [49.0, 51.02], [53.0, 53.84], [60.0, 60.86], [64.0, 64.3], [66.0, 66.66], [69.0, 70.5], [73.0, 72.81], [73.0, 75.79]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.49, 0.0, 0.0, 0.0, 67.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.32], "audiomae_on_audioset": [null, null, null, null, null, null, [["cattle, bovinae", 21.36], ["moo", 11.76], ["whale vocalization", 11.75]], null, null, null, null, null, null, null, null, null, null, [["speech", 30.6], ["fly, housefly", 26.7], ["fart", 17.28]]], "duration": [0.5, 1.75, 0.61, 1.26, 1.6, 1.0, 2.7, 1.88, 1.4, 0.16, 2.02, 0.84, 0.86, 0.3, 0.66, 1.5, -0.19, 2.79]} \ No newline at end of file diff --git a/annotations_filtered/ex_KPw6bVwQ_filtered.json b/annotations_filtered/ex_KPw6bVwQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c53883d87ccac34ff96c70c7d562696e740862ba --- /dev/null +++ b/annotations_filtered/ex_KPw6bVwQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.0], [10.0, 26.47], [33.0, 33.02], [39.0, 41.12], [42.0, 42.6], [44.0, 44.02], [46.0, 46.87], [48.0, 49.38], [50.0, 50.36], [52.0, 52.83], [56.0, 60.22], [61.0, 61.7], [62.0, 62.82], [64.0, 64.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 61.37, 0.0, 52.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.89, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.0, 16.47, 0.02, 2.12, 0.6, 0.02, 0.87, 1.38, 0.36, 0.83, 4.22, 0.7, 0.82, 0.37]} \ No newline at end of file diff --git a/annotations_filtered/excK59qpaOA_filtered.json b/annotations_filtered/excK59qpaOA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61a679aef3dbc4722866f155adfc39aa8dc35c78 --- /dev/null +++ b/annotations_filtered/excK59qpaOA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 39.06], [39.0, 39.21], [40.0, 42.6], [44.0, 44.42], [46.0, 47.85], [49.0, 49.33], [51.0, 52.96], [56.0, 58.04], [64.0, 65.04], [67.0, 67.44], [70.0, 70.8], [73.0, 73.58], [75.0, 76.45], [78.0, 79.51], [84.0, 85.38], [89.0, 90.61], [94.0, 94.71], [96.0, 102.34], [106.0, 106.78], [107.0, 107.72], [109.0, 109.31], [110.0, 117.81], [121.0, 122.22], [123.0, 125.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [75.39, 0.0, 99.44, 0.0, 0.0, 0.0, 0.0, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.73, 0.0, 0.0, 0.0, 36.72, 0.0, 35.26], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 15.47], ["speech", 14.69], ["music", 7.31]], null, [["music", 22.09], ["speech", 11.84], ["throbbing", 9.75]]], "duration": [9.06, 0.21, 2.6, 0.42, 1.85, 0.33, 1.96, 2.04, 1.04, 0.44, 0.8, 0.58, 1.45, 1.51, 1.38, 1.61, 0.71, 6.34, 0.78, 0.72, 0.31, 7.81, 1.22, 2.56]} \ No newline at end of file diff --git a/annotations_filtered/exclwIbllXQ_filtered.json b/annotations_filtered/exclwIbllXQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57b4d8a3eae20446b8f09bb04d7c3ecba4244292 --- /dev/null +++ b/annotations_filtered/exclwIbllXQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.31], [3.0, 4.16], [9.0, 9.24], [13.0, 13.71], [15.0, 15.52], [16.0, 17.07], [18.0, 18.57], [21.0, 21.12], [25.0, 24.81], [28.0, 28.49], [29.0, 30.28], [31.0, 32.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.31, 1.16, 0.24, 0.71, 0.52, 1.07, 0.57, 0.12, -0.19, 0.49, 1.28, 1.29]} \ No newline at end of file diff --git a/annotations_filtered/exu61pb5X68_filtered.json b/annotations_filtered/exu61pb5X68_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8b9a86c5d14e22ae6742c559888d5dfce3f15cc --- /dev/null +++ b/annotations_filtered/exu61pb5X68_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.41], [13.0, 13.51], [15.0, 16.92], [29.0, 29.86], [31.0, 33.18], [43.0, 43.9], [50.0, 51.27], [58.0, 58.65], [71.0, 72.57], [75.0, 75.02], [78.0, 82.75], [84.0, 85.4]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.68, 0.0, 0.0, 0.0, 0.0, 0.0, 41.12, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 36.63], ["music", 20.23], ["synthesizer", 5.09]], null, null, null, null, null, [["music", 73.85], ["grunt", 3.83], ["synthesizer", 2.56]], null], "duration": [0.41, 0.51, 1.92, 0.86, 2.18, 0.9, 1.27, 0.65, 1.57, 0.02, 4.75, 1.4]} \ No newline at end of file diff --git a/annotations_filtered/eyCCuHC08bY_filtered.json b/annotations_filtered/eyCCuHC08bY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e5ad4d8ae788cba73887fc164cca1f4dce181738 --- /dev/null +++ b/annotations_filtered/eyCCuHC08bY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [2.0, 3.84], [7.0, 7.6], [16.0, 16.23], [26.0, 26.94], [28.0, 30.59], [38.0, 41.39], [44.0, 44.58], [52.0, 53.76], [56.0, 58.75], [74.0, 75.93], [99.0, 101.75], [103.0, 104.79], [106.0, 106.46], [126.0, 126.52], [127.0, 128.46], [130.0, 130.77], [155.0, 156.98], [158.0, 158.26], [167.0, 168.67]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 36.92, 31.53, 0.0, 0.0, 31.05, 0.0, 37.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 20.86], ["explosion", 12.69], ["burst, pop", 8.53]], [["speech", 71.4], ["explosion", 9.77], ["eruption", 6.64]], null, null, [["speech", 37.08], ["music", 17.71], ["smash, crash", 8.94]], null, [["music", 49.35], ["synthesizer", 7.59], ["effects unit", 5.48]], null, null, null, null, null, null, null, null], "duration": [0.5, 1.84, 0.6, 0.23, 0.94, 2.59, 3.39, 0.58, 1.76, 2.75, 1.93, 2.75, 1.79, 0.46, 0.52, 1.46, 0.77, 1.98, 0.26, 1.67]} \ No newline at end of file diff --git a/annotations_filtered/ezOyoEG6GW8_filtered.json b/annotations_filtered/ezOyoEG6GW8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..531a2f3737a91f27e68c2364d92b8b352d2c6f7e --- /dev/null +++ b/annotations_filtered/ezOyoEG6GW8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.95], [3.0, 4.09], [5.0, 5.44], [5.0, 5.98], [8.0, 9.05], [11.0, 11.52], [13.0, 14.08], [23.0, 23.68], [27.0, 28.11], [34.0, 35.55], [38.0, 39.24], [44.0, 45.1], [51.0, 52.12], [57.0, 58.43], [66.0, 66.63], [69.0, 69.21], [70.0, 70.44], [72.0, 72.81], [74.0, 76.23], [95.0, 96.08], [97.0, 97.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.88, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.05, 1.09, 0.44, 0.98, 1.05, 0.52, 1.08, 0.68, 1.11, 1.55, 1.24, 1.1, 1.12, 1.43, 0.63, 0.21, 0.44, 0.81, 2.23, 1.08, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/ezRPVES1oQs_filtered.json b/annotations_filtered/ezRPVES1oQs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e03e4cf14a4028f1922b96031812d8e7dfab105a --- /dev/null +++ b/annotations_filtered/ezRPVES1oQs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 24.54], [32.0, 34.67], [39.0, 41.13], [44.0, 43.7], [46.0, 48.17], [50.0, 50.5], [54.0, 57.72], [61.0, 61.87]], "keep_status": [true, true, false, false, true, false, false, false], "silence_prob": [32.11, 44.23, 47.35, 0.0, 28.78, 0.0, 54.83, 0.0], "audiomae_on_audioset": [[["music", 47.9], ["musical instrument", 10.26], ["timpani", 8.59]], [["music", 55.35], ["musical instrument", 4.85], ["didgeridoo", 4.1]], [["music", 73.66], ["synthesizer", 6.29], ["musical instrument", 5.84]], null, [["music", 29.69], ["gunshot, gunfire", 5.91], ["bang", 4.64]], null, null, null], "duration": [3.54, 2.67, 2.13, -0.3, 2.17, 0.5, 3.72, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/ezj13E-cX9I_filtered.json b/annotations_filtered/ezj13E-cX9I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97fd7042e5ab80752b0215b04bea3a8a24133496 --- /dev/null +++ b/annotations_filtered/ezj13E-cX9I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 20.39], [23.0, 33.2], [40.0, 63.48], [64.0, 64.42], [66.0, 66.66], [70.0, 72.25], [73.0, 74.48]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [35.49, 32.51, 31.27, 0.0, 0.0, 91.98, 0.0], "audiomae_on_audioset": [[["speech", 65.87], ["screaming", 3.88], ["hum", 3.1]], [["speech", 71.38], ["fireworks", 21.25], ["firecracker", 1.35]], [["vehicle", 10.32], ["hum", 8.97], ["noise", 7.4]], null, null, null, null], "duration": [16.39, 10.2, 23.48, 0.42, 0.66, 2.25, 1.48]} \ No newline at end of file