diff --git a/annotations_filtered/c--eNhRG5B4_filtered.json b/annotations_filtered/c--eNhRG5B4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f5f03944fdb604cf960ece9ba1eab76d1d20b6d --- /dev/null +++ b/annotations_filtered/c--eNhRG5B4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 12.75], [16.0, 17.24], [21.0, 24.0], [27.0, 27.03], [28.0, 29.71], [33.0, 33.18], [34.0, 34.3], [36.0, 38.08], [38.0, 38.84], [40.0, 40.02], [40.0, 40.66], [42.0, 45.32], [46.0, 46.75], [48.0, 47.97], [52.0, 53.87], [55.0, 57.06], [58.0, 58.99], [61.0, 61.5], [62.0, 64.79], [65.0, 68.23], [71.0, 75.93], [83.0, 86.93], [99.0, 99.99], [114.0, 130.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 50.86, 0.0, 0.0, 0.0, 0.0, 97.33, 0.0, 0.0, 0.0, 73.97, 0.0, 0.0, 0.0, 98.01, 0.0, 0.0, 75.55, 42.84, 34.5, 30.4, 0.0, 30.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.76], ["speech", 30.82], ["musical instrument", 4.26]], [["music", 38.03], ["effects unit", 9.21], ["musical instrument", 6.73]], [["music", 69.33], ["effects unit", 4.15], ["musical instrument", 3.77]], null, [["music", 43.41], ["effects unit", 9.97], ["theremin", 5.91]]], "duration": [-0.25, 1.24, 3.0, 0.03, 1.71, 0.18, 0.3, 2.08, 0.84, 0.02, 0.66, 3.32, 0.75, -0.03, 1.87, 2.06, 0.99, 0.5, 2.79, 3.23, 4.93, 3.93, 0.99, 16.59]} \ No newline at end of file diff --git a/annotations_filtered/c-NDI-HvYd4_filtered.json b/annotations_filtered/c-NDI-HvYd4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6fda6b380a7d562d9c0f370ac52dd62d93009e9e --- /dev/null +++ b/annotations_filtered/c-NDI-HvYd4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.95], [20.0, 29.0], [32.0, 51.93], [58.0, 113.16], [116.0, 128.36], [131.0, 131.84]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 30.7, 30.3, 0.0, 29.33, 0.0], "audiomae_on_audioset": [null, [["music", 67.8], ["speech", 8.21], ["musical instrument", 2.94]], [["speech", 38.27], ["buzz", 26.84], ["music", 15.7]], null, [["fly, housefly", 36.74], ["mosquito", 21.11], ["insect", 20.32]], null], "duration": [0.95, 9.0, 19.93, 55.16, 12.36, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/c-ecbGNxEHM_filtered.json b/annotations_filtered/c-ecbGNxEHM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06d7ed7ca1f05b9fcce7b7217180fff8156f4132 --- /dev/null +++ b/annotations_filtered/c-ecbGNxEHM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.2], [21.0, 22.96], [23.0, 29.19], [35.0, 35.72], [39.0, 39.14], [39.0, 40.53], [41.0, 43.6], [45.0, 45.49], [47.0, 47.95], [60.0, 68.1], [75.0, 75.69], [79.0, 79.73], [81.0, 82.59], [87.0, 91.89], [95.0, 99.23], [101.0, 101.76], [103.0, 103.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 34.29, 0.0, 0.0, 0.0, 55.81, 0.0, 0.0, 41.7, 0.0, 0.0, 0.0, 38.05, 34.43, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 67.49], ["theremin", 7.38], ["ambient music", 6.2]], null, null, null, null, null, null, [["throbbing", 55.09], ["hum", 19.79], ["heart sounds, heartbeat", 7.4]], null, null, null, [["speech", 53.0], ["music", 12.31], ["hum", 5.12]], [["speech", 34.19], ["sidetone", 12.52], ["hum", 6.99]], null, null], "duration": [0.2, 1.96, 6.19, 0.72, 0.14, 1.53, 2.6, 0.49, 0.95, 8.1, 0.69, 0.73, 1.59, 4.89, 4.23, 0.76, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/c-ej3IOxBno_filtered.json b/annotations_filtered/c-ej3IOxBno_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c89b8bad5a83574d17b28b6460faa5d0e76ce318 --- /dev/null +++ b/annotations_filtered/c-ej3IOxBno_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.4], [3.0, 4.48], [8.0, 8.43], [10.0, 11.2], [12.0, 14.22], [15.0, 16.92], [19.0, 20.61], [22.0, 29.84], [32.0, 32.86]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.4, 1.48, 0.43, 1.2, 2.22, 1.92, 1.61, 7.84, 0.86]} \ No newline at end of file diff --git a/annotations_filtered/c-jOeDA-X0k_filtered.json b/annotations_filtered/c-jOeDA-X0k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0e767c6098d9ff92c48b18c993569e0e993e993 --- /dev/null +++ b/annotations_filtered/c-jOeDA-X0k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.01], [6.0, 8.02], [9.0, 10.27], [13.0, 15.62], [17.0, 33.62], [35.0, 35.18], [39.0, 39.5], [41.0, 43.31], [44.0, 44.9], [46.0, 50.67], [52.0, 51.7], [55.0, 56.03], [60.0, 66.87], [67.0, 70.11], [74.0, 75.52], [77.0, 77.16], [79.0, 78.78], [80.0, 81.67], [84.0, 84.87], [86.0, 86.27], [91.0, 114.71], [117.0, 117.37], [119.0, 119.94]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 99.71, 0.0, 99.44, 41.01, 0.0, 0.0, 35.32, 0.0, 39.64, 0.0, 0.0, 32.96, 36.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.92, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 62.67], ["music", 7.16], ["bouncing", 5.57]], null, null, [["didgeridoo", 52.55], ["mains hum", 10.61], ["sidetone", 6.89]], null, [["speech", 23.69], ["music", 22.55], ["mains hum", 10.27]], null, null, [["music", 31.26], ["didgeridoo", 30.99], ["hum", 6.33]], [["didgeridoo", 25.35], ["music", 18.32], ["speech", 15.31]], null, null, null, null, null, null, [["speech", 41.82], ["music", 18.51], ["effects unit", 5.27]], null, null], "duration": [1.01, 2.02, 1.27, 2.62, 16.62, 0.18, 0.5, 2.31, 0.9, 4.67, -0.3, 1.03, 6.87, 3.11, 1.52, 0.16, -0.22, 1.67, 0.87, 0.27, 23.71, 0.37, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/c-tGV96ceBM_filtered.json b/annotations_filtered/c-tGV96ceBM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ccdd203e5ef5a0b7e69866daf3d60f25c159568f --- /dev/null +++ b/annotations_filtered/c-tGV96ceBM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.42], [14.0, 15.53], [16.0, 18.96], [20.0, 21.86], [25.0, 25.95], [32.0, 32.61], [33.0, 33.64], [36.0, 35.92], [39.0, 39.82], [42.0, 43.38], [50.0, 51.44], [52.0, 55.05], [56.0, 56.64], [58.0, 58.5], [60.0, 62.28], [65.0, 65.37], [71.0, 71.19], [71.0, 72.84], [76.0, 76.05], [77.0, 78.06], [83.0, 84.25], [86.0, 98.07], [100.0, 102.24], [104.0, 105.31], [106.0, 106.81], [109.0, 109.53], [111.0, 111.91], [113.0, 114.42], [115.0, 118.66], [119.0, 121.22], [122.0, 134.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [81.35, 0.0, 76.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.59, 0.0, 0.0, 61.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.77, 98.86, 0.0, 0.0, 0.0, 0.0, 0.0, 45.4, 97.22, 99.71], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.58], ["rumble", 13.13], ["hum", 10.9]], null, null], "duration": [3.42, 1.53, 2.96, 1.86, 0.95, 0.61, 0.64, -0.08, 0.82, 1.38, 1.44, 3.05, 0.64, 0.5, 2.28, 0.37, 0.19, 1.84, 0.05, 1.06, 1.25, 12.07, 2.24, 1.31, 0.81, 0.53, 0.91, 1.42, 3.66, 2.22, 12.64]} \ No newline at end of file diff --git a/annotations_filtered/c-unYxWW6ws_filtered.json b/annotations_filtered/c-unYxWW6ws_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85ab3e2308b23273b91842f1e8dd9fad10eafac3 --- /dev/null +++ b/annotations_filtered/c-unYxWW6ws_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 8.02], [9.0, 9.66], [10.0, 13.51], [14.0, 14.96], [16.0, 18.35], [21.0, 23.38], [25.0, 26.2], [27.0, 28.95], [30.0, 30.92], [32.0, 31.95], [33.0, 33.91], [35.0, 41.1], [43.0, 46.47], [48.0, 54.46], [56.0, 57.52], [59.0, 61.69], [65.0, 67.83], [70.0, 71.98], [74.0, 75.63], [85.0, 88.65], [95.0, 99.87], [102.0, 103.52], [105.0, 109.58], [115.0, 119.06], [121.0, 122.32], [129.0, 132.76], [136.0, 138.67], [141.0, 144.51], [146.0, 150.43], [151.0, 152.85], [155.0, 157.08], [159.0, 159.9], [161.0, 166.04], [168.0, 174.8]], "keep_status": [true, false, true, false, true, true, false, false, false, false, false, true, true, true, false, true, true, false, false, true, false, false, false, true, false, true, true, true, true, false, false, false, false, false], "silence_prob": [41.34, 0.0, 39.72, 0.0, 48.31, 42.02, 0.0, 0.0, 0.0, 0.0, 0.0, 46.64, 44.87, 47.05, 0.0, 38.38, 41.32, 0.0, 0.0, 40.02, 38.28, 0.0, 40.99, 46.9, 0.0, 48.23, 39.15, 41.7, 38.84, 0.0, 39.94, 0.0, 36.8, 33.54], "audiomae_on_audioset": [[["hum", 25.59], ["mains hum", 12.82], ["throbbing", 8.37]], null, [["hum", 22.11], ["speech", 19.54], ["whale vocalization", 9.24]], null, [["hum", 35.17], ["throbbing", 11.11], ["music", 9.26]], [["music", 13.88], ["hum", 10.59], ["speech", 10.52]], null, null, null, null, null, [["rumble", 21.42], ["speech", 11.46], ["hum", 7.3]], [["speech", 43.64], ["hum", 13.17], ["rumble", 11.67]], [["music", 53.9], ["musical instrument", 4.2], ["theremin", 2.81]], null, [["music", 55.9], ["hum", 6.92], ["throbbing", 5.41]], [["music", 37.45], ["speech", 17.61], ["hum", 4.22]], null, null, [["music", 36.08], ["speech", 16.53], ["synthesizer", 3.43]], [["music", 61.53], ["ambient music", 7.05], ["harmonic", 4.26]], null, [["music", 50.05], ["ambient music", 16.0], ["whale vocalization", 6.53]], [["speech", 57.09], ["field recording", 6.19], ["rumble", 5.5]], null, [["speech", 16.8], ["fire", 6.47], ["vehicle", 6.14]], [["speech", 25.43], ["music", 21.33], ["hum", 20.62]], [["music", 35.49], ["hum", 7.98], ["electronic music", 5.13]], [["music", 49.43], ["didgeridoo", 5.18], ["speech", 5.13]], null, [["music", 48.16], ["synthesizer", 18.3], ["ambient music", 7.19]], null, [["music", 71.4], ["musical instrument", 3.32], ["gong", 3.0]], [["music", 64.7], ["musical instrument", 5.76], ["guitar", 4.98]]], "duration": [7.02, 0.66, 3.51, 0.96, 2.35, 2.38, 1.2, 1.95, 0.92, -0.05, 0.91, 6.1, 3.47, 6.46, 1.52, 2.69, 2.83, 1.98, 1.63, 3.65, 4.87, 1.52, 4.58, 4.06, 1.32, 3.76, 2.67, 3.51, 4.43, 1.85, 2.08, 0.9, 5.04, 6.8]} \ No newline at end of file diff --git a/annotations_filtered/c-veUs6bPHY_filtered.json b/annotations_filtered/c-veUs6bPHY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..156bf62f9590927b939e17f3c47ba6ab03ad34fd --- /dev/null +++ b/annotations_filtered/c-veUs6bPHY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.3], [0.0, 7.47], [9.0, 9.39], [12.0, 12.72], [14.0, 16.11], [22.0, 22.72], [24.0, 25.25], [32.0, 32.14], [37.0, 37.77], [38.0, 38.96], [40.0, 40.53], [51.0, 51.8], [52.0, 54.72], [66.0, 67.61], [69.0, 74.68], [76.0, 79.05], [81.0, 81.38], [82.0, 82.43], [83.0, 83.91], [92.0, 94.73], [97.0, 97.56], [103.0, 103.84], [109.0, 110.22], [111.0, 112.51], [113.0, 116.55], [131.0, 131.28]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 34.93, 0.0, 0.0, 36.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.08, 0.0, 33.67, 35.12, 0.0, 0.0, 0.0, 33.54, 0.0, 0.0, 0.0, 0.0, 34.82, 0.0], "audiomae_on_audioset": [null, [["noise", 46.75], ["hum", 6.66], ["whale vocalization", 5.04]], null, null, [["sine wave", 23.79], ["hum", 11.84], ["chirp tone", 8.58]], null, null, null, null, null, null, null, [["hum", 20.66], ["music", 17.31], ["speech", 14.34]], null, [["speech", 44.64], ["hum", 12.75], ["mains hum", 8.95]], [["hum", 45.97], ["mains hum", 19.85], ["throbbing", 12.65]], null, null, null, [["speech", 55.32], ["hum", 8.2], ["bee, wasp, etc.", 5.57]], null, null, null, null, [["hum", 52.14], ["mains hum", 23.69], ["throbbing", 17.08]], null], "duration": [0.3, 7.47, 0.39, 0.72, 2.11, 0.72, 1.25, 0.14, 0.77, 0.96, 0.53, 0.8, 2.72, 1.61, 5.68, 3.05, 0.38, 0.43, 0.91, 2.73, 0.56, 0.84, 1.22, 1.51, 3.55, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/c-zaHGYURv0_filtered.json b/annotations_filtered/c-zaHGYURv0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04e23e03757e66bc3a555828265effcd5a1e34c6 --- /dev/null +++ b/annotations_filtered/c-zaHGYURv0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.97], [1.0, 1.04], [5.0, 5.97], [11.0, 11.01], [12.0, 21.05], [22.0, 23.21], [28.0, 28.75], [32.0, 36.41], [37.0, 52.0], [54.0, 54.62], [55.0, 56.67], [60.0, 62.29], [64.0, 64.77], [65.0, 76.45], [78.0, 84.28], [91.0, 94.19], [95.0, 96.67], [98.0, 98.9], [101.0, 104.87], [107.0, 106.76], [107.0, 106.83], [107.0, 114.37], [115.0, 115.75], [117.0, 117.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 72.6, 0.0, 0.0, 43.2, 51.5, 0.0, 0.0, 69.61, 0.0, 45.3, 41.98, 61.87, 0.0, 0.0, 62.89, 0.0, 0.0, 31.8, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["mains hum", 48.17], ["hum", 29.27], ["speech", 4.95]], null, null, null, null, null, [["music", 56.67], ["musical instrument", 4.75], ["marimba, xylophone", 4.21]], [["music", 34.11], ["mains hum", 18.6], ["hum", 17.31]], null, null, null, null, null, null, [["mains hum", 36.41], ["hum", 16.38], ["music", 14.0]], null, null], "duration": [-0.03, 0.04, 0.97, 0.01, 9.05, 1.21, 0.75, 4.41, 15.0, 0.62, 1.67, 2.29, 0.77, 11.45, 6.28, 3.19, 1.67, 0.9, 3.87, -0.24, -0.17, 7.37, 0.75, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/c0-3FQ-_SAg_filtered.json b/annotations_filtered/c0-3FQ-_SAg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b12f88e27aac9618c14c29dcf75f7b572eca3ad7 --- /dev/null +++ b/annotations_filtered/c0-3FQ-_SAg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.78], [10.0, 11.18], [17.0, 68.39], [69.0, 70.58], [73.0, 77.23], [80.0, 89.04], [93.0, 93.75], [96.0, 120.38], [123.0, 124.38], [129.0, 132.0], [133.0, 137.12], [139.0, 139.36], [140.0, 149.71]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.95, 31.52, 0.0, 29.68, 0.0, 78.38, 53.97, 0.0, 41.03], "audiomae_on_audioset": [null, null, null, null, [["fart", 37.84], ["sound effect", 10.16], ["groan", 9.5]], [["speech", 82.77], ["didgeridoo", 2.49], ["music", 1.61]], null, [["music", 24.27], ["livestock, farm animals, working animals", 15.7], ["speech", 12.7]], null, null, null, null, [["music", 65.3], ["speech", 11.15], ["thunk", 3.98]]], "duration": [0.78, 1.18, 51.39, 1.58, 4.23, 9.04, 0.75, 24.38, 1.38, 3.0, 4.12, 0.36, 9.71]} \ No newline at end of file diff --git a/annotations_filtered/c0JxgKT4jZc_filtered.json b/annotations_filtered/c0JxgKT4jZc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5ca9623ea96d590691d92d46bcdc335be75ed45 --- /dev/null +++ b/annotations_filtered/c0JxgKT4jZc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 66.31], [68.0, 79.14], [81.0, 83.56]], "keep_status": [false, false, false], "silence_prob": [0.0, 99.1, 98.66], "audiomae_on_audioset": [null, null, null], "duration": [35.31, 11.14, 2.56]} \ No newline at end of file diff --git a/annotations_filtered/c0N60xOU9yk_filtered.json b/annotations_filtered/c0N60xOU9yk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..336254599be683c96f79e6d42643d8aa5b430f8b --- /dev/null +++ b/annotations_filtered/c0N60xOU9yk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.82], [19.0, 21.14], [26.0, 26.4], [29.0, 29.54], [32.0, 31.7], [38.0, 38.15], [40.0, 41.18], [44.0, 45.37], [51.0, 52.27], [53.0, 54.19], [58.0, 58.04], [59.0, 59.02], [61.0, 61.43], [63.0, 62.78], [68.0, 68.88], [72.0, 72.81], [85.0, 84.69], [88.0, 88.59], [106.0, 106.07], [111.0, 113.14], [114.0, 114.76], [121.0, 120.66], [124.0, 127.13], [129.0, 129.3], [133.0, 133.22], [134.0, 134.32], [139.0, 139.68], [141.0, 141.74], [160.0, 160.3], [163.0, 168.47], [169.0, 172.64], [174.0, 176.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.93, 59.96, 72.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.82, 2.14, 0.4, 0.54, -0.3, 0.15, 1.18, 1.37, 1.27, 1.19, 0.04, 0.02, 0.43, -0.22, 0.88, 0.81, -0.31, 0.59, 0.07, 2.14, 0.76, -0.34, 3.13, 0.3, 0.22, 0.32, 0.68, 0.74, 0.3, 5.47, 3.64, 2.32]} \ No newline at end of file diff --git a/annotations_filtered/c0RlK3VAmzg_filtered.json b/annotations_filtered/c0RlK3VAmzg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67ae8b3f6c6f9e4789442fa5c3d1b06e0c11bbb8 --- /dev/null +++ b/annotations_filtered/c0RlK3VAmzg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.37], [16.0, 16.11], [17.0, 17.25], [24.0, 24.38], [26.0, 26.4], [34.0, 35.7], [37.0, 40.95], [42.0, 42.92], [53.0, 52.86], [53.0, 61.5], [63.0, 66.09], [68.0, 70.75], [71.0, 71.52], [96.0, 98.19], [106.0, 106.52], [125.0, 126.91]], "keep_status": [true, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [42.81, 0.0, 0.0, 0.0, 0.0, 0.0, 49.31, 0.0, 0.0, 33.09, 99.16, 68.54, 0.0, 78.21, 0.0, 0.0], "audiomae_on_audioset": [[["sine wave", 12.59], ["hum", 11.63], ["throbbing", 10.25]], null, null, null, null, null, [["music", 54.09], ["speech", 10.06], ["hum", 4.92]], null, null, [["speech", 23.18], ["fart", 14.34], ["sidetone", 12.2]], null, null, null, null, null, null], "duration": [4.37, 0.11, 0.25, 0.38, 0.4, 1.7, 3.95, 0.92, -0.14, 8.5, 3.09, 2.75, 0.52, 2.19, 0.52, 1.91]} \ No newline at end of file diff --git a/annotations_filtered/c0XTkj3PIWg_filtered.json b/annotations_filtered/c0XTkj3PIWg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddd6c1b677ba3e1ae3ce44d065e95fe300463fd1 --- /dev/null +++ b/annotations_filtered/c0XTkj3PIWg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.22], [22.0, 27.99], [29.0, 29.96], [34.0, 34.87], [36.0, 37.4], [38.0, 39.87], [41.0, 43.34], [45.0, 45.81], [50.0, 53.7], [55.0, 55.73], [56.0, 61.94], [65.0, 64.66], [65.0, 66.61], [67.0, 68.17], [80.0, 80.62], [81.0, 81.48], [83.0, 84.48], [88.0, 87.81], [99.0, 101.78], [103.0, 116.92], [117.0, 126.32], [127.0, 126.71], [129.0, 129.22], [131.0, 131.77], [133.0, 133.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 53.72, 0.0, 0.0, 0.0, 0.0, 57.01, 0.0, 64.07, 0.0, 57.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.14, 42.6, 48.1, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 20.73], ["thunk", 7.88], ["boing", 7.15]], [["music", 61.73], ["hum", 10.22], ["synthesizer", 4.69]], [["music", 35.0], ["speech", 11.13], ["fly, housefly", 7.93]], null, null, null, null], "duration": [0.22, 5.99, 0.96, 0.87, 1.4, 1.87, 2.34, 0.81, 3.7, 0.73, 5.94, -0.34, 1.61, 1.17, 0.62, 0.48, 1.48, -0.19, 2.78, 13.92, 9.32, -0.29, 0.22, 0.77, 0.08]} \ No newline at end of file diff --git a/annotations_filtered/c0wH6YDfCzg_filtered.json b/annotations_filtered/c0wH6YDfCzg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e468ccc9afd92f43963ab23e92610a85470327c3 --- /dev/null +++ b/annotations_filtered/c0wH6YDfCzg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.88], [8.0, 8.34], [11.0, 11.77], [13.0, 13.83], [15.0, 15.26], [17.0, 28.11], [30.0, 31.41], [35.0, 38.75], [39.0, 48.24], [49.0, 51.06], [58.0, 59.49], [73.0, 80.32], [85.0, 99.13], [103.0, 124.33], [127.0, 127.62], [133.0, 133.78], [138.0, 139.19], [144.0, 145.86], [151.0, 152.44], [157.0, 158.68], [167.0, 168.62]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, true, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 0.0, 47.27, 34.88, 36.3, 0.0, 33.95, 37.24, 38.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 20.05], ["mains hum", 9.61], ["music", 7.84]], [["speech", 57.77], ["noise", 10.01], ["buzz", 8.07]], [["speech", 31.54], ["radio", 14.36], ["fly, housefly", 3.99]], null, [["mains hum", 22.85], ["hum", 19.54], ["buzz", 14.76]], [["music", 49.33], ["theremin", 11.1], ["buzz", 4.6]], [["music", 48.34], ["brass instrument", 13.65], ["wind instrument, woodwind instrument", 6.42]], null, null, null, null, null, null, null], "duration": [0.88, 0.34, 0.77, 0.83, 0.26, 11.11, 1.41, 3.75, 9.24, 2.06, 1.49, 7.32, 14.13, 21.33, 0.62, 0.78, 1.19, 1.86, 1.44, 1.68, 1.62]} \ No newline at end of file diff --git a/annotations_filtered/c17KWinVFss_filtered.json b/annotations_filtered/c17KWinVFss_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0af192744d51c149b7855a6543e5b1a767d2b2c3 --- /dev/null +++ b/annotations_filtered/c17KWinVFss_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.77], [12.0, 13.88], [15.0, 16.36], [19.0, 20.26], [21.0, 21.24], [22.0, 24.06], [30.0, 30.06], [31.0, 31.46], [34.0, 34.59], [37.0, 38.28], [40.0, 41.96], [43.0, 44.9], [49.0, 81.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [56.25, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.77, 1.88, 1.36, 1.26, 0.24, 2.06, 0.06, 0.46, 0.59, 1.28, 1.96, 1.9, 32.97]} \ No newline at end of file diff --git a/annotations_filtered/c1EyN9xTK94_filtered.json b/annotations_filtered/c1EyN9xTK94_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ffac7b7f6d6be6f304c5143003ef0067d00fc619 --- /dev/null +++ b/annotations_filtered/c1EyN9xTK94_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.01], [21.0, 21.29], [23.0, 23.92], [25.0, 25.35], [27.0, 27.08], [28.0, 28.73], [30.0, 30.47], [40.0, 43.11], [45.0, 45.23], [50.0, 50.94], [55.0, 55.85], [56.0, 58.82]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.21, 0.0, 0.0, 0.0, 84.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["tuning fork", 22.47], ["music", 18.33], ["chirp tone", 15.55]], null, null, null, null], "duration": [0.01, 0.29, 0.92, 0.35, 0.08, 0.73, 0.47, 3.11, 0.23, 0.94, 0.85, 2.82]} \ No newline at end of file diff --git a/annotations_filtered/c1nmARXTuvE_filtered.json b/annotations_filtered/c1nmARXTuvE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b52870b11b32f2d6dd8e612b3da21d281e4b88e3 --- /dev/null +++ b/annotations_filtered/c1nmARXTuvE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.65], [11.0, 12.63], [18.0, 19.08], [24.0, 29.15], [30.0, 32.61], [37.0, 37.13], [40.0, 42.84], [45.0, 46.41], [52.0, 58.68], [59.0, 62.29], [63.0, 65.4], [72.0, 79.39], [81.0, 84.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.26, 99.98, 0.0, 99.78, 0.0, 100.0, 86.64, 48.91, 93.6, 85.17], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 17.84], ["fly, housefly", 17.39], ["sine wave", 12.57]], null, null], "duration": [1.65, 1.63, 1.08, 5.15, 2.61, 0.13, 2.84, 1.41, 6.68, 3.29, 2.4, 7.39, 3.59]} \ No newline at end of file diff --git a/annotations_filtered/c2HEnbmtknM_filtered.json b/annotations_filtered/c2HEnbmtknM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b7d5c7634b4a8a8a8da57a800a2175bc739f522 --- /dev/null +++ b/annotations_filtered/c2HEnbmtknM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.59], [13.0, 47.44], [49.0, 53.03], [54.0, 62.06], [63.0, 91.03], [93.0, 95.47], [97.0, 98.52], [99.0, 117.32]], "keep_status": [false, false, false, true, false, false, false, false], "silence_prob": [30.56, 0.0, 99.96, 33.13, 31.0, 36.18, 0.0, 31.4], "audiomae_on_audioset": [[["mains hum", 39.47], ["hum", 17.27], ["music", 14.24]], null, null, [["music", 43.25], ["speech", 12.31], ["breaking", 5.26]], [["speech", 46.95], ["music", 12.61], ["hum", 12.6]], [["hum", 33.82], ["music", 21.11], ["throbbing", 15.93]], null, [["speech", 36.14], ["music", 24.38], ["breaking", 11.58]]], "duration": [4.59, 34.44, 4.03, 8.06, 28.03, 2.47, 1.52, 18.32]} \ No newline at end of file diff --git a/annotations_filtered/c2HZzrcEbZc_filtered.json b/annotations_filtered/c2HZzrcEbZc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d86435daafe3e2961c65ffca2d21d9a3bc817b7 --- /dev/null +++ b/annotations_filtered/c2HZzrcEbZc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.54], [12.0, 13.22], [15.0, 14.61], [17.0, 18.05], [20.0, 21.68], [23.0, 51.44], [54.0, 55.41], [58.0, 67.71], [68.0, 69.16], [70.0, 70.48], [72.0, 73.01], [74.0, 85.35], [92.0, 105.29], [108.0, 109.36], [112.0, 121.76], [126.0, 126.6], [129.0, 136.76], [138.0, 140.83], [142.0, 190.38]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, true, false, false, true, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.03, 0.0, 37.39, 0.0, 0.0, 0.0, 34.72, 34.46, 0.0, 35.98, 0.0, 41.95, 33.75, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 27.5], ["speech", 24.94], ["whack, thwack", 12.92]], null, [["music", 30.94], ["cattle, bovinae", 15.18], ["livestock, farm animals, working animals", 11.0]], null, null, null, [["music", 56.59], ["hum", 5.55], ["speech", 4.89]], [["music", 80.04], ["throbbing", 2.88], ["didgeridoo", 2.76]], null, [["music", 38.16], ["hum", 13.03], ["throbbing", 8.83]], null, [["speech", 50.54], ["music", 8.39], ["hum", 4.56]], [["vehicle", 19.78], ["music", 17.42], ["car", 6.1]], null], "duration": [0.54, 1.22, -0.39, 1.05, 1.68, 28.44, 1.41, 9.71, 1.16, 0.48, 1.01, 11.35, 13.29, 1.36, 9.76, 0.6, 7.76, 2.83, 48.38]} \ No newline at end of file diff --git a/annotations_filtered/c2TcT9JairA_filtered.json b/annotations_filtered/c2TcT9JairA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f93998e082bb64df2efeae2e48e39c14fcec8037 --- /dev/null +++ b/annotations_filtered/c2TcT9JairA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.5], [15.0, 23.11], [26.0, 25.86], [27.0, 29.0], [29.0, 30.0], [32.0, 32.9], [38.0, 43.44], [48.0, 59.61], [60.0, 60.44], [62.0, 62.04], [65.0, 71.42]], "keep_status": [false, true, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 48.02, 0.0, 46.83, 0.0, 0.0, 58.22, 48.23, 0.0, 0.0, 44.81], "audiomae_on_audioset": [null, [["music", 25.51], ["fly, housefly", 13.93], ["speech", 13.52]], null, [["music", 13.62], ["speech", 12.21], ["musical instrument", 2.22]], null, null, null, [["music", 25.18], ["livestock, farm animals, working animals", 15.53], ["speech", 13.25]], null, null, [["speech", 36.29], ["music", 23.59], ["trombone", 14.77]]], "duration": [0.5, 8.11, -0.14, 2.0, 1.0, 0.9, 5.44, 11.61, 0.44, 0.04, 6.42]} \ No newline at end of file diff --git a/annotations_filtered/c2ecZiVEs70_filtered.json b/annotations_filtered/c2ecZiVEs70_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd1d73503fcb92f6f2e298daeb3e0266cf4b8910 --- /dev/null +++ b/annotations_filtered/c2ecZiVEs70_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.62], [19.0, 21.44], [23.0, 25.71], [26.0, 100.21], [106.0, 105.97], [113.0, 113.21], [116.0, 125.54], [126.0, 131.73], [132.0, 133.08], [134.0, 134.96], [136.0, 136.65], [138.0, 138.03], [139.0, 140.59], [143.0, 143.94]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 72.01, 89.36, 0.0, 0.0, 0.0, 48.82, 36.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["telephone bell ringing", 41.71], ["music", 31.33], ["telephone", 7.55]], [["speech", 32.98], ["fart", 12.01], ["hum", 7.26]], null, null, null, null, null, null], "duration": [0.62, 2.44, 2.71, 74.21, -0.03, 0.21, 9.54, 5.73, 1.08, 0.96, 0.65, 0.03, 1.59, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/c2k_kuU84ro_filtered.json b/annotations_filtered/c2k_kuU84ro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c9b1bb4c67daddf763a30d3b0b7226615915249 --- /dev/null +++ b/annotations_filtered/c2k_kuU84ro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[71.0, 139.94], [143.0, 147.99], [149.0, 152.39], [154.0, 172.56], [174.0, 182.28]], "keep_status": [false, true, false, false, true], "silence_prob": [0.0, 29.79, 28.88, 29.07, 28.61], "audiomae_on_audioset": [null, [["music", 21.98], ["rumble", 6.88], ["speech", 6.03]], [["speech", 35.31], ["music", 21.58], ["whip", 14.29]], [["speech", 45.54], ["music", 24.83], ["clang", 5.23]], [["music", 49.74], ["speech", 7.62], ["burst, pop", 2.76]]], "duration": [68.94, 4.99, 3.39, 18.56, 8.28]} \ No newline at end of file diff --git a/annotations_filtered/c2tWZFAL5t4_filtered.json b/annotations_filtered/c2tWZFAL5t4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc8bb88010f4da1f7a9417490786ebcfc736b1e6 --- /dev/null +++ b/annotations_filtered/c2tWZFAL5t4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 12.06], [12.0, 12.45], [14.0, 55.05], [58.0, 82.75], [85.0, 85.19], [87.0, 101.61], [105.0, 113.81], [115.0, 115.87], [124.0, 124.73], [126.0, 126.01], [130.0, 130.94], [132.0, 150.7], [151.0, 163.7]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [29.78, 0.0, 0.0, 30.28, 0.0, 30.1, 31.12, 0.0, 0.0, 0.0, 0.0, 30.05, 30.54], "audiomae_on_audioset": [[["music", 47.17], ["synthesizer", 11.08], ["theremin", 10.78]], null, null, [["music", 75.19], ["musical instrument", 10.03], ["didgeridoo", 4.94]], null, [["music", 26.09], ["siren", 8.72], ["didgeridoo", 7.72]], [["music", 52.97], ["didgeridoo", 29.08], ["musical instrument", 4.06]], null, null, null, null, [["music", 37.94], ["didgeridoo", 33.06], ["musical instrument", 8.68]], [["music", 57.31], ["hum", 7.24], ["throbbing", 7.17]]], "duration": [10.06, 0.45, 41.05, 24.75, 0.19, 14.61, 8.81, 0.87, 0.73, 0.01, 0.94, 18.7, 12.7]} \ No newline at end of file diff --git a/annotations_filtered/c35RsjYzAhY_filtered.json b/annotations_filtered/c35RsjYzAhY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6be79a0ec064ebbd2c21e65a9bd5dde9641a7241 --- /dev/null +++ b/annotations_filtered/c35RsjYzAhY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.21], [19.0, 19.84], [25.0, 25.98], [28.0, 29.07], [36.0, 36.12], [43.0, 45.01]], "keep_status": [true, false, false, false, false, true], "silence_prob": [35.86, 0.0, 0.0, 0.0, 0.0, 33.4], "audiomae_on_audioset": [[["hum", 25.92], ["mains hum", 24.36], ["speech", 17.95]], null, null, null, null, [["fly, housefly", 13.35], ["mosquito", 7.66], ["crowd", 6.98]]], "duration": [2.21, 0.84, 0.98, 1.07, 0.12, 2.01]} \ No newline at end of file diff --git a/annotations_filtered/c38HJR-9vhU_filtered.json b/annotations_filtered/c38HJR-9vhU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64b06d20b9cd5d71fcd43b99da4d64cc190b8ffa --- /dev/null +++ b/annotations_filtered/c38HJR-9vhU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 32.56], [34.0, 39.78], [41.0, 41.49], [43.0, 44.31], [45.0, 50.82], [52.0, 52.47], [54.0, 68.15], [70.0, 73.16], [73.0, 75.15], [77.0, 77.85], [79.0, 87.79], [90.0, 89.85], [91.0, 92.45], [95.0, 94.58], [95.0, 96.9], [99.0, 99.64], [103.0, 104.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.76, 0.0, 0.0, 99.98, 0.0, 99.85, 93.13, 100.0, 0.0, 97.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.56, 5.78, 0.49, 1.31, 5.82, 0.47, 14.15, 3.16, 2.15, 0.85, 8.79, -0.15, 1.45, -0.42, 1.9, 0.64, 1.92]} \ No newline at end of file diff --git a/annotations_filtered/c3nJu9SBkis_filtered.json b/annotations_filtered/c3nJu9SBkis_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cebafc9f409be035e6c52f63161cc645860206b2 --- /dev/null +++ b/annotations_filtered/c3nJu9SBkis_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.29], [5.0, 5.21], [8.0, 8.23], [9.0, 10.59], [11.0, 16.5], [21.0, 22.5], [24.0, 24.17], [25.0, 25.59], [28.0, 30.13], [32.0, 37.91], [46.0, 47.46], [49.0, 49.32], [53.0, 52.83], [54.0, 54.36], [56.0, 56.3], [62.0, 62.36], [67.0, 72.72], [75.0, 75.96], [77.0, 77.26], [87.0, 94.12], [95.0, 95.3], [96.0, 97.61], [100.0, 107.37], [115.0, 114.98], [119.0, 135.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 68.67, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.22, 0.0, 0.0, 44.43, 0.0, 0.0, 35.49, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 86.58], ["knock", 1.77], ["hands", 1.49]], null, null, [["speech", 71.1], ["knock", 7.38], ["thunk", 2.51]], null, null, [["speech", 69.89], ["thunk", 10.47], ["whack, thwack", 5.11]], null, null], "duration": [0.29, 0.21, 0.23, 1.59, 5.5, 1.5, 0.17, 0.59, 2.13, 5.91, 1.46, 0.32, -0.17, 0.36, 0.3, 0.36, 5.72, 0.96, 0.26, 7.12, 0.3, 1.61, 7.37, -0.02, 16.45]} \ No newline at end of file diff --git a/annotations_filtered/c3uOWTAuaTQ_filtered.json b/annotations_filtered/c3uOWTAuaTQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0339d3c2e97cc18ad4c3ddb056d67edd70192ffa --- /dev/null +++ b/annotations_filtered/c3uOWTAuaTQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.94], [14.0, 15.43], [26.0, 25.71], [35.0, 35.4]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.94, 1.43, -0.29, 0.4]} \ No newline at end of file diff --git a/annotations_filtered/c3vmsUcknhY_filtered.json b/annotations_filtered/c3vmsUcknhY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32b32cc0fc1f98d91dca3466c426a7726b1469f4 --- /dev/null +++ b/annotations_filtered/c3vmsUcknhY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.25], [20.0, 20.43], [22.0, 22.72], [23.0, 31.31], [32.0, 37.44], [38.0, 39.36], [40.0, 40.19], [42.0, 44.88], [48.0, 66.78], [67.0, 66.95], [67.0, 87.51], [88.0, 107.45], [109.0, 108.99], [109.0, 118.54], [121.0, 122.91], [124.0, 125.27]], "keep_status": [true, false, false, true, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [33.3, 0.0, 0.0, 29.0, 28.93, 0.0, 0.0, 28.91, 31.42, 0.0, 29.01, 28.44, 0.0, 28.48, 0.0, 0.0], "audiomae_on_audioset": [[["throbbing", 25.33], ["didgeridoo", 22.78], ["music", 15.84]], null, null, [["music", 48.23], ["speech", 8.63], ["buzz", 4.19]], [["music", 54.86], ["throbbing", 9.21], ["hum", 7.22]], null, null, [["music", 50.5], ["throbbing", 12.26], ["hum", 4.28]], [["music", 51.75], ["didgeridoo", 10.53], ["musical instrument", 7.95]], null, [["music", 45.51], ["throbbing", 25.0], ["didgeridoo", 6.0]], [["music", 38.42], ["speech", 25.6], ["hum", 6.28]], null, [["music", 31.53], ["speech", 15.19], ["buzz", 9.57]], null, null], "duration": [5.25, 0.43, 0.72, 8.31, 5.44, 1.36, 0.19, 2.88, 18.78, -0.05, 20.51, 19.45, -0.01, 9.54, 1.91, 1.27]} \ No newline at end of file diff --git a/annotations_filtered/c3zRfKmcqv8_filtered.json b/annotations_filtered/c3zRfKmcqv8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..546efafbaee6fe3946eb612740772013060dbd4e --- /dev/null +++ b/annotations_filtered/c3zRfKmcqv8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.46], [15.0, 15.03], [19.0, 19.5], [21.0, 21.36], [23.0, 23.99], [36.0, 39.28], [41.0, 40.95], [42.0, 43.61], [44.0, 69.94], [73.0, 73.6], [81.0, 81.21], [83.0, 83.27], [86.0, 91.93], [94.0, 96.97], [98.0, 99.91], [101.0, 104.63], [107.0, 107.5], [108.0, 117.1], [121.0, 122.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 50.36, 0.0, 0.0, 96.17, 0.0, 0.0, 0.0, 84.25, 56.7, 0.0, 54.76, 0.0, 37.83, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["animal", 30.47], ["speech", 13.1], ["livestock, farm animals, working animals", 9.07]], null], "duration": [1.46, 0.03, 0.5, 0.36, 0.99, 3.28, -0.05, 1.61, 25.94, 0.6, 0.21, 0.27, 5.93, 2.97, 1.91, 3.63, 0.5, 9.1, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/c4Wls5pZlxQ_filtered.json b/annotations_filtered/c4Wls5pZlxQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19ab761f54790a3682a33314658b7569014a3849 --- /dev/null +++ b/annotations_filtered/c4Wls5pZlxQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 20.55], [23.0, 27.09], [27.0, 27.55], [31.0, 34.99], [37.0, 37.77], [38.0, 42.38], [46.0, 49.1], [55.0, 57.94], [60.0, 68.22], [71.0, 71.22], [74.0, 97.55], [98.0, 99.28], [99.0, 105.53], [106.0, 106.37], [107.0, 110.83], [115.0, 115.33], [116.0, 118.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.65, 82.43, 0.0, 96.77, 0.0, 62.07, 82.61, 86.64, 70.86, 0.0, 62.99, 0.0, 52.51, 0.0, 74.13, 0.0, 94.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.55, 4.09, 0.55, 3.99, 0.77, 4.38, 3.1, 2.94, 8.22, 0.22, 23.55, 1.28, 6.53, 0.37, 3.83, 0.33, 2.62]} \ No newline at end of file diff --git a/annotations_filtered/c4X58OjlVPo_filtered.json b/annotations_filtered/c4X58OjlVPo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d7dac749355dba8947bec1610b61e809fbb5221 --- /dev/null +++ b/annotations_filtered/c4X58OjlVPo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.14], [6.0, 6.13], [11.0, 10.89], [24.0, 24.78], [30.0, 29.88], [31.0, 32.09], [33.0, 33.44], [35.0, 34.75], [41.0, 40.78], [43.0, 43.58], [45.0, 45.22], [47.0, 51.66], [56.0, 57.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.36, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.14, 0.13, -0.11, 0.78, -0.12, 1.09, 0.44, -0.25, -0.22, 0.58, 0.22, 4.66, 1.55]} \ No newline at end of file diff --git a/annotations_filtered/c4ibjfBu1IY_filtered.json b/annotations_filtered/c4ibjfBu1IY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70e82b13f3e91b1e744f72aca9733fa64752f9e2 --- /dev/null +++ b/annotations_filtered/c4ibjfBu1IY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.93], [4.0, 3.84], [4.0, 7.01], [9.0, 9.58], [10.0, 12.46], [13.0, 15.58], [17.0, 31.99], [35.0, 44.02], [45.0, 45.37], [53.0, 54.73], [55.0, 61.82], [67.0, 68.67], [69.0, 76.54], [79.0, 79.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.58, 0.0, 53.78, 73.21, 71.87, 50.86, 0.0, 0.0, 28.22, 0.0, 29.53, 0.0], "audiomae_on_audioset": [null, null, [["music", 42.69], ["speech", 25.37], ["electric shaver, electric razor", 8.05]], null, null, null, null, null, null, null, [["speech", 45.99], ["music", 18.47], ["vehicle", 14.47]], null, [["speech", 50.68], ["music", 23.46], ["mains hum", 7.97]], null], "duration": [-0.07, -0.16, 3.01, 0.58, 2.46, 2.58, 14.99, 9.02, 0.37, 1.73, 6.82, 1.67, 7.54, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/c4ux2NclHoE_filtered.json b/annotations_filtered/c4ux2NclHoE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b381cbc044fc88cbaf8430627f0efd647d39d7de --- /dev/null +++ b/annotations_filtered/c4ux2NclHoE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.44], [14.0, 50.55], [51.0, 50.85], [58.0, 60.22], [65.0, 82.75], [84.0, 88.64]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.22, 35.59, 33.61], "audiomae_on_audioset": [null, null, null, [["music", 38.86], ["whip", 6.86], ["speech", 5.02]], [["music", 64.36], ["effects unit", 8.35], ["synthesizer", 3.64]], [["music", 72.25], ["didgeridoo", 3.64], ["musical instrument", 3.57]]], "duration": [0.44, 36.55, -0.15, 2.22, 17.75, 4.64]} \ No newline at end of file diff --git a/annotations_filtered/c4w-IE-Hsqc_filtered.json b/annotations_filtered/c4w-IE-Hsqc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..93feea8c3d6f8c523ef0858f2462cbba93be700f --- /dev/null +++ b/annotations_filtered/c4w-IE-Hsqc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.3], [35.0, 35.45], [39.0, 39.85], [51.0, 53.01], [56.0, 55.97], [63.0, 71.68], [72.0, 72.5], [74.0, 74.07], [79.0, 82.44], [83.0, 83.2], [84.0, 84.69], [92.0, 93.07], [94.0, 95.4], [100.0, 100.04], [112.0, 112.68], [114.0, 114.98], [116.0, 116.92], [120.0, 121.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 98.44, 0.0, 65.2, 0.0, 0.0, 93.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.3, 0.45, 0.85, 2.01, -0.03, 8.68, 0.5, 0.07, 3.44, 0.2, 0.69, 1.07, 1.4, 0.04, 0.68, 0.98, 0.92, 1.46]} \ No newline at end of file diff --git a/annotations_filtered/c5BJJbtFP4E_filtered.json b/annotations_filtered/c5BJJbtFP4E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b1fa20a29b188efe5678f822da19d959a1bad06 --- /dev/null +++ b/annotations_filtered/c5BJJbtFP4E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.24], [5.0, 9.0], [10.0, 10.37], [12.0, 32.78], [36.0, 37.08], [40.0, 42.63], [48.0, 48.37], [56.0, 64.44], [70.0, 92.03], [97.0, 101.17], [104.0, 104.52], [106.0, 108.36], [120.0, 125.32]], "keep_status": [false, true, false, false, false, true, false, false, true, true, false, true, false], "silence_prob": [0.0, 36.9, 0.0, 30.83, 0.0, 30.26, 0.0, 31.03, 30.74, 30.93, 0.0, 29.55, 30.39], "audiomae_on_audioset": [null, [["music", 19.71], ["cattle, bovinae", 18.37], ["moo", 15.89]], null, [["music", 53.77], ["cattle, bovinae", 10.64], ["crowd", 6.05]], null, [["moo", 24.43], ["speech", 22.6], ["cattle, bovinae", 18.32]], null, [["music", 47.46], ["livestock, farm animals, working animals", 13.79], ["cattle, bovinae", 10.33]], [["music", 34.75], ["cattle, bovinae", 8.31], ["crowd", 6.59]], [["music", 34.37], ["speech", 26.23], ["crowd", 3.53]], null, [["speech", 20.44], ["crowd", 19.14], ["cheering", 18.39]], [["cattle, bovinae", 45.24], ["moo", 27.05], ["livestock, farm animals, working animals", 15.56]]], "duration": [0.24, 4.0, 0.37, 20.78, 1.08, 2.63, 0.37, 8.44, 22.03, 4.17, 0.52, 2.36, 5.32]} \ No newline at end of file diff --git a/annotations_filtered/c5Re3lGYUA0_filtered.json b/annotations_filtered/c5Re3lGYUA0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71c62e2bc7a369f11bad80a6dde17847b51bba17 --- /dev/null +++ b/annotations_filtered/c5Re3lGYUA0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.61], [5.0, 5.34], [7.0, 21.76], [22.0, 33.67], [39.0, 86.85], [87.0, 88.59], [91.0, 112.78], [113.0, 115.94], [119.0, 122.98]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 66.63, 65.44, 0.0, 0.0, 73.97, 91.64, 65.67], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.61, 0.34, 14.76, 11.67, 47.85, 1.59, 21.78, 2.94, 3.98]} \ No newline at end of file diff --git a/annotations_filtered/c5WfxwnLlLU_filtered.json b/annotations_filtered/c5WfxwnLlLU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da5e9d323438312e04ec00aa3b1bd9477d9ead54 --- /dev/null +++ b/annotations_filtered/c5WfxwnLlLU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.78], [30.0, 32.37]], "keep_status": [false, true], "silence_prob": [0.0, 36.11], "audiomae_on_audioset": [null, [["music", 11.9], ["explosion", 11.49], ["eruption", 9.88]]], "duration": [-0.22, 2.37]} \ No newline at end of file diff --git a/annotations_filtered/c5ZiiE8fyGk_filtered.json b/annotations_filtered/c5ZiiE8fyGk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b1f3530ebc34b6c97a8e721c39520af923b84d8 --- /dev/null +++ b/annotations_filtered/c5ZiiE8fyGk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.11], [7.0, 7.3], [8.0, 8.18], [9.0, 10.15], [12.0, 12.87], [14.0, 15.38], [24.0, 24.81], [26.0, 27.18], [28.0, 29.54], [34.0, 34.96], [36.0, 37.45], [38.0, 38.8], [42.0, 43.17], [45.0, 45.54], [47.0, 47.8], [48.0, 48.03], [52.0, 51.95], [54.0, 55.71], [57.0, 57.57], [62.0, 62.07], [73.0, 73.47], [89.0, 88.7], [93.0, 94.86], [103.0, 103.4], [105.0, 107.28], [108.0, 109.02], [110.0, 111.57], [115.0, 116.13], [120.0, 121.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.78, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.11, 0.3, 0.18, 1.15, 0.87, 1.38, 0.81, 1.18, 1.54, 0.96, 1.45, 0.8, 1.17, 0.54, 0.8, 0.03, -0.05, 1.71, 0.57, 0.07, 0.47, -0.3, 1.86, 0.4, 2.28, 1.02, 1.57, 1.13, 1.2]} \ No newline at end of file diff --git a/annotations_filtered/c5mAaBl_qqk_filtered.json b/annotations_filtered/c5mAaBl_qqk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77b893f44ee980a3af4f6e8848469889ddd56065 --- /dev/null +++ b/annotations_filtered/c5mAaBl_qqk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.52], [5.0, 12.48], [13.0, 13.74], [14.0, 15.13], [16.0, 16.93], [18.0, 20.53], [22.0, 62.19], [63.0, 63.54], [64.0, 86.48], [87.0, 95.44], [97.0, 130.86], [134.0, 134.49], [135.0, 136.92], [138.0, 139.16], [142.0, 144.49], [148.0, 151.17], [152.0, 152.74]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 44.78, 0.0, 0.0, 0.0, 46.26, 0.0, 0.0, 46.72, 46.15, 0.0, 0.0, 0.0, 0.0, 71.57, 52.45, 0.0], "audiomae_on_audioset": [null, [["music", 57.93], ["hum", 10.57], ["electronic music", 6.1]], null, null, null, [["hum", 31.19], ["mains hum", 16.52], ["music", 9.82]], null, null, [["speech", 53.35], ["music", 24.4], ["hum", 6.97]], [["hum", 36.72], ["throbbing", 35.2], ["music", 8.61]], null, null, null, null, null, null, null], "duration": [1.52, 7.48, 0.74, 1.13, 0.93, 2.53, 40.19, 0.54, 22.48, 8.44, 33.86, 0.49, 1.92, 1.16, 2.49, 3.17, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/c5zKpr5gmgk_filtered.json b/annotations_filtered/c5zKpr5gmgk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22e2c40a2bdfb0661f7b8f0eeb8d92d3d4350fc0 --- /dev/null +++ b/annotations_filtered/c5zKpr5gmgk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.07], [12.0, 14.94], [15.0, 15.89], [22.0, 23.43], [24.0, 28.49], [29.0, 29.51], [30.0, 29.62], [33.0, 33.76], [49.0, 49.72], [51.0, 52.17], [57.0, 58.33], [67.0, 67.27], [71.0, 70.75], [82.0, 85.82]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 76.53, 0.0, 0.0, 49.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.71], "audiomae_on_audioset": [null, null, null, null, [["music", 37.51], ["noise", 15.79], ["whale vocalization", 9.7]], null, null, null, null, null, null, null, null, null], "duration": [1.07, 2.94, 0.89, 1.43, 4.49, 0.51, -0.38, 0.76, 0.72, 1.17, 1.33, 0.27, -0.25, 3.82]} \ No newline at end of file diff --git a/annotations_filtered/c6XHLe94SJA_filtered.json b/annotations_filtered/c6XHLe94SJA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4d5a19e8f004b1f1db0cf4ee686f188973b9927 --- /dev/null +++ b/annotations_filtered/c6XHLe94SJA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.05], [3.0, 41.69], [44.0, 46.68], [49.0, 50.23], [51.0, 51.95], [53.0, 60.29], [62.0, 96.65]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 31.38, 0.0, 0.0, 33.96, 0.0], "audiomae_on_audioset": [null, null, [["mains hum", 22.04], ["hum", 19.43], ["eruption", 7.3]], null, null, [["hum", 33.44], ["music", 24.75], ["mains hum", 13.65]], null], "duration": [0.05, 38.69, 2.68, 1.23, 0.95, 7.29, 34.65]} \ No newline at end of file diff --git a/annotations_filtered/c6dmj-WpTW4_filtered.json b/annotations_filtered/c6dmj-WpTW4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e612f85eed45c408c553ad08310281043ba9e655 --- /dev/null +++ b/annotations_filtered/c6dmj-WpTW4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.68], [11.0, 13.9], [15.0, 20.92], [22.0, 26.84], [27.0, 27.85], [30.0, 30.97], [34.0, 38.82], [40.0, 40.34], [42.0, 42.09], [43.0, 44.05], [54.0, 54.92], [56.0, 57.42], [61.0, 62.5], [64.0, 69.04], [73.0, 74.06], [77.0, 108.36], [111.0, 111.6], [112.0, 114.27], [115.0, 115.77], [116.0, 117.8], [119.0, 124.55]], "keep_status": [false, true, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [55.25, 44.84, 47.86, 35.71, 0.0, 0.0, 42.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.69, 0.0, 0.0, 0.0, 45.46, 0.0, 0.0, 40.43], "audiomae_on_audioset": [null, [["speech", 12.84], ["bee, wasp, etc.", 8.07], ["hum", 7.58]], [["bee, wasp, etc.", 19.8], ["fly, housefly", 16.44], ["mains hum", 11.21]], [["animal", 13.88], ["speech", 13.75], ["dog", 10.47]], null, null, [["speech", 54.53], ["hum", 4.59], ["sidetone", 4.43]], null, null, null, null, null, null, [["whistling", 50.28], ["music", 15.54], ["whistle", 10.43]], null, null, null, [["mosquito", 18.38], ["fart", 14.52], ["fly, housefly", 14.24]], null, null, [["hum", 39.79], ["speech", 28.42], ["mains hum", 9.35]]], "duration": [4.68, 2.9, 5.92, 4.84, 0.85, 0.97, 4.82, 0.34, 0.09, 1.05, 0.92, 1.42, 1.5, 5.04, 1.06, 31.36, 0.6, 2.27, 0.77, 1.8, 5.55]} \ No newline at end of file diff --git a/annotations_filtered/c6ik-AA87Uo_filtered.json b/annotations_filtered/c6ik-AA87Uo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d883b80f6618eaf301936bf366b3bd22ef6d85b2 --- /dev/null +++ b/annotations_filtered/c6ik-AA87Uo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 34.53], [38.0, 38.79], [42.0, 42.58], [49.0, 49.33], [55.0, 55.32], [59.0, 60.24], [63.0, 69.89], [72.0, 72.52], [75.0, 75.34], [76.0, 77.28], [82.0, 82.95], [94.0, 94.91], [98.0, 98.32]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 9.32], ["animal", 9.01], ["cattle, bovinae", 7.78]], null, null, null, null, null, null], "duration": [1.53, 0.79, 0.58, 0.33, 0.32, 1.24, 6.89, 0.52, 0.34, 1.28, 0.95, 0.91, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/c6mLa5_GvCQ_filtered.json b/annotations_filtered/c6mLa5_GvCQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..532d0bbd83848374c55253097108fa2f2070a5f0 --- /dev/null +++ b/annotations_filtered/c6mLa5_GvCQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.07], [12.0, 14.39], [28.0, 39.63], [45.0, 44.71], [49.0, 49.84], [54.0, 54.35], [63.0, 64.3], [65.0, 65.82], [71.0, 71.27], [76.0, 76.76], [80.0, 79.84], [80.0, 80.0], [80.0, 80.05], [102.0, 104.72], [112.0, 116.56], [126.0, 125.95], [126.0, 126.99], [129.0, 129.37], [130.0, 131.14], [135.0, 135.7], [146.0, 146.53], [156.0, 156.61], [165.0, 168.02], [169.0, 170.29], [172.0, 172.13], [178.0, 179.1]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.95, 44.2, 30.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.51, 38.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.92, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 29.37], ["mains hum", 15.96], ["hum", 15.43]], [["music", 52.07], ["throbbing", 4.37], ["hum", 4.32]], [["music", 63.91], ["animal", 6.16], ["hum", 4.94]], null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 53.23], ["moo", 20.08], ["cattle, bovinae", 16.98]], [["speech", 44.66], ["music", 9.55], ["noise", 5.69]], null, null, null, null, null, null, null, [["mains hum", 31.62], ["hum", 28.64], ["speech", 16.24]], null, null, null], "duration": [7.07, 2.39, 11.63, -0.29, 0.84, 0.35, 1.3, 0.82, 0.27, 0.76, -0.16, 0.0, 0.05, 2.72, 4.56, -0.05, 0.99, 0.37, 1.14, 0.7, 0.53, 0.61, 3.02, 1.29, 0.13, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/c7-u-fyUSkM_filtered.json b/annotations_filtered/c7-u-fyUSkM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3fc7e683ace785c03a80322ea82f9b45a86818b --- /dev/null +++ b/annotations_filtered/c7-u-fyUSkM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.62], [5.0, 8.92], [10.0, 10.91], [12.0, 12.65], [15.0, 15.4], [17.0, 47.02], [48.0, 51.0], [51.0, 52.15], [54.0, 54.38], [55.0, 59.66], [60.0, 70.04], [71.0, 73.38], [77.0, 81.36], [82.0, 82.97], [85.0, 91.34], [92.0, 95.49], [97.0, 98.05]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.4, 0.0, 0.0, 0.0, 0.0, 37.0, 0.0, 0.0, 60.89, 46.94, 79.07, 65.67, 0.0, 56.18, 56.63, 0.0], "audiomae_on_audioset": [null, [["speech", 32.27], ["hum", 16.64], ["rumble", 13.98]], null, null, null, null, [["wail, moan", 28.6], ["animal", 18.24], ["speech", 16.21]], null, null, null, [["speech", 72.24], ["beatboxing", 1.96], ["fart", 1.52]], null, null, null, null, null, null], "duration": [1.62, 3.92, 0.91, 0.65, 0.4, 30.02, 3.0, 1.15, 0.38, 4.66, 10.04, 2.38, 4.36, 0.97, 6.34, 3.49, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/c77JrXbqqV0_filtered.json b/annotations_filtered/c77JrXbqqV0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0138a8b0356db23702e4f029dce53faffe3016bc --- /dev/null +++ b/annotations_filtered/c77JrXbqqV0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.71], [7.0, 7.59], [9.0, 9.17], [10.0, 10.99], [15.0, 15.03], [18.0, 18.37], [20.0, 21.19], [22.0, 22.69], [23.0, 23.79], [26.0, 26.64], [31.0, 30.86], [32.0, 32.27], [32.0, 32.46], [32.0, 35.28], [38.0, 37.98], [40.0, 40.76], [42.0, 41.96], [43.0, 43.34], [44.0, 45.87], [51.0, 54.9], [56.0, 56.94], [60.0, 60.91], [64.0, 65.3], [74.0, 74.16], [76.0, 77.68], [91.0, 92.01], [110.0, 111.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.17], ["sidetone", 27.68], ["hum", 3.43]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.71, 0.59, 0.17, 0.99, 0.03, 0.37, 1.19, 0.69, 0.79, 0.64, -0.14, 0.27, 0.46, 3.28, -0.02, 0.76, -0.04, 0.34, 1.87, 3.9, 0.94, 0.91, 1.3, 0.16, 1.68, 1.01, 1.99]} \ No newline at end of file diff --git a/annotations_filtered/c7AescgZzEg_filtered.json b/annotations_filtered/c7AescgZzEg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6a086a382437f430a35df2bbcadee7ef22dc579 --- /dev/null +++ b/annotations_filtered/c7AescgZzEg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.88], [14.0, 19.8], [36.0, 36.59], [37.0, 37.13], [48.0, 49.92], [51.0, 58.21], [58.0, 58.41], [59.0, 76.17], [77.0, 78.22], [79.0, 79.64], [87.0, 87.05], [92.0, 91.69], [97.0, 97.39], [98.0, 98.91], [100.0, 101.22], [102.0, 102.12], [105.0, 106.73], [109.0, 108.92], [116.0, 116.95], [118.0, 119.75], [125.0, 129.66], [132.0, 133.96], [137.0, 137.79], [141.0, 143.68], [144.0, 145.32], [152.0, 154.63], [155.0, 155.73], [163.0, 165.64], [166.0, 168.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.37, 94.07, 0.0, 0.0, 0.0, 51.28, 0.0, 85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.72, 0.0, 0.0, 92.64, 0.0, 99.85, 0.0, 99.87, 98.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.88, 5.8, 0.59, 0.13, 1.92, 7.21, 0.41, 17.17, 1.22, 0.64, 0.05, -0.31, 0.39, 0.91, 1.22, 0.12, 1.73, -0.08, 0.95, 1.75, 4.66, 1.96, 0.79, 2.68, 1.32, 2.63, 0.73, 2.64, 2.71]} \ No newline at end of file diff --git a/annotations_filtered/c7RyGNzyGB4_filtered.json b/annotations_filtered/c7RyGNzyGB4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0998102c58dab7c232f57a1bc34c3619e3e916c --- /dev/null +++ b/annotations_filtered/c7RyGNzyGB4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[62.0, 62.11], [63.0, 103.0], [104.0, 104.77], [106.0, 112.45]], "keep_status": [false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 35.28], "audiomae_on_audioset": [null, null, null, [["thunk", 31.03], ["music", 24.41], ["moo", 3.7]]], "duration": [0.11, 40.0, 0.77, 6.45]} \ No newline at end of file diff --git a/annotations_filtered/c7tvfdSjRE4_filtered.json b/annotations_filtered/c7tvfdSjRE4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f3ca19675e693a91bcebfdc5a972eca99c550f2 --- /dev/null +++ b/annotations_filtered/c7tvfdSjRE4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.09], [6.0, 7.94], [12.0, 16.43], [19.0, 26.25], [28.0, 33.0], [34.0, 38.35], [39.0, 39.58], [41.0, 42.09], [43.0, 47.01], [50.0, 53.5], [55.0, 80.16], [87.0, 92.13], [92.0, 92.23], [93.0, 93.46], [96.0, 103.87], [104.0, 104.45], [104.0, 104.85], [107.0, 109.76], [121.0, 129.41], [139.0, 140.19], [152.0, 154.84], [156.0, 156.44], [156.0, 156.59], [159.0, 160.17], [173.0, 172.94]], "keep_status": [false, false, false, false, true, true, false, false, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.82, 37.07, 36.8, 35.81, 0.0, 0.0, 32.1, 32.32, 30.21, 32.02, 0.0, 0.0, 31.41, 0.0, 0.0, 32.55, 30.64, 0.0, 35.85, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["bee, wasp, etc.", 31.17], ["fly, housefly", 27.36], ["insect", 12.21]], [["bee, wasp, etc.", 40.22], ["fly, housefly", 33.14], ["insect", 14.32]], [["vehicle", 22.3], ["fly, housefly", 13.36], ["speech", 10.75]], [["speech", 47.7], ["cattle, bovinae", 5.83], ["moo", 4.55]], null, null, [["cattle, bovinae", 39.57], ["moo", 24.31], ["livestock, farm animals, working animals", 21.24]], [["fly, housefly", 59.21], ["insect", 22.49], ["bee, wasp, etc.", 14.56]], [["mains hum", 24.04], ["music", 20.16], ["hum", 16.59]], [["speech", 34.63], ["fly, housefly", 15.39], ["fart", 8.73]], null, null, [["fly, housefly", 21.47], ["bee, wasp, etc.", 17.64], ["insect", 14.44]], null, null, [["vehicle", 43.63], ["car", 19.45], ["speech", 9.8]], [["fly, housefly", 42.26], ["insect", 20.41], ["bee, wasp, etc.", 9.0]], null, [["cattle, bovinae", 35.15], ["moo", 30.63], ["speech", 11.65]], null, null, null, null], "duration": [1.09, 1.94, 4.43, 7.25, 5.0, 4.35, 0.58, 1.09, 4.01, 3.5, 25.16, 5.13, 0.23, 0.46, 7.87, 0.45, 0.85, 2.76, 8.41, 1.19, 2.84, 0.44, 0.59, 1.17, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/c82FD6lh2LQ_filtered.json b/annotations_filtered/c82FD6lh2LQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13c79f764a3e095f4f647a19aee45298000278cf --- /dev/null +++ b/annotations_filtered/c82FD6lh2LQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.68], [7.0, 8.38], [9.0, 15.38], [16.0, 47.44], [49.0, 72.72], [73.0, 77.45], [79.0, 89.58], [91.0, 90.98], [92.0, 92.47], [93.0, 99.33], [100.0, 105.29]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [87.19, 0.0, 98.1, 0.0, 53.91, 50.41, 31.56, 0.0, 0.0, 35.04, 40.64], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 27.94], ["music", 23.9], ["livestock, farm animals, working animals", 13.24]], null, null, [["speech", 38.98], ["music", 24.97], ["hum", 9.45]], [["speech", 24.73], ["music", 20.7], ["theremin", 13.69]]], "duration": [2.68, 1.38, 6.38, 31.44, 23.72, 4.45, 10.58, -0.02, 0.47, 6.33, 5.29]} \ No newline at end of file diff --git a/annotations_filtered/c8EodW2ossg_filtered.json b/annotations_filtered/c8EodW2ossg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8167da0712772ceb305de51070c8ce1a0a739166 --- /dev/null +++ b/annotations_filtered/c8EodW2ossg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.2], [3.0, 4.18], [6.0, 5.98], [7.0, 7.94], [9.0, 9.15], [10.0, 12.88], [15.0, 17.95], [19.0, 24.21], [26.0, 26.91], [29.0, 29.27], [31.0, 30.87], [36.0, 36.21], [41.0, 40.88], [47.0, 47.85], [48.0, 48.81], [49.0, 50.4], [53.0, 53.25], [56.0, 56.03], [60.0, 61.18], [62.0, 63.27], [70.0, 70.63], [71.0, 74.44], [76.0, 76.92], [78.0, 79.15], [81.0, 82.44], [83.0, 83.74], [85.0, 90.42], [92.0, 92.89], [95.0, 96.08], [103.0, 103.23], [104.0, 104.67], [106.0, 107.06], [109.0, 109.29], [111.0, 111.52], [115.0, 115.5], [119.0, 119.53], [121.0, 121.34], [128.0, 128.44], [134.0, 134.13], [136.0, 136.11], [137.0, 137.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 99.1, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.34, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 47.25], ["speech", 25.42], ["dial tone", 12.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.2, 1.18, -0.02, 0.94, 0.15, 2.88, 2.95, 5.21, 0.91, 0.27, -0.13, 0.21, -0.12, 0.85, 0.81, 1.4, 0.25, 0.03, 1.18, 1.27, 0.63, 3.44, 0.92, 1.15, 1.44, 0.74, 5.42, 0.89, 1.08, 0.23, 0.67, 1.06, 0.29, 0.52, 0.5, 0.53, 0.34, 0.44, 0.13, 0.11, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/c8m6M4RV8p0_filtered.json b/annotations_filtered/c8m6M4RV8p0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b06651fb1454f64f62b34baba735c16e21d7aae4 --- /dev/null +++ b/annotations_filtered/c8m6M4RV8p0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.94], [12.0, 13.91], [14.0, 15.4], [22.0, 22.81], [26.0, 25.81], [27.0, 34.5], [37.0, 37.79], [40.0, 40.58], [42.0, 43.12], [55.0, 55.88], [56.0, 71.17], [76.0, 82.24], [86.0, 87.07], [89.0, 99.49], [102.0, 103.11], [104.0, 110.46], [113.0, 115.42], [117.0, 121.31], [128.0, 128.34], [134.0, 136.36], [143.0, 151.8]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, true, false, true, false, true, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.05, 0.0, 0.0, 0.0, 0.0, 31.6, 35.53, 0.0, 29.52, 0.0, 40.31, 33.02, 37.61, 0.0, 33.93, 31.65], "audiomae_on_audioset": [null, null, null, null, null, [["music", 23.86], ["livestock, farm animals, working animals", 14.53], ["didgeridoo", 11.99]], null, null, null, null, [["music", 32.27], ["boing", 12.03], ["whip", 9.16]], [["music", 38.5], ["tubular bells", 26.68], ["didgeridoo", 4.21]], null, [["theremin", 20.16], ["vehicle", 13.41], ["music", 12.08]], null, [["music", 28.34], ["speech", 26.37], ["creak", 4.23]], [["music", 11.31], ["chirp tone", 10.85], ["sine wave", 6.39]], [["music", 37.83], ["speech", 11.7], ["boing", 5.71]], null, [["music", 73.15], ["boing", 6.71], ["musical instrument", 4.36]], [["music", 76.07], ["carnatic music", 5.08], ["theremin", 4.84]]], "duration": [0.94, 1.91, 1.4, 0.81, -0.19, 7.5, 0.79, 0.58, 1.12, 0.88, 15.17, 6.24, 1.07, 10.49, 1.11, 6.46, 2.42, 4.31, 0.34, 2.36, 8.8]} \ No newline at end of file diff --git a/annotations_filtered/c8wj-v1Jdyc_filtered.json b/annotations_filtered/c8wj-v1Jdyc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a0b0a73c8c1f605b1d86e59ba5ed67fe28506c8 --- /dev/null +++ b/annotations_filtered/c8wj-v1Jdyc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[60.0, 61.15]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [1.15]} \ No newline at end of file diff --git a/annotations_filtered/c93bejkDIuU_filtered.json b/annotations_filtered/c93bejkDIuU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48b3af3621376b71ea572fe990dd045a38bd15e1 --- /dev/null +++ b/annotations_filtered/c93bejkDIuU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.89], [13.0, 23.67], [24.0, 26.54], [27.0, 30.47], [38.0, 38.42], [42.0, 42.85], [44.0, 45.96], [48.0, 49.82], [55.0, 56.07], [63.0, 63.86], [64.0, 64.74], [67.0, 69.18], [71.0, 71.04], [76.0, 76.74], [78.0, 78.71]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 81.53, 49.31, 41.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.79, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 27.58], ["music", 19.06], ["hum", 16.12]], [["hum", 29.87], ["mains hum", 21.17], ["static", 7.82]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 10.67, 2.54, 3.47, 0.42, 0.85, 1.96, 1.82, 1.07, 0.86, 0.74, 2.18, 0.04, 0.74, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/c94JyVrcWwE_filtered.json b/annotations_filtered/c94JyVrcWwE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3ff41af4e3ee2f9e70056146ceca09488408d8c --- /dev/null +++ b/annotations_filtered/c94JyVrcWwE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.39], [13.0, 25.76], [28.0, 28.12], [30.0, 30.0], [30.0, 30.96], [32.0, 34.62], [36.0, 89.34], [90.0, 90.26], [91.0, 105.44], [108.0, 116.01], [119.0, 120.01], [121.0, 120.72], [121.0, 121.81], [123.0, 123.45], [125.0, 128.44]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [33.5, 31.05, 0.0, 0.0, 0.0, 46.36, 0.0, 0.0, 29.12, 56.86, 0.0, 0.0, 0.0, 0.0, 64.63], "audiomae_on_audioset": [[["music", 37.77], ["speech", 31.75], ["synthesizer", 8.14]], [["music", 32.96], ["throbbing", 26.65], ["hum", 18.2]], null, null, null, [["music", 28.18], ["hum", 16.09], ["whale vocalization", 14.5]], null, null, [["music", 49.81], ["cacophony", 3.76], ["noise", 3.5]], null, null, null, null, null, null], "duration": [3.39, 12.76, 0.12, 0.0, 0.96, 2.62, 53.34, 0.26, 14.44, 8.01, 1.01, -0.28, 0.81, 0.45, 3.44]} \ No newline at end of file diff --git a/annotations_filtered/c95YKkIbTGg_filtered.json b/annotations_filtered/c95YKkIbTGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4aaf3521933ce7a9f805c412dfa1b842ab115690 --- /dev/null +++ b/annotations_filtered/c95YKkIbTGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 21.69], [24.0, 24.38], [33.0, 52.96], [54.0, 59.53], [60.0, 61.72], [62.0, 62.75], [65.0, 68.05], [69.0, 69.72], [71.0, 85.92], [87.0, 103.67], [105.0, 163.97], [166.0, 166.6]], "keep_status": [false, false, true, true, false, false, true, false, false, false, false, false], "silence_prob": [64.63, 0.0, 32.48, 39.86, 0.0, 0.0, 34.78, 0.0, 32.09, 34.79, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 47.92], ["buzz", 13.43], ["noise", 5.75]], [["music", 35.16], ["didgeridoo", 15.9], ["effects unit", 9.13]], null, null, [["music", 40.09], ["hum", 12.56], ["speech", 11.47]], null, [["music", 66.25], ["hum", 6.25], ["mains hum", 3.65]], [["music", 44.22], ["didgeridoo", 18.74], ["hum", 8.89]], null, null], "duration": [12.69, 0.38, 19.96, 5.53, 1.72, 0.75, 3.05, 0.72, 14.92, 16.67, 58.97, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/c9FCOAEPHHM_filtered.json b/annotations_filtered/c9FCOAEPHHM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfff93663ad1301d1afae93789803c1cd925d5d5 --- /dev/null +++ b/annotations_filtered/c9FCOAEPHHM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[78.0, 86.07], [86.0, 87.17], [101.0, 101.33], [107.0, 107.59], [111.0, 111.55], [113.0, 116.73], [120.0, 129.14]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [31.02, 0.0, 0.0, 0.0, 0.0, 45.18, 33.55], "audiomae_on_audioset": [[["music", 66.46], ["hum", 13.24], ["throbbing", 4.44]], null, null, null, null, [["music", 70.11], ["throbbing", 4.13], ["musical instrument", 3.27]], [["music", 58.71], ["hum", 7.93], ["throbbing", 5.04]]], "duration": [8.07, 1.17, 0.33, 0.59, 0.55, 3.73, 9.14]} \ No newline at end of file diff --git a/annotations_filtered/c9O1VVeMzhc_filtered.json b/annotations_filtered/c9O1VVeMzhc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73008bc1a4a30ba0e8ddb1151f9809c2a9c1e0ef --- /dev/null +++ b/annotations_filtered/c9O1VVeMzhc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.13], [5.0, 5.21], [6.0, 8.55], [10.0, 10.37], [11.0, 12.26], [13.0, 14.49], [17.0, 17.85], [20.0, 20.34], [24.0, 24.44], [25.0, 25.49], [27.0, 27.01], [29.0, 29.2], [31.0, 31.35], [32.0, 32.91], [35.0, 34.7], [37.0, 37.44], [40.0, 41.39], [42.0, 42.45], [43.0, 43.28], [44.0, 44.69], [51.0, 52.05], [53.0, 54.68], [56.0, 56.88], [58.0, 58.29], [60.0, 60.13], [62.0, 62.13], [63.0, 63.85], [68.0, 68.62], [73.0, 73.74], [77.0, 78.49], [80.0, 80.79], [82.0, 87.56], [97.0, 97.51], [100.0, 100.28], [102.0, 104.7], [106.0, 107.43], [108.0, 109.38]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 37.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.07, 0.0, 0.0, 67.25, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["thunk", 26.87], ["thump, thud", 9.42], ["hum", 8.87]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.13, 0.21, 2.55, 0.37, 1.26, 1.49, 0.85, 0.34, 0.44, 0.49, 0.01, 0.2, 0.35, 0.91, -0.3, 0.44, 1.39, 0.45, 0.28, 0.69, 1.05, 1.68, 0.88, 0.29, 0.13, 0.13, 0.85, 0.62, 0.74, 1.49, 0.79, 5.56, 0.51, 0.28, 2.7, 1.43, 1.38]} \ No newline at end of file diff --git a/annotations_filtered/c9YJ-KJZKyY_filtered.json b/annotations_filtered/c9YJ-KJZKyY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e985b91b1b6ac541e6d14eabe3b88eb6d4d9970 --- /dev/null +++ b/annotations_filtered/c9YJ-KJZKyY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.9], [13.0, 13.37], [14.0, 16.75], [19.0, 19.52], [20.0, 21.69], [42.0, 42.15], [46.0, 46.53], [70.0, 70.98], [74.0, 74.43], [85.0, 85.19], [86.0, 86.61], [88.0, 97.48], [105.0, 118.35], [120.0, 120.8], [142.0, 151.26], [164.0, 165.79], [175.0, 176.0], [181.0, 181.4], [182.0, 183.1], [185.0, 200.3], [205.0, 213.51], [216.0, 225.81]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [37.59, 0.0, 38.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.79, 42.33, 0.0, 45.59, 0.0, 0.0, 0.0, 0.0, 35.85, 32.25, 41.12], "audiomae_on_audioset": [[["music", 32.89], ["livestock, farm animals, working animals", 5.48], ["animal", 4.47]], null, [["speech", 31.37], ["music", 24.22], ["boing", 6.14]], null, null, null, null, null, null, null, null, [["music", 71.85], ["musical instrument", 2.27], ["speech", 1.65]], [["music", 45.39], ["speech", 31.46], ["outside, rural or natural", 2.91]], null, [["noise", 38.36], ["speech", 25.91], ["music", 17.49]], null, null, null, null, [["music", 70.19], ["synthesizer", 4.65], ["hum", 4.06]], [["speech", 44.29], ["music", 14.36], ["vehicle", 6.53]], [["speech", 28.5], ["music", 19.78], ["whimper", 6.36]]], "duration": [2.9, 0.37, 2.75, 0.52, 1.69, 0.15, 0.53, 0.98, 0.43, 0.19, 0.61, 9.48, 13.35, 0.8, 9.26, 1.79, 1.0, 0.4, 1.1, 15.3, 8.51, 9.81]} \ No newline at end of file diff --git a/annotations_filtered/c9_46Iv_GGM_filtered.json b/annotations_filtered/c9_46Iv_GGM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9020b0243bc002d3a867999db1fa21fa8d1246ee --- /dev/null +++ b/annotations_filtered/c9_46Iv_GGM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.54], [6.0, 7.55], [10.0, 13.07], [14.0, 14.39], [15.0, 22.57], [24.0, 24.73], [27.0, 28.48], [30.0, 30.62], [32.0, 39.7]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [96.54, 0.0, 96.17, 0.0, 73.51, 0.0, 0.0, 0.0, 62.58], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [2.54, 1.55, 3.07, 0.39, 7.57, 0.73, 1.48, 0.62, 7.7]} \ No newline at end of file diff --git a/annotations_filtered/c9cV7bFKMNQ_filtered.json b/annotations_filtered/c9cV7bFKMNQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78e20e695b3e148555a543298e609771ff744544 --- /dev/null +++ b/annotations_filtered/c9cV7bFKMNQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 22.91], [26.0, 37.3], [39.0, 39.6], [40.0, 48.42], [49.0, 51.95], [53.0, 54.14]], "keep_status": [true, false, false, false, false, false], "silence_prob": [33.73, 54.9, 0.0, 68.8, 90.08, 0.0], "audiomae_on_audioset": [[["insect", 19.33], ["music", 18.07], ["fly, housefly", 12.49]], null, null, null, null, null], "duration": [13.91, 11.3, 0.6, 8.42, 2.95, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/c9oE47YW6YM_filtered.json b/annotations_filtered/c9oE47YW6YM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f1be0ea48893b24803465c5106436a631857b88 --- /dev/null +++ b/annotations_filtered/c9oE47YW6YM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.46], [14.0, 14.55], [15.0, 20.43], [21.0, 37.74], [38.0, 39.58], [41.0, 41.49], [43.0, 44.49], [49.0, 51.33], [52.0, 52.42], [53.0, 53.54], [54.0, 54.97], [56.0, 55.8], [56.0, 57.32], [59.0, 59.59], [62.0, 62.16], [63.0, 64.29], [68.0, 70.9], [79.0, 106.98], [108.0, 109.85], [112.0, 113.21], [115.0, 119.4], [123.0, 125.44], [127.0, 129.3]], "keep_status": [false, false, true, true, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [40.09, 0.0, 39.37, 36.88, 0.0, 0.0, 0.0, 46.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.85, 42.51, 0.0, 0.0, 43.58, 57.01, 57.72], "audiomae_on_audioset": [[["music", 61.08], ["speech", 8.07], ["electronic music", 3.53]], null, [["music", 30.65], ["speech", 26.71], ["singing bowl", 4.88]], [["music", 33.31], ["ambient music", 12.89], ["hum", 10.16]], null, null, null, [["sidetone", 17.43], ["music", 16.19], ["speech", 15.9]], null, null, null, null, null, null, null, null, [["speech", 33.25], ["aircraft", 17.78], ["fixed-wing aircraft, airplane", 7.87]], [["hum", 57.92], ["mains hum", 20.7], ["throbbing", 17.3]], null, null, [["music", 23.99], ["hum", 23.43], ["throbbing", 11.73]], null, null], "duration": [2.46, 0.55, 5.43, 16.74, 1.58, 0.49, 1.49, 2.33, 0.42, 0.54, 0.97, -0.2, 1.32, 0.59, 0.16, 1.29, 2.9, 27.98, 1.85, 1.21, 4.4, 2.44, 2.3]} \ No newline at end of file diff --git a/annotations_filtered/c9vl9Rurcc8_filtered.json b/annotations_filtered/c9vl9Rurcc8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22124cc6819396b182ce52fb123cc590ea49d409 --- /dev/null +++ b/annotations_filtered/c9vl9Rurcc8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.44], [5.0, 19.94], [22.0, 23.01], [24.0, 24.53], [26.0, 39.02], [42.0, 45.32], [53.0, 62.38], [66.0, 68.91], [72.0, 72.2], [74.0, 81.41], [83.0, 90.02], [92.0, 92.5], [101.0, 101.65], [103.0, 103.76], [111.0, 111.21], [112.0, 112.6], [117.0, 117.98], [119.0, 119.21], [121.0, 123.94]], "keep_status": [true, true, false, false, true, true, true, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [31.33, 33.17, 0.0, 0.0, 40.54, 35.35, 42.28, 30.55, 0.0, 30.26, 31.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.3], "audiomae_on_audioset": [[["speech", 41.07], ["music", 10.08], ["vehicle", 5.28]], [["speech", 46.65], ["music", 11.41], ["hum", 7.82]], null, null, [["music", 15.73], ["hum", 7.71], ["noise", 5.83]], [["fly, housefly", 18.17], ["speech", 12.99], ["mosquito", 11.7]], [["music", 48.03], ["didgeridoo", 15.29], ["speech", 5.81]], [["music", 56.76], ["speech", 10.62], ["guitar", 9.22]], null, [["music", 50.72], ["hum", 7.07], ["mains hum", 5.17]], [["speech", 33.81], ["music", 27.9], ["explosion", 7.53]], null, null, null, null, null, null, null, null], "duration": [3.44, 14.94, 1.01, 0.53, 13.02, 3.32, 9.38, 2.91, 0.2, 7.41, 7.02, 0.5, 0.65, 0.76, 0.21, 0.6, 0.98, 0.21, 2.94]} \ No newline at end of file diff --git a/annotations_filtered/c9wVzDytTFU_filtered.json b/annotations_filtered/c9wVzDytTFU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e5c42b4e44bdf3a6dc0f855aeeb56dbfd5dd466 --- /dev/null +++ b/annotations_filtered/c9wVzDytTFU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 13.9], [17.0, 47.97], [51.0, 60.91], [65.0, 66.14], [68.0, 72.06], [76.0, 81.89], [84.0, 132.95], [145.0, 164.64]], "keep_status": [false, false, true, false, true, true, false, true], "silence_prob": [33.15, 0.0, 31.47, 0.0, 30.51, 31.66, 0.0, 30.7], "audiomae_on_audioset": [[["speech", 65.72], ["music", 9.82], ["vehicle", 5.8]], null, [["speech", 33.25], ["vehicle", 18.86], ["sidetone", 9.11]], null, [["speech", 44.72], ["crowd", 6.75], ["vehicle", 4.86]], [["music", 24.31], ["vehicle", 13.36], ["speech", 9.14]], null, [["music", 29.33], ["hum", 22.07], ["mains hum", 18.05]]], "duration": [6.9, 30.97, 9.91, 1.14, 4.06, 5.89, 48.95, 19.64]} \ No newline at end of file diff --git a/annotations_filtered/c9xahfssbQg_filtered.json b/annotations_filtered/c9xahfssbQg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4bf1b3beee990a47c1c6b630434ece90c5151ea4 --- /dev/null +++ b/annotations_filtered/c9xahfssbQg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 36.98], [38.0, 37.94], [39.0, 39.45], [41.0, 43.83]], "keep_status": [true, false, false, true], "silence_prob": [49.68, 0.0, 0.0, 46.36], "audiomae_on_audioset": [[["mechanisms", 9.37], ["creak", 8.55], ["quack", 8.33]], null, null, [["fart", 48.66], ["stomach rumble", 10.47], ["creak", 8.43]]], "duration": [6.98, -0.06, 0.45, 2.83]} \ No newline at end of file diff --git a/annotations_filtered/cA-laLpcLIw_filtered.json b/annotations_filtered/cA-laLpcLIw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b4c9f07192f7fee311c27e3a8124b2808e6305b --- /dev/null +++ b/annotations_filtered/cA-laLpcLIw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.43], [6.0, 9.22], [13.0, 50.75], [52.0, 57.54], [62.0, 62.26], [65.0, 65.57], [67.0, 70.02], [72.0, 86.66], [91.0, 93.8], [95.0, 95.69], [97.0, 106.29], [107.0, 133.17], [138.0, 138.13], [139.0, 141.76], [144.0, 155.98], [156.0, 165.75]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, true, false, true, true, false], "silence_prob": [0.0, 43.85, 0.0, 35.95, 0.0, 0.0, 46.61, 41.83, 54.3, 0.0, 47.62, 41.18, 0.0, 47.5, 47.98, 95.09], "audiomae_on_audioset": [null, [["music", 33.49], ["synthesizer", 6.62], ["buzzer", 4.21]], null, [["music", 79.36], ["electronic music", 5.43], ["synthesizer", 1.94]], null, null, [["music", 46.56], ["didgeridoo", 38.49], ["musical instrument", 2.18]], [["music", 73.72], ["didgeridoo", 4.78], ["musical instrument", 2.94]], null, null, [["music", 44.1], ["vehicle", 8.38], ["outside, rural or natural", 3.36]], [["music", 48.49], ["fly, housefly", 7.29], ["speech", 5.91]], null, [["music", 43.93], ["throbbing", 11.55], ["hum", 8.04]], [["music", 56.57], ["electronic music", 7.22], ["didgeridoo", 4.8]], null], "duration": [0.43, 3.22, 37.75, 5.54, 0.26, 0.57, 3.02, 14.66, 2.8, 0.69, 9.29, 26.17, 0.13, 2.76, 11.98, 9.75]} \ No newline at end of file diff --git a/annotations_filtered/cAIHoTstrTg_filtered.json b/annotations_filtered/cAIHoTstrTg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d9d2ddc1826b7d2da2ed0cc95d51dac60ef6643 --- /dev/null +++ b/annotations_filtered/cAIHoTstrTg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.78], [6.0, 6.08], [9.0, 10.39], [12.0, 13.04], [20.0, 21.1], [21.0, 21.69], [24.0, 23.99], [24.0, 24.76], [27.0, 27.21], [29.0, 30.43], [31.0, 32.16], [33.0, 33.67], [36.0, 36.12], [50.0, 51.26], [55.0, 56.2], [60.0, 61.45], [63.0, 69.08], [73.0, 73.5], [86.0, 87.93], [89.0, 99.15], [102.0, 104.18], [106.0, 105.76], [107.0, 116.68], [117.0, 123.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.91, 0.0, 0.0, 35.42, 100.0, 0.0, 31.19, 30.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 25.73], ["whoosh, swoosh, swish", 10.88], ["boing", 7.35]], null, null, [["speech", 34.91], ["noise", 30.89], ["cacophony", 5.04]], [["speech", 62.92], ["explosion", 10.45], ["eruption", 4.03]]], "duration": [0.78, 0.08, 1.39, 1.04, 1.1, 0.69, -0.01, 0.76, 0.21, 1.43, 1.16, 0.67, 0.12, 1.26, 1.2, 1.45, 6.08, 0.5, 1.93, 10.15, 2.18, -0.24, 9.68, 6.06]} \ No newline at end of file diff --git a/annotations_filtered/cAKtpCo8fPE_filtered.json b/annotations_filtered/cAKtpCo8fPE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..073ef391a596e9cc1481eefa9b0bdb497705ca8c --- /dev/null +++ b/annotations_filtered/cAKtpCo8fPE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.16], [10.0, 11.43], [13.0, 15.63], [16.0, 19.7], [21.0, 21.1], [21.0, 21.84], [23.0, 24.12], [25.0, 27.48], [29.0, 29.64], [30.0, 31.68], [33.0, 36.81], [38.0, 47.19], [49.0, 67.74], [68.0, 70.39], [72.0, 73.28], [74.0, 75.93], [77.0, 78.36], [79.0, 81.23], [81.0, 81.35], [82.0, 85.99], [88.0, 89.38], [90.0, 90.46], [93.0, 96.45], [97.0, 107.03], [108.0, 117.58], [119.0, 121.76], [123.0, 122.94], [126.0, 126.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [99.48, 0.0, 99.94, 84.43, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 99.78, 50.97, 83.16, 99.9, 0.0, 0.0, 0.0, 64.63, 0.0, 99.36, 0.0, 0.0, 99.62, 41.64, 73.82, 97.73, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 32.18], ["radio", 6.28], ["noise", 4.44]], null, null, null, null], "duration": [2.16, 1.43, 2.63, 3.7, 0.1, 0.84, 1.12, 2.48, 0.64, 1.68, 3.81, 9.19, 18.74, 2.39, 1.28, 1.93, 1.36, 2.23, 0.35, 3.99, 1.38, 0.46, 3.45, 10.03, 9.58, 2.76, -0.06, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/cAYVS8aRQ1U_filtered.json b/annotations_filtered/cAYVS8aRQ1U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..686f64a058aee02505b99f06371558fcb80594d9 --- /dev/null +++ b/annotations_filtered/cAYVS8aRQ1U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.73], [3.0, 6.44], [7.0, 9.42], [10.0, 13.14], [14.0, 16.44], [17.0, 18.96], [21.0, 22.84], [24.0, 26.79], [28.0, 30.35], [34.0, 37.94], [40.0, 43.19], [44.0, 48.17], [50.0, 51.41], [53.0, 60.96], [62.0, 73.28], [74.0, 87.57], [89.0, 91.18], [93.0, 95.1], [96.0, 98.27], [99.0, 102.78], [104.0, 107.84], [110.0, 112.53], [114.0, 115.48], [117.0, 120.82], [121.0, 123.09], [124.0, 131.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.31, 69.74, 62.99, 82.97, 0.0, 0.0, 95.51, 62.07, 77.7, 71.29, 91.47, 0.0, 69.34, 88.28, 91.13, 96.17, 91.47, 87.74, 82.25, 68.54, 93.91, 0.0, 93.29, 82.97, 86.45], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.73, 3.44, 2.42, 3.14, 2.44, 1.96, 1.84, 2.79, 2.35, 3.94, 3.19, 4.17, 1.41, 7.96, 11.28, 13.57, 2.18, 2.1, 2.27, 3.78, 3.84, 2.53, 1.48, 3.82, 2.09, 7.06]} \ No newline at end of file diff --git a/annotations_filtered/cBFrfA6TrB0_filtered.json b/annotations_filtered/cBFrfA6TrB0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e250164d7ca1012459964e93bb533e341bec2ea --- /dev/null +++ b/annotations_filtered/cBFrfA6TrB0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.64], [6.0, 7.77], [12.0, 12.87], [14.0, 13.95], [15.0, 15.01], [17.0, 19.77], [22.0, 23.3], [24.0, 26.5], [29.0, 31.43], [33.0, 33.66], [34.0, 34.35], [35.0, 38.75], [42.0, 42.28], [48.0, 49.57], [51.0, 51.16], [52.0, 51.56], [52.0, 51.93], [52.0, 54.04], [57.0, 60.45], [62.0, 65.48], [68.0, 68.79], [73.0, 73.6], [76.0, 80.84], [82.0, 86.02], [87.0, 88.84], [89.0, 94.83], [97.0, 99.05], [101.0, 104.01], [106.0, 136.19], [137.0, 138.79], [139.0, 142.03], [144.0, 162.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 95.09, 0.0, 80.46, 76.86, 0.0, 0.0, 87.19, 0.0, 0.0, 0.0, 0.0, 0.0, 62.78, 70.44, 48.61, 0.0, 0.0, 35.32, 45.49, 0.0, 77.2, 99.1, 43.53, 0.0, 0.0, 64.52, 65.32], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 46.0], ["throbbing", 11.7], ["stomach rumble", 11.04]], null, null, [["music", 46.9], ["animal", 6.97], ["livestock, farm animals, working animals", 6.64]], [["music", 50.8], ["eruption", 4.51], ["speech", 4.0]], null, null, null, [["music", 21.34], ["bleat", 18.74], ["sheep", 17.9]], null, null, null, null], "duration": [0.64, 1.77, 0.87, -0.05, 0.01, 2.77, 1.3, 2.5, 2.43, 0.66, 0.35, 3.75, 0.28, 1.57, 0.16, -0.44, -0.07, 2.04, 3.45, 3.48, 0.79, 0.6, 4.84, 4.02, 1.84, 5.83, 2.05, 3.01, 30.19, 1.79, 3.03, 18.43]} \ No newline at end of file diff --git a/annotations_filtered/cBHvRuBtJqI_filtered.json b/annotations_filtered/cBHvRuBtJqI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55705d3f167c6c42561f156faacbb3eca0c42b5b --- /dev/null +++ b/annotations_filtered/cBHvRuBtJqI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.39], [5.0, 5.8], [8.0, 9.61], [19.0, 25.81], [26.0, 27.21], [39.0, 39.12], [42.0, 42.21], [43.0, 43.33], [44.0, 44.74], [51.0, 51.9], [57.0, 58.18], [61.0, 61.75], [62.0, 62.8], [65.0, 65.58], [66.0, 66.55], [69.0, 69.3], [70.0, 70.95], [78.0, 78.54], [85.0, 98.25], [99.0, 101.83], [103.0, 103.32], [104.0, 106.68], [108.0, 113.0], [114.0, 114.79], [116.0, 124.55]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.02, 98.1, 0.0, 65.91, 76.37, 0.0, 51.34], "audiomae_on_audioset": [null, null, null, [["creak", 12.22], ["wild animals", 7.84], ["animal", 7.36]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 63.72], ["wind instrument, woodwind instrument", 4.28], ["theremin", 4.0]], null, null, null, null, null, null], "duration": [0.39, 0.8, 1.61, 6.81, 1.21, 0.12, 0.21, 0.33, 0.74, 0.9, 1.18, 0.75, 0.8, 0.58, 0.55, 0.3, 0.95, 0.54, 13.25, 2.83, 0.32, 2.68, 5.0, 0.79, 8.55]} \ No newline at end of file diff --git a/annotations_filtered/cCNhONF1lHI_filtered.json b/annotations_filtered/cCNhONF1lHI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3cefe308fb09d17fb6a593ea2195cc43a8a70a80 --- /dev/null +++ b/annotations_filtered/cCNhONF1lHI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.36], [17.0, 18.55], [20.0, 20.68], [21.0, 21.88], [22.0, 26.27], [28.0, 29.0], [29.0, 30.75], [31.0, 32.31], [34.0, 34.59], [36.0, 36.24], [41.0, 42.65], [46.0, 45.94], [47.0, 47.55], [55.0, 56.29], [62.0, 62.21], [64.0, 65.13], [67.0, 68.39], [69.0, 69.82], [71.0, 71.81], [77.0, 77.77], [80.0, 80.4], [84.0, 85.7], [86.0, 89.95], [91.0, 91.69], [93.0, 93.87], [95.0, 96.97], [97.0, 98.71], [101.0, 101.83], [105.0, 105.24], [106.0, 107.13], [115.0, 115.42], [119.0, 120.45], [121.0, 121.24], [122.0, 122.55], [123.0, 124.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 85.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.36, 1.55, 0.68, 0.88, 4.27, 1.0, 1.75, 1.31, 0.59, 0.24, 1.65, -0.06, 0.55, 1.29, 0.21, 1.13, 1.39, 0.82, 0.81, 0.77, 0.4, 1.7, 3.95, 0.69, 0.87, 1.97, 1.71, 0.83, 0.24, 1.13, 0.42, 1.45, 0.24, 0.55, 1.5]} \ No newline at end of file diff --git a/annotations_filtered/cCoD237oWtg_filtered.json b/annotations_filtered/cCoD237oWtg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26277a5464bcd9857686d02aa2ab3472110390f8 --- /dev/null +++ b/annotations_filtered/cCoD237oWtg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.4], [9.0, 9.49], [11.0, 11.94], [19.0, 18.99], [31.0, 30.96], [46.0, 47.56], [55.0, 56.19], [82.0, 85.35], [88.0, 87.64], [100.0, 100.9], [116.0, 125.61]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.69, 0.0, 0.0, 30.72], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 23.47], ["vehicle", 14.36], ["car", 10.23]], null, null, [["speech", 28.7], ["music", 12.99], ["whale vocalization", 8.79]]], "duration": [0.4, 0.49, 0.94, -0.01, -0.04, 1.56, 1.19, 3.35, -0.36, 0.9, 9.61]} \ No newline at end of file diff --git a/annotations_filtered/cCpDJlAnHsg_filtered.json b/annotations_filtered/cCpDJlAnHsg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dcd6259997ced493f4754c762c14617fae17203e --- /dev/null +++ b/annotations_filtered/cCpDJlAnHsg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.54], [14.0, 16.8], [26.0, 29.35], [30.0, 124.58], [126.0, 128.02], [133.0, 135.35], [137.0, 137.44]], "keep_status": [true, false, false, false, true, true, false], "silence_prob": [49.87, 57.48, 53.65, 0.0, 37.96, 39.52, 0.0], "audiomae_on_audioset": [[["music", 45.85], ["speech", 7.51], ["drum machine", 6.09]], null, null, null, [["music", 48.17], ["synthesizer", 5.49], ["scary music", 5.35]], [["speech", 25.2], ["music", 10.6], ["throbbing", 10.44]], null], "duration": [2.54, 2.8, 3.35, 94.58, 2.02, 2.35, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/cCwn-ROhwyo_filtered.json b/annotations_filtered/cCwn-ROhwyo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..501b15422302bd66d75b632a0e459dffb241ad18 --- /dev/null +++ b/annotations_filtered/cCwn-ROhwyo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 25.76], [28.0, 204.3], [205.0, 208.63], [210.0, 211.25], [211.0, 211.4], [211.0, 211.89], [214.0, 243.18]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 67.76, 0.0, 0.0, 0.0, 36.15], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 24.31], ["rumble", 14.59], ["singing bowl", 14.51]]], "duration": [0.76, 176.3, 3.63, 1.25, 0.4, 0.89, 29.18]} \ No newline at end of file diff --git a/annotations_filtered/cDI9o67o7bo_filtered.json b/annotations_filtered/cDI9o67o7bo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b0f3c139a832bcd7a06b0f95f141acca676a78c --- /dev/null +++ b/annotations_filtered/cDI9o67o7bo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.81], [16.0, 40.51], [41.0, 43.16], [44.0, 44.29], [47.0, 49.22], [51.0, 52.88], [55.0, 55.8], [57.0, 58.55], [63.0, 65.58], [67.0, 68.79], [70.0, 70.61], [73.0, 85.43], [86.0, 87.78], [89.0, 90.85], [92.0, 92.37], [93.0, 93.99], [97.0, 97.38], [98.0, 98.47], [101.0, 101.92], [103.0, 103.65], [105.0, 106.52], [107.0, 114.89], [116.0, 115.94], [117.0, 118.57]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 42.26, 77.53, 0.0, 100.0, 0.0, 0.0, 0.0, 75.88, 0.0, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.91, 0.0, 0.0], "audiomae_on_audioset": [null, [["gunshot, gunfire", 21.65], ["artillery fire", 15.51], ["explosion", 14.13]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 24.51, 2.16, 0.29, 2.22, 1.88, 0.8, 1.55, 2.58, 1.79, 0.61, 12.43, 1.78, 1.85, 0.37, 0.99, 0.38, 0.47, 0.92, 0.65, 1.52, 7.89, -0.06, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/cDfQo1ANeLM_filtered.json b/annotations_filtered/cDfQo1ANeLM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8defd12f450694f5263c83b913588852c4fac81d --- /dev/null +++ b/annotations_filtered/cDfQo1ANeLM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.74], [9.0, 15.3], [18.0, 19.57], [20.0, 21.9], [37.0, 37.5], [47.0, 47.83], [49.0, 50.09], [51.0, 51.09], [52.0, 52.57], [55.0, 55.66], [59.0, 59.36], [62.0, 63.21], [66.0, 70.6], [72.0, 74.68], [75.0, 75.91], [76.0, 81.55], [83.0, 85.26], [123.0, 126.89], [127.0, 131.75]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [28.52, 37.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.64, 52.62, 0.0, 31.68, 60.32, 98.86, 39.35], "audiomae_on_audioset": [[["zipper (clothing)", 18.95], ["fart", 8.25], ["whoosh, swoosh, swish", 6.67]], [["speech", 13.95], ["boing", 12.05], ["livestock, farm animals, working animals", 8.91]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 25.01], ["didgeridoo", 15.1], ["noise", 7.84]], null, null, [["speech", 79.81], ["music", 4.47], ["synthesizer", 1.86]]], "duration": [2.74, 6.3, 1.57, 1.9, 0.5, 0.83, 1.09, 0.09, 0.57, 0.66, 0.36, 1.21, 4.6, 2.68, 0.91, 5.55, 2.26, 3.89, 4.75]} \ No newline at end of file diff --git a/annotations_filtered/cDoyywKt1_0_filtered.json b/annotations_filtered/cDoyywKt1_0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..961174fce3395be46da3792d9b12ff5d3216797d --- /dev/null +++ b/annotations_filtered/cDoyywKt1_0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.45], [8.0, 7.77], [8.0, 9.29], [10.0, 10.86], [11.0, 35.29], [36.0, 52.57], [56.0, 64.76], [69.0, 86.12], [89.0, 91.07], [92.0, 91.99], [93.0, 98.12], [100.0, 113.53], [119.0, 120.88], [126.0, 128.26], [130.0, 130.54], [132.0, 133.64], [135.0, 135.31], [136.0, 136.58], [139.0, 148.17], [149.0, 150.08], [151.0, 154.58], [160.0, 161.15], [162.0, 175.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 59.86, 94.81, 87.92, 92.8, 92.97, 0.0, 59.59, 49.13, 0.0, 59.51, 0.0, 0.0, 0.0, 0.0, 86.27, 0.0, 56.1, 0.0, 42.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 40.84], ["musical instrument", 5.17], ["hum", 3.93]], null, null, null, null, null, null, null, null, null, null, [["music", 62.84], ["sheep", 4.74], ["bleat", 2.9]]], "duration": [0.45, -0.23, 1.29, 0.86, 24.29, 16.57, 8.76, 17.12, 2.07, -0.01, 5.12, 13.53, 1.88, 2.26, 0.54, 1.64, 0.31, 0.58, 9.17, 1.08, 3.58, 1.15, 13.36]} \ No newline at end of file diff --git a/annotations_filtered/cDpI6Zzy-vo_filtered.json b/annotations_filtered/cDpI6Zzy-vo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4d3fee92fd5a6713a09321ed6864a53acd0432f --- /dev/null +++ b/annotations_filtered/cDpI6Zzy-vo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.17], [8.0, 8.99], [18.0, 18.94], [22.0, 33.12], [35.0, 54.53], [56.0, 57.47]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.05, 31.08, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 75.34], ["throbbing", 3.66], ["hum", 2.47]], [["music", 54.48], ["speech", 29.14], ["throbbing", 4.31]], null], "duration": [1.17, 0.99, 0.94, 11.12, 19.53, 1.47]} \ No newline at end of file diff --git a/annotations_filtered/cE2bc0vU9pg_filtered.json b/annotations_filtered/cE2bc0vU9pg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e36ae347cfb7b9765f81da86be7185c81c2bd3fd --- /dev/null +++ b/annotations_filtered/cE2bc0vU9pg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.35], [13.0, 16.34], [20.0, 20.63], [21.0, 22.64], [28.0, 28.95], [31.0, 36.68], [41.0, 42.99], [44.0, 45.06], [47.0, 47.78], [50.0, 50.55], [51.0, 52.41], [58.0, 60.42], [66.0, 66.19], [71.0, 71.47], [77.0, 78.43], [86.0, 88.52], [89.0, 89.58], [91.0, 92.06], [96.0, 97.38], [99.0, 99.25], [110.0, 111.87], [114.0, 114.86], [116.0, 117.76], [119.0, 120.04], [122.0, 123.38], [124.0, 125.61], [129.0, 130.6], [132.0, 132.76], [134.0, 135.43], [140.0, 141.35], [143.0, 145.18], [152.0, 153.47], [155.0, 156.34], [158.0, 159.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [52.62, 71.57, 0.0, 0.0, 0.0, 59.68, 0.0, 0.0, 0.0, 0.0, 0.0, 57.89, 0.0, 0.0, 0.0, 88.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.15, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.35, 3.34, 0.63, 1.64, 0.95, 5.68, 1.99, 1.06, 0.78, 0.55, 1.41, 2.42, 0.19, 0.47, 1.43, 2.52, 0.58, 1.06, 1.38, 0.25, 1.87, 0.86, 1.76, 1.04, 1.38, 1.61, 1.6, 0.76, 1.43, 1.35, 2.18, 1.47, 1.34, 1.6]} \ No newline at end of file diff --git a/annotations_filtered/cE5l32W6Oxc_filtered.json b/annotations_filtered/cE5l32W6Oxc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a2b702b90fc6769276a5f0f325cd72a1fab8c13c --- /dev/null +++ b/annotations_filtered/cE5l32W6Oxc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.23], [5.0, 5.76], [6.0, 6.94], [7.0, 9.31], [11.0, 22.05], [23.0, 25.54], [26.0, 27.23], [28.0, 28.56], [31.0, 33.39], [36.0, 42.23], [46.0, 51.31], [53.0, 53.86], [56.0, 64.81], [65.0, 69.42], [71.0, 73.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.16, 94.95, 90.6, 0.0, 0.0, 99.4, 96.66, 96.42, 0.0, 92.48, 73.36, 96.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.23, 0.76, 0.94, 2.31, 11.05, 2.54, 1.23, 0.56, 2.39, 6.23, 5.31, 0.86, 8.81, 4.42, 2.99]} \ No newline at end of file diff --git a/annotations_filtered/cE71I4X9hWQ_filtered.json b/annotations_filtered/cE71I4X9hWQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a2d4697927cd091c0e3a44b9b4b6f46ce6d2396 --- /dev/null +++ b/annotations_filtered/cE71I4X9hWQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.83], [10.0, 11.67], [12.0, 12.29], [14.0, 18.32], [21.0, 22.76], [24.0, 27.9], [28.0, 30.11], [31.0, 33.79], [35.0, 42.7], [43.0, 92.16], [93.0, 96.57], [97.0, 99.18], [101.0, 106.57], [108.0, 115.43], [116.0, 140.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 99.99, 99.98, 100.0, 0.0, 98.8, 86.45, 100.0, 100.0, 70.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.83, 1.67, 0.29, 4.32, 1.76, 3.9, 2.11, 2.79, 7.7, 49.16, 3.57, 2.18, 5.57, 7.43, 24.04]} \ No newline at end of file diff --git a/annotations_filtered/cEJhVm0TJUQ_filtered.json b/annotations_filtered/cEJhVm0TJUQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..091a2084d5bba4f36240f4e22ba894502c3885ff --- /dev/null +++ b/annotations_filtered/cEJhVm0TJUQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.91], [8.0, 9.34], [10.0, 11.75], [13.0, 13.31], [15.0, 15.06], [17.0, 17.2], [19.0, 19.43], [22.0, 22.59], [27.0, 27.78], [29.0, 29.71], [31.0, 37.07], [37.0, 38.58], [39.0, 41.52], [42.0, 43.82], [45.0, 45.59], [46.0, 47.09], [48.0, 49.25], [51.0, 51.14], [53.0, 53.62], [55.0, 54.89], [56.0, 56.76], [58.0, 59.71], [61.0, 62.19], [64.0, 65.3], [66.0, 66.75], [69.0, 69.99], [73.0, 73.82], [75.0, 79.78], [80.0, 81.57], [82.0, 83.2], [87.0, 88.01], [90.0, 91.15], [93.0, 93.93], [95.0, 96.06], [99.0, 99.69], [102.0, 102.83], [107.0, 107.69], [109.0, 109.56], [111.0, 111.55], [113.0, 113.61], [118.0, 118.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [63.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.31, 0.0, 56.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.91, 1.34, 1.75, 0.31, 0.06, 0.2, 0.43, 0.59, 0.78, 0.71, 6.07, 1.58, 2.52, 1.82, 0.59, 1.09, 1.25, 0.14, 0.62, -0.11, 0.76, 1.71, 1.19, 1.3, 0.75, 0.99, 0.82, 4.78, 1.57, 1.2, 1.01, 1.15, 0.93, 1.06, 0.69, 0.83, 0.69, 0.56, 0.55, 0.61, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/cEPa4RFLJ-0_filtered.json b/annotations_filtered/cEPa4RFLJ-0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3302e9f5f4ab8d80459c2aa04dd02bb93d653ffd --- /dev/null +++ b/annotations_filtered/cEPa4RFLJ-0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.01], [23.0, 27.13], [30.0, 30.82], [32.0, 33.27], [35.0, 35.75], [37.0, 37.89], [38.0, 38.35], [44.0, 44.71], [46.0, 47.21], [49.0, 49.67], [52.0, 53.15], [59.0, 59.43], [63.0, 64.35], [66.0, 67.36], [71.0, 70.83], [73.0, 74.34], [75.0, 75.57], [76.0, 77.9], [84.0, 85.68], [87.0, 93.5], [94.0, 95.84], [96.0, 104.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [60.23, 56.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.95, 0.0, 37.67], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.81], ["speech", 14.7], ["inside, small room", 4.15]], null, [["music", 55.03], ["hum", 6.88], ["synthesizer", 6.68]]], "duration": [2.01, 4.13, 0.82, 1.27, 0.75, 0.89, 0.35, 0.71, 1.21, 0.67, 1.15, 0.43, 1.35, 1.36, -0.17, 1.34, 0.57, 1.9, 1.68, 6.5, 1.84, 8.95]} \ No newline at end of file diff --git a/annotations_filtered/cETZjbXsUog_filtered.json b/annotations_filtered/cETZjbXsUog_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..461214823e607d76b8286c97d4af21f817eef8bb --- /dev/null +++ b/annotations_filtered/cETZjbXsUog_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.73], [7.0, 6.93], [8.0, 8.77], [10.0, 10.62], [12.0, 12.65], [21.0, 30.74], [31.0, 30.77], [31.0, 31.58], [32.0, 32.66], [34.0, 35.18], [38.0, 39.06], [40.0, 42.11], [43.0, 43.21], [44.0, 44.46], [51.0, 51.95], [61.0, 61.84], [62.0, 62.78], [63.0, 64.1], [64.0, 76.49], [77.0, 78.24], [80.0, 80.62], [85.0, 85.65], [88.0, 94.76], [96.0, 97.16], [100.0, 107.37]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 30.7, 0.0, 0.0, 0.0, 0.0, 0.0, 84.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 91.3, 0.0, 48.02], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 11.98], ["music", 9.42], ["speech", 8.77]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["noise", 32.94], ["mains hum", 18.12], ["effects unit", 10.76]]], "duration": [0.73, -0.07, 0.77, 0.62, 0.65, 9.74, -0.23, 0.58, 0.66, 1.18, 1.06, 2.11, 0.21, 0.46, 0.95, 0.84, 0.78, 1.1, 12.49, 1.24, 0.62, 0.65, 6.76, 1.16, 7.37]} \ No newline at end of file diff --git a/annotations_filtered/cEafT-GQfv4_filtered.json b/annotations_filtered/cEafT-GQfv4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a593019e4d5e5f16b9f7dd4bc8e8cbcfd6429b8f --- /dev/null +++ b/annotations_filtered/cEafT-GQfv4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.06], [23.0, 23.97], [27.0, 27.57], [32.0, 32.56], [46.0, 55.65], [59.0, 60.66], [73.0, 73.5], [75.0, 75.76], [78.0, 77.82], [80.0, 80.45], [83.0, 84.69], [89.0, 91.34], [92.0, 93.11]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [85.17, 0.0, 0.0, 0.0, 30.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 0.0], "audiomae_on_audioset": [null, null, null, null, [["gunshot, gunfire", 30.5], ["speech", 28.49], ["explosion", 8.66]], null, null, null, null, null, null, null, null], "duration": [2.06, 0.97, 0.57, 0.56, 9.65, 1.66, 0.5, 0.76, -0.18, 0.45, 1.69, 2.34, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/cEezHIqQrEw_filtered.json b/annotations_filtered/cEezHIqQrEw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..357ecfa23c0ff1625efca29f0790bb4d21b16475 --- /dev/null +++ b/annotations_filtered/cEezHIqQrEw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.44], [7.0, 8.33], [12.0, 12.48], [18.0, 20.36], [23.0, 25.57], [31.0, 31.13], [34.0, 34.77], [39.0, 40.93], [42.0, 42.55], [43.0, 47.66], [49.0, 49.91], [55.0, 75.78], [81.0, 85.51], [86.0, 87.32], [88.0, 96.74], [102.0, 113.61], [115.0, 115.32]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, true, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 84.62, 82.25, 0.0, 0.0, 0.0, 0.0, 41.36, 0.0, 32.61, 34.43, 0.0, 33.8, 34.55, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 38.7], ["fly, housefly", 17.32], ["insect", 13.45]], null, [["noise", 13.41], ["radio", 11.85], ["music", 11.28]], [["vehicle", 16.58], ["car", 9.29], ["race car, auto racing", 7.21]], null, [["speech", 44.44], ["noise", 11.24], ["vehicle", 9.11]], [["music", 12.98], ["cacophony", 9.19], ["vehicle", 7.11]], null], "duration": [1.44, 1.33, 0.48, 2.36, 2.57, 0.13, 0.77, 1.93, 0.55, 4.66, 0.91, 20.78, 4.51, 1.32, 8.74, 11.61, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/cEjo0ajod1M_filtered.json b/annotations_filtered/cEjo0ajod1M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76f54cce2415ee24d4786f0d881e3191fe3d778e --- /dev/null +++ b/annotations_filtered/cEjo0ajod1M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.55], [18.0, 18.81], [22.0, 22.62], [27.0, 28.58], [42.0, 42.57], [63.0, 63.66], [70.0, 70.46], [72.0, 72.4], [75.0, 75.36], [76.0, 77.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.55, 0.81, 0.62, 1.58, 0.57, 0.66, 0.46, 0.4, 0.36, 1.6]} \ No newline at end of file diff --git a/annotations_filtered/cErG8_neSa4_filtered.json b/annotations_filtered/cErG8_neSa4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f696f5322cf3c50090c1c1fde3b956c97e59c5c --- /dev/null +++ b/annotations_filtered/cErG8_neSa4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.95], [4.0, 15.36], [17.0, 16.98], [17.0, 19.74], [22.0, 25.88], [27.0, 27.73], [30.0, 30.05], [32.0, 32.34], [35.0, 35.56], [37.0, 39.85], [40.0, 40.93], [43.0, 42.69], [45.0, 48.07], [53.0, 54.08], [56.0, 57.37], [62.0, 63.71], [65.0, 68.72], [71.0, 72.67], [76.0, 78.51], [85.0, 85.28], [92.0, 96.11], [98.0, 98.34], [103.0, 104.28], [106.0, 106.96], [109.0, 109.12], [109.0, 109.78], [111.0, 111.72], [114.0, 114.34], [115.0, 116.02], [118.0, 118.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.96, 0.0, 99.8, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.05, 11.36, -0.02, 2.74, 3.88, 0.73, 0.05, 0.34, 0.56, 2.85, 0.93, -0.31, 3.07, 1.08, 1.37, 1.71, 3.72, 1.67, 2.51, 0.28, 4.11, 0.34, 1.28, 0.96, 0.12, 0.78, 0.72, 0.34, 1.02, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/cFVtyYzs48I_filtered.json b/annotations_filtered/cFVtyYzs48I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..532237dde769f50c5b1f35357b4d31929c14c916 --- /dev/null +++ b/annotations_filtered/cFVtyYzs48I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.35], [10.0, 9.86], [16.0, 16.83], [18.0, 96.62], [99.0, 114.62], [116.0, 116.36], [118.0, 120.85], [126.0, 126.39], [129.0, 130.15]], "keep_status": [false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.48, 0.0, 61.67, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["hum", 12.56], ["livestock, farm animals, working animals", 10.65], ["rumble", 7.98]], null, null, null, null], "duration": [0.35, -0.14, 0.83, 78.62, 15.62, 0.36, 2.85, 0.39, 1.15]} \ No newline at end of file diff --git a/annotations_filtered/cFZWNfXzFLU_filtered.json b/annotations_filtered/cFZWNfXzFLU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7fdfe69dfdf90bad263f33a603457ecc8668d62 --- /dev/null +++ b/annotations_filtered/cFZWNfXzFLU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.65], [6.0, 8.9], [9.0, 10.02], [15.0, 16.48], [19.0, 19.82], [22.0, 23.01], [24.0, 24.65], [25.0, 25.64], [28.0, 28.04], [29.0, 29.62], [36.0, 36.86], [38.0, 38.85], [40.0, 40.83], [41.0, 41.54], [43.0, 44.09], [46.0, 47.53], [50.0, 50.79], [53.0, 55.04], [58.0, 58.83], [62.0, 62.51], [63.0, 66.46], [69.0, 70.06], [74.0, 74.36], [77.0, 77.18], [80.0, 81.95], [83.0, 83.25], [84.0, 84.48], [88.0, 88.2], [89.0, 90.09], [92.0, 94.26], [95.0, 97.48], [98.0, 98.86], [101.0, 101.44], [103.0, 103.47], [104.0, 108.13], [110.0, 112.29], [115.0, 116.04], [117.0, 118.56], [120.0, 123.06], [124.0, 125.02], [125.0, 127.75], [130.0, 130.91], [136.0, 137.17], [138.0, 139.01], [141.0, 141.2], [142.0, 142.16], [143.0, 146.6], [148.0, 151.26], [160.0, 164.47], [167.0, 168.3], [174.0, 174.8], [179.0, 179.25], [181.0, 183.27], [184.0, 186.6], [187.0, 190.27], [193.0, 194.98], [196.0, 197.97], [198.0, 202.22], [205.0, 205.19], [207.0, 208.9], [213.0, 214.46], [215.0, 217.24], [219.0, 220.18], [227.0, 227.58], [228.0, 228.8], [230.0, 230.93], [232.0, 232.44], [236.0, 236.66], [238.0, 239.18], [240.0, 240.93], [244.0, 244.44], [245.0, 247.36]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, true, false, false, false, false, false, false, true, true, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 32.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 55.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 96.29, 0.0, 0.0, 0.0, 53.97, 38.46, 0.0, 0.0, 34.02, 0.0, 32.33, 0.0, 0.0, 0.0, 0.0, 0.0, 33.78, 38.82, 35.33, 0.0, 0.0, 0.0, 39.55, 33.36, 35.74, 0.0, 0.0, 34.93, 0.0, 0.0, 0.0, 33.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.1], "audiomae_on_audioset": [null, [["radio", 12.52], ["noise", 12.13], ["sidetone", 11.8]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.81], ["clarinet", 24.9], ["musical instrument", 8.37]], null, null, [["music", 43.31], ["whale vocalization", 12.27], ["theremin", 11.2]], null, [["music", 40.52], ["theremin", 6.43], ["musical instrument", 4.99]], null, null, null, null, null, [["music", 34.99], ["theremin", 9.85], ["guitar", 8.45]], [["music", 72.66], ["musical instrument", 7.52], ["synthesizer", 4.22]], [["music", 36.1], ["guitar", 23.91], ["musical instrument", 11.41]], null, null, null, [["didgeridoo", 42.59], ["music", 33.31], ["musical instrument", 2.43]], [["music", 24.46], ["foghorn", 11.57], ["theremin", 5.91]], [["music", 34.83], ["theremin", 27.46], ["wind instrument, woodwind instrument", 3.5]], null, null, [["music", 26.8], ["howl", 9.94], ["brass instrument", 8.73]], null, null, null, [["music", 34.09], ["didgeridoo", 6.34], ["musical instrument", 6.09]], null, null, null, null, null, null, null, null, null, [["music", 52.61], ["guitar", 10.56], ["musical instrument", 9.7]]], "duration": [3.65, 2.9, 1.02, 1.48, 0.82, 1.01, 0.65, 0.64, 0.04, 0.62, 0.86, 0.85, 0.83, 0.54, 1.09, 1.53, 0.79, 2.04, 0.83, 0.51, 3.46, 1.06, 0.36, 0.18, 1.95, 0.25, 0.48, 0.2, 1.09, 2.26, 2.48, 0.86, 0.44, 0.47, 4.13, 2.29, 1.04, 1.56, 3.06, 1.02, 2.75, 0.91, 1.17, 1.01, 0.2, 0.16, 3.6, 3.26, 4.47, 1.3, 0.8, 0.25, 2.27, 2.6, 3.27, 1.98, 1.97, 4.22, 0.19, 1.9, 1.46, 2.24, 1.18, 0.58, 0.8, 0.93, 0.44, 0.66, 1.18, 0.93, 0.44, 2.36]} \ No newline at end of file diff --git a/annotations_filtered/cFvxjIsjwoc_filtered.json b/annotations_filtered/cFvxjIsjwoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db576c8f03a3ca82d4ccfd6d393e0e888142b493 --- /dev/null +++ b/annotations_filtered/cFvxjIsjwoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 25.07], [26.0, 26.92], [29.0, 28.63], [30.0, 30.82], [31.0, 31.09], [33.0, 33.78], [37.0, 36.81], [38.0, 38.42], [39.0, 39.06], [41.0, 45.87], [48.0, 48.15], [49.0, 54.65], [60.0, 77.33], [78.0, 78.71], [81.0, 82.14], [86.0, 86.98], [88.0, 88.8], [91.0, 91.62], [95.0, 94.68], [98.0, 98.24], [104.0, 104.46], [109.0, 110.13], [110.0, 115.21], [116.0, 116.06], [118.0, 117.69], [122.0, 123.43], [127.0, 126.91], [130.0, 131.19], [147.0, 148.49], [149.0, 150.67], [154.0, 155.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.94, 0.0, 37.26, 44.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 67.97], ["thunk", 6.9], ["whack, thwack", 4.58]], null, [["speech", 80.64], ["crushing", 6.57], ["fart", 1.42]], [["music", 35.42], ["crushing", 14.82], ["theremin", 12.47]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.07, 0.92, -0.37, 0.82, 0.09, 0.78, -0.19, 0.42, 0.06, 4.87, 0.15, 5.65, 17.33, 0.71, 1.14, 0.98, 0.8, 0.62, -0.32, 0.24, 0.46, 1.13, 5.21, 0.06, -0.31, 1.43, -0.09, 1.19, 1.49, 1.67, 1.87]} \ No newline at end of file diff --git a/annotations_filtered/cFzsm8tKWU0_filtered.json b/annotations_filtered/cFzsm8tKWU0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0bd5d51a134d3061358941b1f5e9c5bb133636d7 --- /dev/null +++ b/annotations_filtered/cFzsm8tKWU0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.49], [9.0, 13.47], [18.0, 18.13], [24.0, 24.83], [27.0, 27.51], [30.0, 31.09], [33.0, 33.56], [37.0, 38.2], [40.0, 41.05], [42.0, 44.25], [47.0, 52.56], [54.0, 56.94], [62.0, 66.02], [73.0, 74.63], [75.0, 74.87], [84.0, 85.11], [86.0, 89.26], [90.0, 92.42], [95.0, 97.73], [98.0, 111.43], [112.0, 112.62], [115.0, 116.11], [124.0, 127.45], [128.0, 128.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 37.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.79, 35.62, 32.61, 32.49, 0.0, 0.0, 0.0, 38.15, 94.07, 99.62, 46.83, 0.0, 0.0, 39.27, 0.0], "audiomae_on_audioset": [null, [["music", 71.63], ["carnatic music", 6.6], ["musical instrument", 2.52]], null, null, null, null, null, null, null, null, [["music", 57.88], ["theremin", 27.07], ["musical instrument", 2.94]], [["music", 69.8], ["theremin", 21.9], ["musical instrument", 2.68]], [["theremin", 63.67], ["music", 23.7], ["effects unit", 2.89]], null, null, null, [["music", 47.33], ["humming", 2.52], ["vocal music", 2.18]], null, null, [["music", 50.83], ["synthesizer", 6.9], ["gong", 5.68]], null, null, [["theremin", 92.61], ["music", 5.72], ["musical instrument", 0.21]], null], "duration": [0.49, 4.47, 0.13, 0.83, 0.51, 1.09, 0.56, 1.2, 1.05, 2.25, 5.56, 2.94, 4.02, 1.63, -0.13, 1.11, 3.26, 2.42, 2.73, 13.43, 0.62, 1.11, 3.45, 0.21]} \ No newline at end of file diff --git a/annotations_filtered/cG0ZIxenJY8_filtered.json b/annotations_filtered/cG0ZIxenJY8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..490c2d88ee0fd3883de95a59bd060b29c681015e --- /dev/null +++ b/annotations_filtered/cG0ZIxenJY8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.46], [25.0, 25.84], [39.0, 39.12], [46.0, 47.14], [53.0, 55.19], [56.0, 57.23], [59.0, 61.53], [63.0, 62.94], [63.0, 64.17], [67.0, 81.63], [82.0, 84.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 68.02, 0.0, 0.0, 86.45, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.46, 0.84, 0.12, 1.14, 2.19, 1.23, 2.53, -0.06, 1.17, 14.63, 2.03]} \ No newline at end of file diff --git a/annotations_filtered/cGDwEP-RWHo_filtered.json b/annotations_filtered/cGDwEP-RWHo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..204950bfb8db841b14ee77ae852552e095c4c98e --- /dev/null +++ b/annotations_filtered/cGDwEP-RWHo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.24], [5.0, 5.49], [8.0, 11.03], [12.0, 17.37], [19.0, 23.11], [24.0, 26.99], [28.0, 29.61], [31.0, 33.32], [34.0, 38.01], [39.0, 45.33], [47.0, 50.9], [52.0, 55.31], [57.0, 74.68], [77.0, 80.0], [81.0, 83.51], [87.0, 93.77], [95.0, 97.9], [99.0, 100.75], [101.0, 102.71], [105.0, 106.81], [111.0, 115.32], [117.0, 122.74], [124.0, 173.72], [174.0, 175.68], [176.0, 178.14]], "keep_status": [false, false, true, true, true, true, false, true, true, true, true, false, true, false, false, false, true, false, false, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 36.52, 31.17, 34.1, 37.08, 0.0, 33.99, 34.72, 29.68, 33.14, 37.8, 46.72, 50.56, 46.43, 30.36, 38.93, 0.0, 0.0, 0.0, 38.41, 32.84, 0.0, 0.0, 37.66], "audiomae_on_audioset": [null, null, [["hum", 16.73], ["music", 15.82], ["chirp tone", 10.9]], [["creak", 28.1], ["speech", 9.43], ["mechanisms", 8.27]], [["hum", 29.89], ["music", 8.9], ["chirp tone", 6.75]], [["music", 21.16], ["hum", 20.4], ["sine wave", 7.14]], null, [["hum", 30.15], ["mains hum", 20.68], ["music", 9.61]], [["speech", 46.07], ["hum", 9.52], ["rumble", 8.56]], [["speech", 21.7], ["sine wave", 19.1], ["chirp tone", 6.4]], [["rumble", 50.68], ["hum", 5.46], ["music", 5.26]], [["hum", 40.5], ["throbbing", 33.09], ["mains hum", 13.85]], [["coin (dropping)", 16.53], ["music", 6.33], ["speech", 5.9]], null, [["hum", 43.79], ["throbbing", 28.44], ["mains hum", 11.35]], [["hum", 38.71], ["throbbing", 21.42], ["mains hum", 15.03]], [["music", 19.81], ["gong", 17.68], ["hum", 17.62]], null, null, null, [["hum", 47.99], ["mains hum", 12.96], ["music", 6.14]], [["music", 28.39], ["hum", 25.52], ["mains hum", 5.22]], null, null, [["rumble", 31.7], ["hum", 11.97], ["eruption", 9.58]]], "duration": [0.24, 0.49, 3.03, 5.37, 4.11, 2.99, 1.61, 2.32, 4.01, 6.33, 3.9, 3.31, 17.68, 3.0, 2.51, 6.77, 2.9, 1.75, 1.71, 1.81, 4.32, 5.74, 49.72, 1.68, 2.14]} \ No newline at end of file diff --git a/annotations_filtered/cGP9TwLnG78_filtered.json b/annotations_filtered/cGP9TwLnG78_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac9231f80a76e6d60e4546709910f43c848debc5 --- /dev/null +++ b/annotations_filtered/cGP9TwLnG78_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.32], [7.0, 8.29], [11.0, 10.67], [11.0, 12.51], [13.0, 14.13], [15.0, 15.4], [16.0, 16.8], [24.0, 24.88], [27.0, 28.58], [30.0, 34.52], [37.0, 38.45], [39.0, 40.26], [42.0, 42.89], [44.0, 44.1], [44.0, 46.01], [46.0, 49.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.8, 0.0, 0.0, 0.0, 0.0, 56.55, 42.28], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.79], ["sidetone", 11.03], ["sine wave", 10.44]]], "duration": [1.32, 1.29, -0.33, 1.51, 1.13, 0.4, 0.8, 0.88, 1.58, 4.52, 1.45, 1.26, 0.89, 0.1, 2.01, 3.65]} \ No newline at end of file diff --git a/annotations_filtered/cGTn7aRFttk_filtered.json b/annotations_filtered/cGTn7aRFttk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d41bfb97dec5f781f835fec7824817834878434a --- /dev/null +++ b/annotations_filtered/cGTn7aRFttk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 32.61], [71.0, 70.73], [73.0, 73.72], [86.0, 91.64], [99.0, 100.14], [111.0, 112.51], [116.0, 116.31]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.02, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 48.09], ["mains hum", 16.52], ["noise", 9.48]], null, null, null], "duration": [1.61, -0.27, 0.72, 5.64, 1.14, 1.51, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/cGbTf-FgG-M_filtered.json b/annotations_filtered/cGbTf-FgG-M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8019cf7e7ab8677cb86fef55b6e985b5c5e6bc57 --- /dev/null +++ b/annotations_filtered/cGbTf-FgG-M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 12.23], [18.0, 23.68], [25.0, 75.15], [76.0, 82.39], [83.0, 84.21]], "keep_status": [false, false, false, false, false], "silence_prob": [31.55, 48.31, 0.0, 91.98, 0.0], "audiomae_on_audioset": [[["speech", 61.1], ["explosion", 6.45], ["music", 4.43]], [["speech", 83.16], ["inside, small room", 2.33], ["frog", 0.89]], null, null, null], "duration": [5.23, 5.68, 50.15, 6.39, 1.21]} \ No newline at end of file diff --git a/annotations_filtered/cGd2BBjzb0Y_filtered.json b/annotations_filtered/cGd2BBjzb0Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4af7efe957e4a9292d1a90fdc436a71cf65aa69d --- /dev/null +++ b/annotations_filtered/cGd2BBjzb0Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.6], [5.0, 11.84], [12.0, 14.5], [15.0, 16.12], [17.0, 18.94], [22.0, 22.67], [28.0, 32.14], [37.0, 38.57], [39.0, 38.75], [42.0, 42.52], [44.0, 44.76], [47.0, 48.52]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 42.67, 39.58, 0.0, 0.0, 0.0, 35.87, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["bee, wasp, etc.", 37.64], ["fly, housefly", 23.44], ["insect", 11.21]], [["fly, housefly", 56.63], ["bee, wasp, etc.", 19.92], ["insect", 17.13]], null, null, null, [["speech", 33.37], ["sidetone", 12.49], ["fly, housefly", 4.77]], null, null, null, null, null], "duration": [0.6, 6.84, 2.5, 1.12, 1.94, 0.67, 4.14, 1.57, -0.25, 0.52, 0.76, 1.52]} \ No newline at end of file diff --git a/annotations_filtered/cGgPJKE_jSs_filtered.json b/annotations_filtered/cGgPJKE_jSs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ffdb20366d5201989e872bed669e0f91aa34abc7 --- /dev/null +++ b/annotations_filtered/cGgPJKE_jSs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.53], [22.0, 38.74], [39.0, 38.77], [39.0, 39.82], [40.0, 40.9], [46.0, 51.98], [53.0, 54.3], [59.0, 60.54], [68.0, 77.35]], "keep_status": [false, true, false, false, false, true, false, false, false], "silence_prob": [46.64, 38.33, 0.0, 0.0, 0.0, 38.62, 0.0, 0.0, 37.4], "audiomae_on_audioset": [[["music", 60.05], ["musical instrument", 6.51], ["synthesizer", 5.13]], [["music", 52.06], ["percussion", 10.57], ["wood block", 6.68]], null, null, null, [["music", 58.84], ["percussion", 5.16], ["musical instrument", 4.64]], null, null, [["music", 77.01], ["swing music", 3.5], ["musical instrument", 2.22]]], "duration": [2.53, 16.74, -0.23, 0.82, 0.9, 5.98, 1.3, 1.54, 9.35]} \ No newline at end of file diff --git a/annotations_filtered/cH8W_cTQQvw_filtered.json b/annotations_filtered/cH8W_cTQQvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e04053128f969048c3058f625ab7f8dbe6456495 --- /dev/null +++ b/annotations_filtered/cH8W_cTQQvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.62], [4.0, 5.73], [6.0, 7.16], [13.0, 14.07], [16.0, 16.68], [20.0, 21.69], [31.0, 32.27], [48.0, 49.65], [51.0, 52.12], [59.0, 59.09], [62.0, 62.48], [71.0, 72.59], [74.0, 75.17], [78.0, 85.87], [96.0, 96.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.31, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.13], ["musical instrument", 9.69], ["brass instrument", 7.25]], null], "duration": [1.62, 1.73, 1.16, 1.07, 0.68, 1.69, 1.27, 1.65, 1.12, 0.09, 0.48, 1.59, 1.17, 7.87, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/cHQcdgc_Whk_filtered.json b/annotations_filtered/cHQcdgc_Whk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d37701563ae6aceb6716f75b13909873114a5b5f --- /dev/null +++ b/annotations_filtered/cHQcdgc_Whk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.52], [3.0, 4.21], [5.0, 5.48], [8.0, 8.23], [10.0, 10.54], [19.0, 19.33], [21.0, 21.84], [25.0, 25.2], [26.0, 26.11], [27.0, 27.03], [28.0, 28.7], [32.0, 32.73], [35.0, 36.53], [37.0, 37.86], [39.0, 39.87], [42.0, 42.52], [43.0, 43.29], [45.0, 45.44], [47.0, 47.24], [48.0, 48.88], [53.0, 53.32], [59.0, 58.73], [63.0, 63.44], [64.0, 64.69], [67.0, 67.17], [70.0, 69.9], [79.0, 79.51], [80.0, 80.01], [81.0, 81.57], [82.0, 82.26], [83.0, 83.46], [84.0, 84.45], [91.0, 91.67], [92.0, 92.31], [93.0, 93.41], [94.0, 94.91], [95.0, 96.36], [97.0, 98.05], [98.0, 99.28], [101.0, 101.33], [107.0, 107.45], [108.0, 108.51], [110.0, 111.84], [113.0, 112.78], [113.0, 113.36], [120.0, 120.34], [122.0, 123.15], [123.0, 124.12], [125.0, 125.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.52, 1.21, 0.48, 0.23, 0.54, 0.33, 0.84, 0.2, 0.11, 0.03, 0.7, 0.73, 1.53, 0.86, 0.87, 0.52, 0.29, 0.44, 0.24, 0.88, 0.32, -0.27, 0.44, 0.69, 0.17, -0.1, 0.51, 0.01, 0.57, 0.26, 0.46, 0.45, 0.67, 0.31, 0.41, 0.91, 1.36, 1.05, 1.28, 0.33, 0.45, 0.51, 1.84, -0.22, 0.36, 0.34, 1.15, 1.12, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/cHT2zdQT3Ps_filtered.json b/annotations_filtered/cHT2zdQT3Ps_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75f152cb8a3187f5b8bf0e87814580fed31408d7 --- /dev/null +++ b/annotations_filtered/cHT2zdQT3Ps_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 13.49], [14.0, 15.77], [17.0, 20.12], [29.0, 32.61], [34.0, 35.24], [42.0, 42.09], [43.0, 49.13], [49.0, 49.87], [54.0, 54.45], [55.0, 71.9], [72.0, 79.93], [81.0, 81.8], [82.0, 102.71], [104.0, 104.06], [105.0, 113.51], [114.0, 117.31], [120.0, 120.5], [125.0, 126.39]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [42.26, 0.0, 95.09, 40.77, 0.0, 0.0, 36.8, 0.0, 0.0, 29.63, 45.82, 0.0, 36.48, 0.0, 41.98, 55.04, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 20.43], ["fly, housefly", 13.62], ["fart", 7.91]], null, null, [["speech", 63.15], ["didgeridoo", 13.18], ["music", 7.59]], null, null, [["speech", 58.26], ["grunt", 9.3], ["music", 3.29]], null, null, [["speech", 70.38], ["music", 12.44], ["thump, thud", 2.22]], [["speech", 15.83], ["cattle, bovinae", 10.03], ["animal", 6.35]], null, [["music", 32.75], ["hum", 21.5], ["sidetone", 13.79]], null, [["fart", 54.34], ["speech", 21.93], ["fly, housefly", 3.58]], null, null, null], "duration": [8.49, 1.77, 3.12, 3.61, 1.24, 0.09, 6.13, 0.87, 0.45, 16.9, 7.93, 0.8, 20.71, 0.06, 8.51, 3.31, 0.5, 1.39]} \ No newline at end of file diff --git a/annotations_filtered/cIE1fT395HM_filtered.json b/annotations_filtered/cIE1fT395HM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a113b94f969d598ee36af9ce2def2d40f5b52bec --- /dev/null +++ b/annotations_filtered/cIE1fT395HM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.9], [10.0, 10.5], [17.0, 29.96], [32.0, 32.34], [33.0, 33.76], [47.0, 47.75], [49.0, 50.33], [52.0, 52.69], [60.0, 60.71], [69.0, 69.94], [75.0, 75.66], [76.0, 77.43], [82.0, 83.24], [84.0, 84.0], [89.0, 91.86], [92.0, 94.04], [97.0, 101.82], [108.0, 111.96], [115.0, 114.89], [115.0, 116.97], [119.0, 118.83], [120.0, 119.82], [121.0, 121.59], [123.0, 123.11], [124.0, 127.3]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 44.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.37, 99.68, 37.92, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, [["animal", 16.6], ["speech", 14.97], ["livestock, farm animals, working animals", 12.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["neigh, whinny", 44.63], ["horse", 36.58], ["animal", 15.02]], null, null, null, null, null, null, null, null], "duration": [0.9, 0.5, 12.96, 0.34, 0.76, 0.75, 1.33, 0.69, 0.71, 0.94, 0.66, 1.43, 1.24, 0.0, 2.86, 2.04, 4.82, 3.96, -0.11, 1.97, -0.17, -0.18, 0.59, 0.11, 3.3]} \ No newline at end of file diff --git a/annotations_filtered/cIEPiYHzTto_filtered.json b/annotations_filtered/cIEPiYHzTto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60d455a54a2f9fac92dcaee12c37f7f11a0175eb --- /dev/null +++ b/annotations_filtered/cIEPiYHzTto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 34.89], [42.0, 42.62], [52.0, 52.66], [62.0, 68.23], [68.0, 68.35], [87.0, 99.62], [103.0, 105.09]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [29.8, 0.0, 0.0, 29.85, 0.0, 29.37, 29.8], "audiomae_on_audioset": [[["music", 60.85], ["drum machine", 12.11], ["synthesizer", 5.8]], null, null, [["music", 88.8], ["hip hop music", 1.75], ["scratching (performance technique)", 1.21]], null, [["music", 65.0], ["hum", 6.69], ["electronic music", 3.62]], [["music", 46.23], ["speech", 15.46], ["electronic music", 2.51]]], "duration": [23.89, 0.62, 0.66, 6.23, 0.35, 12.62, 2.09]} \ No newline at end of file diff --git a/annotations_filtered/cIG0COsZmjg_filtered.json b/annotations_filtered/cIG0COsZmjg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ac71a0c12c27f8773b22cdbd6dcf688256e3944 --- /dev/null +++ b/annotations_filtered/cIG0COsZmjg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.5], [8.0, 17.19], [18.0, 18.89], [20.0, 21.02], [22.0, 24.29], [25.0, 27.58], [28.0, 29.3], [31.0, 33.54], [34.0, 36.42], [38.0, 42.79], [44.0, 45.99], [47.0, 47.97], [48.0, 53.32], [54.0, 54.46], [56.0, 57.33], [59.0, 59.71], [60.0, 60.72], [63.0, 63.02], [66.0, 81.38], [85.0, 93.55], [94.0, 100.8], [101.0, 102.49], [103.0, 104.33], [105.0, 105.34], [106.0, 107.37], [108.0, 108.08], [112.0, 113.61], [115.0, 116.8], [119.0, 118.94], [121.0, 121.73], [122.0, 122.64], [127.0, 131.48], [131.0, 131.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [97.22, 98.19, 0.0, 0.0, 54.23, 74.92, 0.0, 98.01, 68.93, 99.97, 0.0, 0.0, 95.51, 0.0, 0.0, 0.0, 0.0, 0.0, 42.84, 99.84, 88.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.19, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.59], ["speech", 13.11], ["boing", 10.08]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 21.48], ["speech", 12.64], ["whale vocalization", 11.35]], null], "duration": [4.5, 9.19, 0.89, 1.02, 2.29, 2.58, 1.3, 2.54, 2.42, 4.79, 1.99, 0.97, 5.32, 0.46, 1.33, 0.71, 0.72, 0.02, 15.38, 8.55, 6.8, 1.49, 1.33, 0.34, 1.37, 0.08, 1.61, 1.8, -0.06, 0.73, 0.64, 4.48, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/cINFeXqwbDo_filtered.json b/annotations_filtered/cINFeXqwbDo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e18f60cd3fb402a54ac923ff9e5ec09400dd87e --- /dev/null +++ b/annotations_filtered/cINFeXqwbDo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 26.28], [28.0, 27.94], [28.0, 28.75], [31.0, 78.73], [82.0, 90.32], [91.0, 94.64], [96.0, 95.94], [99.0, 105.43], [107.0, 118.29], [119.0, 119.84], [121.0, 152.86], [155.0, 155.33], [158.0, 158.26], [160.0, 175.51]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [60.79, 0.0, 0.0, 0.0, 48.95, 45.27, 0.0, 48.35, 40.71, 0.0, 0.0, 0.0, 0.0, 41.46], "audiomae_on_audioset": [null, null, null, null, [["fly, housefly", 32.41], ["electric shaver, electric razor", 15.75], ["noise", 11.27]], [["cattle, bovinae", 33.01], ["livestock, farm animals, working animals", 30.26], ["moo", 21.47]], null, [["electric shaver, electric razor", 52.82], ["radio", 16.65], ["music", 4.62]], [["speech", 34.16], ["frog", 18.48], ["radio", 9.41]], null, null, null, null, [["music", 59.31], ["speech", 20.01], ["electric shaver, electric razor", 4.19]]], "duration": [9.28, -0.06, 0.75, 47.73, 8.32, 3.64, -0.06, 6.43, 11.29, 0.84, 31.86, 0.33, 0.26, 15.51]} \ No newline at end of file diff --git a/annotations_filtered/cIRL7jMVh8Q_filtered.json b/annotations_filtered/cIRL7jMVh8Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef3ccfb3cafb2c37c66323210b551aadc95f2280 --- /dev/null +++ b/annotations_filtered/cIRL7jMVh8Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.41], [14.0, 19.38], [21.0, 20.95], [22.0, 23.94], [28.0, 53.03], [57.0, 57.37], [59.0, 60.79], [61.0, 81.99], [82.0, 117.76], [118.0, 120.87], [121.0, 120.99], [121.0, 121.2], [121.0, 122.5], [127.0, 173.53]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 35.22, 0.0, 0.0, 30.33, 0.0, 0.0, 51.82, 0.0, 42.33, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 45.22], ["hum", 7.25], ["music", 6.56]], null, null, [["music", 31.85], ["throbbing", 26.49], ["hum", 19.15]], null, null, null, null, [["music", 46.33], ["hum", 12.28], ["ambient music", 8.53]], null, null, null, null], "duration": [1.41, 5.38, -0.05, 1.94, 25.03, 0.37, 1.79, 20.99, 35.76, 2.87, -0.01, 0.2, 1.5, 46.53]} \ No newline at end of file diff --git a/annotations_filtered/cIiMDK4UMQM_filtered.json b/annotations_filtered/cIiMDK4UMQM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b0b1df743b876111e9d29a9d7b3631c0c55f452 --- /dev/null +++ b/annotations_filtered/cIiMDK4UMQM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.55], [5.0, 5.58], [6.0, 5.81], [7.0, 7.06], [7.0, 7.82], [9.0, 9.78], [13.0, 19.3], [20.0, 20.92], [23.0, 26.49], [28.0, 30.13], [30.0, 33.96], [35.0, 43.41], [46.0, 71.34], [72.0, 104.25], [106.0, 107.33]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.0, 0.0, 79.07, 45.92, 49.13, 48.1, 55.53, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 14.55], ["fly, housefly", 10.85], ["mosquito", 8.77]], [["speech", 61.54], ["sidetone", 18.22], ["dial tone", 5.96]], [["whale vocalization", 88.04], ["sidetone", 1.32], ["noise", 1.26]], null, null, null], "duration": [1.55, 0.58, -0.19, 0.06, 0.82, 0.78, 6.3, 0.92, 3.49, 2.13, 3.96, 8.41, 25.34, 32.25, 1.33]} \ No newline at end of file diff --git a/annotations_filtered/cIscGgQD4uE_filtered.json b/annotations_filtered/cIscGgQD4uE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fad7cc545cad756f5695a8f1c8a0189ddb39af1 --- /dev/null +++ b/annotations_filtered/cIscGgQD4uE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.75], [16.0, 16.88], [20.0, 19.82], [31.0, 37.44], [41.0, 41.91], [46.0, 46.38], [48.0, 48.69], [56.0, 57.15], [59.0, 61.03], [61.0, 62.18], [76.0, 80.42], [84.0, 85.94], [89.0, 90.02], [95.0, 95.99], [99.0, 110.91], [111.0, 113.97], [114.0, 115.53], [119.0, 119.04], [122.0, 123.36], [124.0, 124.8], [127.0, 128.26], [128.0, 129.79]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 47.27, 0.0, 0.0, 0.0, 0.0, 61.27, 0.0, 35.19, 0.0, 0.0, 0.0, 32.79, 43.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["cattle, bovinae", 22.32], ["livestock, farm animals, working animals", 21.71], ["moo", 20.69]], null, null, null, null, null, null, [["music", 74.71], ["musical instrument", 7.88], ["singing", 2.44]], null, null, null, [["music", 78.48], ["speech", 3.2], ["electronic music", 2.13]], [["speech", 45.54], ["music", 16.12], ["moo", 6.57]], null, null, null, null, null, null], "duration": [1.75, 0.88, -0.18, 6.44, 0.91, 0.38, 0.69, 1.15, 2.03, 1.18, 4.42, 1.94, 1.02, 0.99, 11.91, 2.97, 1.53, 0.04, 1.36, 0.8, 1.26, 1.79]} \ No newline at end of file diff --git a/annotations_filtered/cJ4mSB-0OA0_filtered.json b/annotations_filtered/cJ4mSB-0OA0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6f0227600ea962dbbd06269fd714bb2c19d8859 --- /dev/null +++ b/annotations_filtered/cJ4mSB-0OA0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 46.28], [50.0, 51.65], [53.0, 53.76], [55.0, 55.0], [76.0, 76.86], [79.0, 80.15], [87.0, 87.35], [95.0, 97.39], [118.0, 118.61], [120.0, 119.94], [120.0, 120.95], [131.0, 131.73], [136.0, 136.39], [161.0, 165.64]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.54, 0.0, 0.0, 0.0, 0.0, 0.0, 89.19], "audiomae_on_audioset": [[["hum", 44.41], ["speech", 10.71], ["mains hum", 9.23]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.28, 1.65, 0.76, 0.0, 0.86, 1.15, 0.35, 2.39, 0.61, -0.06, 0.95, 0.73, 0.39, 4.64]} \ No newline at end of file diff --git a/annotations_filtered/cJOqz6CPxLY_filtered.json b/annotations_filtered/cJOqz6CPxLY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cbbfeb9abf0fe6b2318fb921d2869aa6f9245543 --- /dev/null +++ b/annotations_filtered/cJOqz6CPxLY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.09], [10.0, 16.56], [19.0, 22.35], [23.0, 28.38], [29.0, 29.94], [33.0, 33.74], [36.0, 36.05], [37.0, 38.57], [52.0, 53.0], [62.0, 64.99], [67.0, 70.14], [72.0, 72.12], [76.0, 87.42], [88.0, 89.16], [90.0, 91.47], [93.0, 96.03], [97.0, 97.65], [103.0, 103.4], [106.0, 106.52], [110.0, 110.94], [115.0, 117.73], [120.0, 123.8]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.96, 99.99, 98.73, 0.0, 0.0, 0.0, 0.0, 0.0, 43.77, 80.82, 0.0, 87.74, 0.0, 0.0, 94.22, 0.0, 0.0, 0.0, 0.0, 99.96, 91.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 30.31], ["livestock, farm animals, working animals", 14.92], ["cattle, bovinae", 9.11]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.09, 6.56, 3.35, 5.38, 0.94, 0.74, 0.05, 1.57, 1.0, 2.99, 3.14, 0.12, 11.42, 1.16, 1.47, 3.03, 0.65, 0.4, 0.52, 0.94, 2.73, 3.8]} \ No newline at end of file diff --git a/annotations_filtered/cJYwpfA3HWY_filtered.json b/annotations_filtered/cJYwpfA3HWY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c446be59c821fc819dc750859f71032be0efa658 --- /dev/null +++ b/annotations_filtered/cJYwpfA3HWY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 20.21], [22.0, 28.46], [29.0, 29.02], [29.0, 29.44], [29.0, 29.66], [31.0, 31.92], [33.0, 34.03], [37.0, 37.79], [38.0, 42.08], [43.0, 42.89], [43.0, 45.67], [46.0, 49.35], [50.0, 57.52], [60.0, 60.03], [62.0, 62.02], [65.0, 67.34], [68.0, 72.55], [74.0, 82.68], [84.0, 84.42], [85.0, 86.19], [88.0, 87.98], [88.0, 88.72], [95.0, 95.07], [96.0, 97.88], [100.0, 100.25], [104.0, 122.15], [123.0, 123.43], [124.0, 127.4], [128.0, 129.86]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [36.22, 33.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.47, 0.0, 76.7, 84.8, 31.15, 0.0, 0.0, 29.91, 29.47, 35.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.55, 0.0, 92.97, 0.0], "audiomae_on_audioset": [[["music", 37.8], ["speech", 14.74], ["musical instrument", 10.0]], [["music", 25.07], ["keyboard (musical)", 24.8], ["piano", 19.57]], null, null, null, null, null, null, [["music", 65.71], ["speech", 14.02], ["musical instrument", 4.95]], null, null, null, [["music", 74.44], ["musical instrument", 5.18], ["electronic music", 2.06]], null, null, [["music", 53.86], ["synthesizer", 4.45], ["musical instrument", 4.2]], [["music", 50.16], ["speech", 14.35], ["cacophony", 7.38]], [["music", 65.57], ["timpani", 7.94], ["musical instrument", 3.16]], null, null, null, null, null, null, null, [["gong", 35.3], ["music", 21.58], ["musical instrument", 6.88]], null, null, null], "duration": [4.21, 6.46, 0.02, 0.44, 0.66, 0.92, 1.03, 0.79, 4.08, -0.11, 2.67, 3.35, 7.52, 0.03, 0.02, 2.34, 4.55, 8.68, 0.42, 1.19, -0.02, 0.72, 0.07, 1.88, 0.25, 18.15, 0.43, 3.4, 1.86]} \ No newline at end of file diff --git a/annotations_filtered/cJeYngoI1oA_filtered.json b/annotations_filtered/cJeYngoI1oA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8cb1c4b5b6a44816f39def13cdad0c1a18e2202 --- /dev/null +++ b/annotations_filtered/cJeYngoI1oA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.7], [22.0, 31.83], [32.0, 33.98], [35.0, 38.92], [41.0, 42.15], [43.0, 56.37], [57.0, 59.09], [59.0, 64.64], [65.0, 71.12], [72.0, 72.62], [73.0, 77.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 100.0, 0.0, 100.0, 100.0, 100.0, 100.0, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.7, 9.83, 1.98, 3.92, 1.15, 13.37, 2.09, 5.64, 6.12, 0.62, 4.35]} \ No newline at end of file diff --git a/annotations_filtered/cJti4-26uFE_filtered.json b/annotations_filtered/cJti4-26uFE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a055e81deac368787696245c8f515dedf1b0fd8c --- /dev/null +++ b/annotations_filtered/cJti4-26uFE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 40.44], [43.0, 61.47], [63.0, 74.8], [77.0, 77.9], [80.0, 80.05], [86.0, 88.74]], "keep_status": [false, false, false, false, false, false], "silence_prob": [31.23, 29.61, 35.1, 0.0, 0.0, 99.76], "audiomae_on_audioset": [[["whale vocalization", 52.61], ["theremin", 23.1], ["music", 4.86]], [["music", 65.55], ["didgeridoo", 4.78], ["cacophony", 3.54]], [["gong", 58.39], ["music", 12.22], ["breaking", 3.93]], null, null, null], "duration": [29.44, 18.47, 11.8, 0.9, 0.05, 2.74]} \ No newline at end of file diff --git a/annotations_filtered/cJyhEAxnQ-U_filtered.json b/annotations_filtered/cJyhEAxnQ-U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72c5d0af370939dac5fe1c0e3f8c13f2e97d43af --- /dev/null +++ b/annotations_filtered/cJyhEAxnQ-U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.75], [7.0, 8.72], [11.0, 12.53], [16.0, 16.51], [18.0, 20.01], [23.0, 24.53], [27.0, 27.51], [29.0, 32.95], [38.0, 38.7], [40.0, 41.74], [44.0, 47.49], [49.0, 49.59], [52.0, 52.56], [54.0, 53.99], [57.0, 57.4], [59.0, 59.97], [62.0, 62.58], [66.0, 67.68], [71.0, 72.76], [74.0, 78.06], [80.0, 81.31], [84.0, 85.92], [88.0, 88.62], [91.0, 92.77], [93.0, 94.64], [96.0, 98.31], [100.0, 102.88], [105.0, 108.8], [110.0, 111.91], [113.0, 115.18], [116.0, 117.8], [119.0, 119.43], [121.0, 121.86], [123.0, 125.22]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.7, 0.0, 0.0, 43.28, 0.0, 0.0, 40.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.27, 0.0, 0.0, 0.0, 0.0, 0.0, 47.9, 40.34, 55.04, 0.0, 48.23, 0.0, 0.0, 0.0, 65.67], "audiomae_on_audioset": [null, null, null, null, [["music", 24.72], ["speech", 22.71], ["sidetone", 14.64]], null, null, [["music", 35.67], ["singing bowl", 12.75], ["hum", 10.82]], null, null, [["music", 66.45], ["gong", 12.22], ["hum", 3.05]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 36.12], ["sidetone", 26.86], ["music", 12.49]], [["sidetone", 73.73], ["music", 13.99], ["mains hum", 4.46]], null, null, [["music", 28.1], ["speech", 14.85], ["sidetone", 9.51]], null, null, null, null], "duration": [0.75, 1.72, 1.53, 0.51, 2.01, 1.53, 0.51, 3.95, 0.7, 1.74, 3.49, 0.59, 0.56, -0.01, 0.4, 0.97, 0.58, 1.68, 1.76, 4.06, 1.31, 1.92, 0.62, 1.77, 1.64, 2.31, 2.88, 3.8, 1.91, 2.18, 1.8, 0.43, 0.86, 2.22]} \ No newline at end of file diff --git a/annotations_filtered/cKewmzrevAw_filtered.json b/annotations_filtered/cKewmzrevAw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54d64e4b4551bd46c8f62f9d26f7cb227f7cb0e7 --- /dev/null +++ b/annotations_filtered/cKewmzrevAw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 15.45], [17.0, 21.03], [24.0, 24.07], [25.0, 52.15], [56.0, 56.2], [61.0, 60.59], [61.0, 66.83], [67.0, 68.66], [71.0, 71.24], [72.0, 73.04], [78.0, 84.23], [87.0, 87.98], [90.0, 91.08], [93.0, 93.5], [99.0, 99.77], [102.0, 103.1], [105.0, 105.36], [107.0, 108.23], [113.0, 113.91], [115.0, 116.28]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.57, 31.46, 0.0, 29.91, 0.0, 0.0, 33.48, 0.0, 0.0, 0.0, 40.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 72.96], ["hum", 8.1], ["throbbing", 7.97]], [["music", 47.03], ["hum", 8.11], ["throbbing", 6.89]], null, [["hum", 35.77], ["mains hum", 19.8], ["vehicle", 13.56]], null, null, [["sidetone", 39.51], ["speech", 16.89], ["fly, housefly", 15.36]], null, null, null, [["music", 61.09], ["effects unit", 6.28], ["creak", 3.85]], null, null, null, null, null, null, null, null, null], "duration": [9.45, 4.03, 0.07, 27.15, 0.2, -0.41, 5.83, 1.66, 0.24, 1.04, 6.23, 0.98, 1.08, 0.5, 0.77, 1.1, 0.36, 1.23, 0.91, 1.28]} \ No newline at end of file diff --git a/annotations_filtered/cKpV6Wb81Ak_filtered.json b/annotations_filtered/cKpV6Wb81Ak_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..210a3ff8d2d2c060edf06c4b30a3cae6d5635f76 --- /dev/null +++ b/annotations_filtered/cKpV6Wb81Ak_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [8.0, 8.87], [11.0, 12.93], [14.0, 14.01], [15.0, 15.52], [31.0, 30.91], [33.0, 33.59], [36.0, 37.94], [38.0, 46.45], [48.0, 48.76], [56.0, 69.16], [73.0, 77.09], [89.0, 108.28], [111.0, 111.69], [114.0, 116.13], [118.0, 119.82], [125.0, 125.54], [127.0, 129.1], [131.0, 133.96], [135.0, 137.29], [140.0, 175.24]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.18, 0.0, 32.71, 31.37, 34.13, 0.0, 99.95, 0.0, 0.0, 98.51, 94.81, 99.78, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 53.44], ["slosh", 7.64], ["gurgling", 7.42]], null, [["speech", 50.44], ["groan", 24.15], ["music", 11.96]], [["music", 21.27], ["speech", 18.02], ["skateboard", 6.06]], [["music", 39.99], ["speech", 12.57], ["livestock, farm animals, working animals", 9.25]], null, null, null, null, null, null, null, null], "duration": [0.5, 0.87, 1.93, 0.01, 0.52, -0.09, 0.59, 1.94, 8.45, 0.76, 13.16, 4.09, 19.28, 0.69, 2.13, 1.82, 0.54, 2.1, 2.96, 2.29, 35.24]} \ No newline at end of file diff --git a/annotations_filtered/cKw1b2-4aeU_filtered.json b/annotations_filtered/cKw1b2-4aeU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bd67ba0d8dc765975e9bd263a5d708fda03cefa --- /dev/null +++ b/annotations_filtered/cKw1b2-4aeU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.24], [8.0, 8.6], [10.0, 10.88], [16.0, 17.85], [23.0, 24.83], [31.0, 31.95], [47.0, 48.12], [66.0, 66.65], [67.0, 71.12], [73.0, 73.77], [76.0, 76.08], [87.0, 92.11], [92.0, 95.25], [96.0, 96.43], [108.0, 108.97], [110.0, 109.85], [117.0, 117.59], [118.0, 119.85], [122.0, 122.69], [125.0, 125.78], [139.0, 139.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [69.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.36, 0.0, 0.0, 40.28, 86.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["creak", 12.66], ["fart", 10.42], ["cattle, bovinae", 6.68]], null, null, null, null, null, null, null, null, null], "duration": [2.24, 0.6, 0.88, 1.85, 1.83, 0.95, 1.12, 0.65, 4.12, 0.77, 0.08, 5.11, 3.25, 0.43, 0.97, -0.15, 0.59, 1.85, 0.69, 0.78, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/cLTBa54o70U_filtered.json b/annotations_filtered/cLTBa54o70U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3166f6655ee6a919c3ff817ad33a1004cbd42f95 --- /dev/null +++ b/annotations_filtered/cLTBa54o70U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [3.0, 3.69], [6.0, 6.81], [7.0, 10.64], [12.0, 13.12], [23.0, 30.91], [35.0, 36.73], [39.0, 41.25], [42.0, 44.71], [46.0, 46.5], [49.0, 53.22], [54.0, 84.43], [85.0, 86.54], [89.0, 88.97], [90.0, 102.12], [103.0, 103.25], [103.0, 103.5], [105.0, 104.79], [106.0, 110.61], [120.0, 119.96]], "keep_status": [false, false, false, true, false, true, false, true, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.67, 0.0, 30.16, 0.0, 32.08, 31.71, 0.0, 38.28, 0.0, 0.0, 0.0, 60.05, 0.0, 0.0, 0.0, 71.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 25.37], ["speech", 14.32], ["moo", 6.99]], null, [["music", 45.25], ["moo", 7.19], ["livestock, farm animals, working animals", 5.8]], null, [["music", 54.86], ["drum machine", 6.04], ["synthesizer", 3.64]], [["music", 36.7], ["speech", 20.39], ["synthesizer", 4.39]], null, [["hum", 43.84], ["mains hum", 17.07], ["vehicle", 6.09]], null, null, null, null, null, null, null, null, null], "duration": [0.5, 0.69, 0.81, 3.64, 1.12, 7.91, 1.73, 2.25, 2.71, 0.5, 4.22, 30.43, 1.54, -0.03, 12.12, 0.25, 0.5, -0.21, 4.61, -0.04]} \ No newline at end of file diff --git a/annotations_filtered/cLYCKmqJApw_filtered.json b/annotations_filtered/cLYCKmqJApw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78a812ad9021a3d1a6212ca2b026c97a9c2eb627 --- /dev/null +++ b/annotations_filtered/cLYCKmqJApw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[63.0, 63.44], [65.0, 73.4], [73.0, 73.79], [74.0, 82.11], [91.0, 91.03], [92.0, 93.51], [94.0, 95.57], [97.0, 97.17], [100.0, 100.21], [104.0, 104.25], [112.0, 113.02], [114.0, 115.5], [116.0, 117.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 72.16, 0.0, 77.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.44, 8.4, 0.79, 8.11, 0.03, 1.51, 1.57, 0.17, 0.21, 0.25, 1.02, 1.5, 1.54]} \ No newline at end of file diff --git a/annotations_filtered/cLc_O-kQOoc_filtered.json b/annotations_filtered/cLc_O-kQOoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04c304ffa14ccd25d006bf4de4805e1eb9125f2f --- /dev/null +++ b/annotations_filtered/cLc_O-kQOoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.86], [22.0, 25.32], [28.0, 36.24], [48.0, 55.09], [61.0, 75.36], [82.0, 88.84], [95.0, 94.66], [95.0, 96.31], [99.0, 107.43], [111.0, 113.37]], "keep_status": [false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 99.48, 95.64, 54.56, 37.57, 36.82, 0.0, 0.0, 33.23, 39.01], "audiomae_on_audioset": [null, null, null, null, [["speech", 37.76], ["music", 22.15], ["whack, thwack", 6.33]], [["music", 39.77], ["speech", 19.19], ["didgeridoo", 18.53]], null, null, [["speech", 60.3], ["music", 16.88], ["hum", 3.81]], [["hum", 29.63], ["speech", 20.16], ["mains hum", 19.35]]], "duration": [0.86, 3.32, 8.24, 7.09, 14.36, 6.84, -0.34, 1.31, 8.43, 2.37]} \ No newline at end of file diff --git a/annotations_filtered/cLm4oCbovsE_filtered.json b/annotations_filtered/cLm4oCbovsE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1cf1e0d4763b799da496d3bfd5015df0ee6e2490 --- /dev/null +++ b/annotations_filtered/cLm4oCbovsE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.98], [3.0, 4.31], [7.0, 8.14], [11.0, 11.48], [12.0, 12.77], [15.0, 15.89], [23.0, 25.34], [28.0, 27.7], [31.0, 32.51], [33.0, 32.61], [48.0, 48.41], [59.0, 59.36], [66.0, 66.34], [85.0, 85.53], [93.0, 95.17], [101.0, 101.58], [113.0, 115.25], [117.0, 117.73], [119.0, 120.19], [124.0, 126.96], [129.0, 129.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.5, 0.0, 38.93, 0.0, 0.0, 97.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 49.02], ["speech", 16.96], ["synthesizer", 10.15]], null, null, null, null, null, null, null, [["music", 58.29], ["scratching (performance technique)", 6.3], ["electronic music", 4.43]], null, [["music", 64.14], ["synthesizer", 6.61], ["musical instrument", 4.62]], null, null, null, null], "duration": [-0.02, 1.31, 1.14, 0.48, 0.77, 0.89, 2.34, -0.3, 1.51, -0.39, 0.41, 0.36, 0.34, 0.53, 2.17, 0.58, 2.25, 0.73, 1.19, 2.96, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/cLomnZIvoFs_filtered.json b/annotations_filtered/cLomnZIvoFs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6ad466d954dcec70ba40773b210babb054e70f6 --- /dev/null +++ b/annotations_filtered/cLomnZIvoFs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 19.53], [20.0, 20.65], [22.0, 24.9], [28.0, 29.71], [32.0, 31.7], [34.0, 34.52], [36.0, 49.5], [53.0, 61.01], [63.0, 66.88], [68.0, 67.8], [80.0, 79.79], [80.0, 79.93], [80.0, 80.0], [92.0, 93.61], [98.0, 99.28], [103.0, 104.18], [109.0, 110.19], [114.0, 115.4], [116.0, 118.34], [122.0, 125.83], [135.0, 136.68], [160.0, 164.29], [203.0, 203.27], [204.0, 207.01], [214.0, 214.79]], "keep_status": [true, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [38.62, 0.0, 68.54, 0.0, 0.0, 0.0, 41.2, 37.12, 38.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.29, 35.13, 0.0, 31.5, 0.0, 32.42, 0.0], "audiomae_on_audioset": [[["music", 34.24], ["hum", 15.42], ["speech", 14.49]], null, null, null, null, null, [["hum", 44.57], ["mains hum", 40.88], ["throbbing", 3.41]], [["hum", 46.05], ["music", 10.21], ["throbbing", 9.64]], [["music", 32.62], ["throbbing", 19.51], ["hum", 17.42]], null, null, null, null, null, null, null, null, null, null, [["music", 27.99], ["speech", 23.79], ["synthesizer", 7.63]], null, [["music", 61.99], ["hum", 5.1], ["mains hum", 5.05]], null, [["music", 51.64], ["speech", 11.06], ["sidetone", 2.8]], null], "duration": [15.53, 0.65, 2.9, 1.71, -0.3, 0.52, 13.5, 8.01, 3.88, -0.2, -0.21, -0.07, 0.0, 1.61, 1.28, 1.18, 1.19, 1.4, 2.34, 3.83, 1.68, 4.29, 0.27, 3.01, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/cM2U8v8OuLo_filtered.json b/annotations_filtered/cM2U8v8OuLo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e9404c78f3a1c298835a42fc914ab384cee5f7b --- /dev/null +++ b/annotations_filtered/cM2U8v8OuLo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.23], [6.0, 5.64], [7.0, 6.59], [8.0, 10.3], [13.0, 14.77], [17.0, 17.58], [21.0, 21.0], [24.0, 24.22], [27.0, 30.43], [32.0, 44.41], [74.0, 74.75], [76.0, 77.16], [78.0, 78.98], [80.0, 81.13], [83.0, 83.59], [85.0, 85.41], [87.0, 87.56], [94.0, 94.0], [98.0, 98.46], [102.0, 102.07], [105.0, 105.11], [107.0, 107.27], [111.0, 112.08], [113.0, 113.44], [114.0, 114.66], [119.0, 122.91]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 41.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 30.82], ["thunk", 15.84], ["hum", 14.03]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.23, -0.36, -0.41, 2.3, 1.77, 0.58, 0.0, 0.22, 3.43, 12.41, 0.75, 1.16, 0.98, 1.13, 0.59, 0.41, 0.56, 0.0, 0.46, 0.07, 0.11, 0.27, 1.08, 0.44, 0.66, 3.91]} \ No newline at end of file diff --git a/annotations_filtered/cMFosgxgPAs_filtered.json b/annotations_filtered/cMFosgxgPAs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b35dd34ab6f79898d56e3b83f0e6fa54924f0ef5 --- /dev/null +++ b/annotations_filtered/cMFosgxgPAs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.2], [19.0, 19.47], [25.0, 25.17], [27.0, 28.85], [31.0, 35.68], [38.0, 38.97], [44.0, 44.93], [52.0, 57.18], [64.0, 65.82], [68.0, 115.74], [117.0, 122.4], [125.0, 131.25], [132.0, 132.07], [134.0, 134.97], [136.0, 137.32], [140.0, 139.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [44.29, 0.0, 0.0, 0.0, 63.96, 0.0, 0.0, 38.41, 0.0, 0.0, 31.14, 30.51, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 38.9], ["throbbing", 26.65], ["music", 13.23]], null, null, null, null, null, null, [["speech", 40.1], ["music", 36.09], ["drum machine", 6.81]], null, null, [["music", 78.09], ["musical instrument", 4.52], ["bass guitar", 3.45]], [["music", 31.42], ["door", 8.28], ["hum", 6.56]], null, null, null, null], "duration": [2.2, 0.47, 0.17, 1.85, 4.68, 0.97, 0.93, 5.18, 1.82, 47.74, 5.4, 6.25, 0.07, 0.97, 1.32, -0.37]} \ No newline at end of file diff --git a/annotations_filtered/cMNvYJ6O_Ks_filtered.json b/annotations_filtered/cMNvYJ6O_Ks_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95b92965b4cb5bb7cf21a395e9f06d9608e27e8d --- /dev/null +++ b/annotations_filtered/cMNvYJ6O_Ks_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.57], [20.0, 20.7], [22.0, 22.62], [29.0, 30.37], [36.0, 37.12], [49.0, 49.5], [56.0, 57.64], [59.0, 60.22], [68.0, 68.54], [72.0, 72.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.57, 0.7, 0.62, 1.37, 1.12, 0.5, 1.64, 1.22, 0.54, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/cMPXArN7f9k_filtered.json b/annotations_filtered/cMPXArN7f9k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..353ea2b2b770f7d0f1655c6ac7f24352d0bf9c96 --- /dev/null +++ b/annotations_filtered/cMPXArN7f9k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.25], [15.0, 16.06], [22.0, 23.04], [23.0, 30.05], [31.0, 37.05], [39.0, 45.67], [48.0, 48.02], [48.0, 50.13], [53.0, 53.28], [65.0, 71.34], [72.0, 73.16], [74.0, 75.39], [77.0, 92.67], [95.0, 96.94], [98.0, 111.1], [111.0, 113.04], [115.0, 115.15], [116.0, 115.87], [116.0, 119.65], [120.0, 119.74], [120.0, 121.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [59.59, 0.0, 0.0, 66.03, 94.52, 78.21, 0.0, 51.6, 0.0, 80.64, 0.0, 0.0, 99.97, 0.0, 95.09, 91.47, 0.0, 0.0, 59.77, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.25, 1.06, 1.04, 7.05, 6.05, 6.67, 0.02, 2.13, 0.28, 6.34, 1.16, 1.39, 15.67, 1.94, 13.1, 2.04, 0.15, -0.13, 3.65, -0.26, 1.47]} \ No newline at end of file diff --git a/annotations_filtered/cMmi5sRe8wc_filtered.json b/annotations_filtered/cMmi5sRe8wc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a2ad2f4741363a21b13cd179e1e8bf7b5af32c31 --- /dev/null +++ b/annotations_filtered/cMmi5sRe8wc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.07], [13.0, 13.29], [15.0, 14.94], [17.0, 17.17], [30.0, 30.77], [37.0, 37.0], [43.0, 43.83], [47.0, 47.82], [50.0, 50.52], [52.0, 56.91], [57.0, 69.26], [72.0, 72.2], [75.0, 79.42], [81.0, 113.44], [114.0, 128.44], [132.0, 132.29], [134.0, 150.55], [155.0, 168.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.66, 30.47, 0.0, 31.6, 0.0, 37.78, 0.0, 38.94, 35.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["hum", 50.86], ["mains hum", 15.56], ["speech", 8.61]], [["hum", 14.49], ["music", 7.68], ["speech", 7.28]], null, [["music", 26.62], ["buzz", 13.62], ["sound effect", 7.99]], null, [["music", 81.45], ["scary music", 2.29], ["soundtrack music", 1.77]], null, [["music", 64.15], ["hum", 6.81], ["gong", 5.72]], [["music", 81.79], ["ambient music", 4.82], ["electronic music", 2.67]]], "duration": [1.07, 0.29, -0.06, 0.17, 0.77, 0.0, 0.83, 0.82, 0.52, 4.91, 12.26, 0.2, 4.42, 32.44, 14.44, 0.29, 16.55, 13.84]} \ No newline at end of file diff --git a/annotations_filtered/cMnkhxzCLyA_filtered.json b/annotations_filtered/cMnkhxzCLyA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1e59f79786bdd9e1b77bb65d067de8a2866dcd4 --- /dev/null +++ b/annotations_filtered/cMnkhxzCLyA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.29], [12.0, 12.85], [18.0, 18.96], [22.0, 23.14], [26.0, 53.45]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.61], "audiomae_on_audioset": [null, null, null, null, [["music", 90.65], ["musical instrument", 1.67], ["electronic music", 1.46]]], "duration": [0.29, 0.85, 0.96, 1.14, 27.45]} \ No newline at end of file diff --git a/annotations_filtered/cMwOJoesx8M_filtered.json b/annotations_filtered/cMwOJoesx8M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..afcc141680a926b75cd5b63aac0913790272d7a8 --- /dev/null +++ b/annotations_filtered/cMwOJoesx8M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.63], [9.0, 9.51], [12.0, 12.95], [14.0, 14.25], [19.0, 19.65], [21.0, 21.29], [23.0, 25.62], [30.0, 30.23], [38.0, 38.37], [41.0, 41.74], [62.0, 63.73], [66.0, 67.17], [70.0, 70.77], [72.0, 72.59], [75.0, 76.94], [79.0, 79.2], [83.0, 83.19], [86.0, 88.1], [92.0, 93.06], [103.0, 103.1], [105.0, 106.64], [108.0, 108.62], [110.0, 112.94], [115.0, 123.87], [125.0, 126.23], [129.0, 130.76], [131.0, 132.19], [133.0, 133.96], [135.0, 137.3], [138.0, 138.86], [141.0, 143.5], [146.0, 147.61], [151.0, 151.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.45, 0.0, 0.0, 0.0, 0.0, 94.95, 72.16, 0.0, 0.0, 0.0, 0.0, 62.47, 0.0, 68.41, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.63, 0.51, 0.95, 0.25, 0.65, 0.29, 2.62, 0.23, 0.37, 0.74, 1.73, 1.17, 0.77, 0.59, 1.94, 0.2, 0.19, 2.1, 1.06, 0.1, 1.64, 0.62, 2.94, 8.87, 1.23, 1.76, 1.19, 0.96, 2.3, 0.86, 2.5, 1.61, 0.55]} \ No newline at end of file diff --git a/annotations_filtered/cMxPAkZgoy0_filtered.json b/annotations_filtered/cMxPAkZgoy0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a721a4690ebd1b1ce455ad610d7fc34f73cf3759 --- /dev/null +++ b/annotations_filtered/cMxPAkZgoy0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.69], [6.0, 7.26], [8.0, 9.1], [13.0, 26.0], [28.0, 31.18], [40.0, 41.3], [43.0, 42.92], [55.0, 55.09], [59.0, 60.83], [62.0, 63.49], [64.0, 65.85], [67.0, 69.62], [70.0, 72.27], [73.0, 75.0], [76.0, 81.08], [83.0, 85.78], [86.0, 88.89], [90.0, 105.27], [107.0, 111.89], [114.0, 114.42], [119.0, 119.8], [122.0, 122.32]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, true, true, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.93, 33.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.72, 36.35, 36.58, 31.99, 34.32, 33.22, 30.29, 30.85, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 22.61], ["vehicle", 6.43], ["whack, thwack", 5.68]], [["speech", 63.99], ["outside, urban or manmade", 5.25], ["crowd", 4.75]], null, null, null, null, null, null, [["fly, housefly", 32.28], ["insect", 27.47], ["bee, wasp, etc.", 21.1]], [["speech", 66.22], ["animal", 4.82], ["dog", 4.32]], [["speech", 53.18], ["music", 5.04], ["sidetone", 4.4]], [["speech", 49.08], ["run", 7.74], ["animal", 7.65]], [["speech", 45.81], ["music", 4.13], ["cattle, bovinae", 3.3]], [["speech", 59.33], ["crowd", 8.07], ["cheering", 7.14]], [["speech", 43.28], ["crowd", 4.44], ["outside, urban or manmade", 3.81]], [["cheering", 34.74], ["crowd", 27.95], ["speech", 14.73]], null, null, null], "duration": [-0.31, 1.26, 1.1, 13.0, 3.18, 1.3, -0.08, 0.09, 1.83, 1.49, 1.85, 2.62, 2.27, 2.0, 5.08, 2.78, 2.89, 15.27, 4.89, 0.42, 0.8, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/cNLFuTms4go_filtered.json b/annotations_filtered/cNLFuTms4go_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82fbc49503690c0f3babdd98e9a849e4e4ba3371 --- /dev/null +++ b/annotations_filtered/cNLFuTms4go_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.34], [5.0, 5.04], [18.0, 20.12], [21.0, 28.76], [32.0, 33.57], [34.0, 42.72], [46.0, 47.36], [48.0, 50.08], [52.0, 52.95], [58.0, 59.37], [60.0, 61.42], [62.0, 63.56], [65.0, 66.39], [68.0, 68.86], [70.0, 70.04], [72.0, 78.16], [80.0, 81.43], [82.0, 84.37], [85.0, 87.86], [89.0, 89.77], [90.0, 91.02], [91.0, 92.15], [93.0, 96.62], [98.0, 104.14], [108.0, 109.81], [117.0, 117.1], [118.0, 120.16], [121.0, 121.15], [122.0, 125.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.62, 97.11, 0.0, 61.18, 0.0, 54.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.07, 0.0, 70.02, 61.47, 0.0, 0.0, 0.0, 69.07, 73.06, 0.0, 0.0, 56.33, 0.0, 82.79], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.34, 0.04, 2.12, 7.76, 1.57, 8.72, 1.36, 2.08, 0.95, 1.37, 1.42, 1.56, 1.39, 0.86, 0.04, 6.16, 1.43, 2.37, 2.86, 0.77, 1.02, 1.15, 3.62, 6.14, 1.81, 0.1, 2.16, 0.15, 3.56]} \ No newline at end of file diff --git a/annotations_filtered/cNOsA4nH8yE_filtered.json b/annotations_filtered/cNOsA4nH8yE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c2790a8b7fbeacfb2c797462c833826d3f267c5 --- /dev/null +++ b/annotations_filtered/cNOsA4nH8yE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.97], [3.0, 4.31], [5.0, 5.22], [5.0, 6.27], [9.0, 13.14], [16.0, 17.27], [18.0, 19.82], [21.0, 20.83], [23.0, 22.94], [23.0, 24.7], [29.0, 28.88], [30.0, 33.81], [36.0, 35.77], [36.0, 36.56], [37.0, 37.29], [38.0, 37.72], [40.0, 40.56], [45.0, 45.5], [50.0, 50.13], [52.0, 59.8], [67.0, 67.24], [69.0, 69.87], [70.0, 71.15], [72.0, 72.47], [73.0, 73.99], [75.0, 75.37], [76.0, 76.49], [78.0, 83.51], [84.0, 83.59], [84.0, 83.66], [84.0, 83.89], [89.0, 89.97]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.33, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 38.66], ["music", 23.83], ["radio", 5.76]], null, null, null, null, null, null, [["speech", 85.83], ["sidetone", 4.53], ["radio", 1.46]], null, null, null, null, null, null, null, [["speech", 58.06], ["music", 16.58], ["electric shaver, electric razor", 10.52]], null, null, null, null, null, null, null, [["speech", 78.86], ["music", 6.16], ["electric shaver, electric razor", 1.99]], null, null, null, null], "duration": [-0.03, 1.31, 0.22, 1.27, 4.14, 1.27, 1.82, -0.17, -0.06, 1.7, -0.12, 3.81, -0.23, 0.56, 0.29, -0.28, 0.56, 0.5, 0.13, 7.8, 0.24, 0.87, 1.15, 0.47, 0.99, 0.37, 0.49, 5.51, -0.41, -0.34, -0.11, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/cNW7dRdPPC8_filtered.json b/annotations_filtered/cNW7dRdPPC8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e8679c8d0755b4ac9331a6e043f5561e900282e --- /dev/null +++ b/annotations_filtered/cNW7dRdPPC8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.07], [8.0, 8.36], [11.0, 11.65], [18.0, 18.47], [19.0, 20.16], [22.0, 22.98], [24.0, 24.51], [25.0, 27.65], [28.0, 33.12], [38.0, 38.15], [40.0, 44.17], [46.0, 50.11], [52.0, 52.3], [54.0, 54.6], [58.0, 61.38], [63.0, 62.92], [64.0, 64.29], [69.0, 70.12], [72.0, 72.17], [73.0, 74.58], [76.0, 76.64], [77.0, 77.23], [79.0, 79.46], [81.0, 81.43], [82.0, 83.17], [86.0, 87.42], [90.0, 90.66], [95.0, 96.26], [97.0, 103.1], [104.0, 104.52], [106.0, 108.94], [112.0, 116.77], [117.0, 117.39], [118.0, 119.72], [120.0, 122.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.93, 0.0, 100.0, 99.99, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 52.98, 99.59, 0.0, 0.0, 75.72], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.07, 0.36, 0.65, 0.47, 1.16, 0.98, 0.51, 2.65, 5.12, 0.15, 4.17, 4.11, 0.3, 0.6, 3.38, -0.08, 0.29, 1.12, 0.17, 1.58, 0.64, 0.23, 0.46, 0.43, 1.17, 1.42, 0.66, 1.26, 6.1, 0.52, 2.94, 4.77, 0.39, 1.72, 2.47]} \ No newline at end of file diff --git a/annotations_filtered/cNiuEFffzf4_filtered.json b/annotations_filtered/cNiuEFffzf4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ba8eb823511564d72a3a46db438d99af92c16e4 --- /dev/null +++ b/annotations_filtered/cNiuEFffzf4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.47], [7.0, 9.66], [11.0, 12.26], [13.0, 18.12], [20.0, 21.76], [24.0, 25.39], [26.0, 27.26], [31.0, 31.68], [32.0, 33.13], [34.0, 35.77], [36.0, 38.92], [42.0, 43.39], [44.0, 45.86], [49.0, 51.02], [54.0, 54.51], [56.0, 60.89], [62.0, 63.05], [65.0, 65.45], [68.0, 68.72], [70.0, 74.73], [75.0, 75.46], [76.0, 78.02], [81.0, 81.18], [83.0, 85.35], [86.0, 87.13], [89.0, 90.04], [93.0, 92.64], [93.0, 95.64], [98.0, 98.91], [100.0, 103.1], [105.0, 105.63], [111.0, 111.2], [112.0, 113.41], [116.0, 116.82], [119.0, 119.65], [124.0, 125.02], [129.0, 129.69], [131.0, 132.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.99, 0.0, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.59, 0.0, 0.0, 99.21, 0.0, 99.96, 0.0, 0.0, 0.0, 99.99, 0.0, 99.96, 0.0, 99.98, 0.0, 0.0, 0.0, 99.88, 0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 2.66, 1.26, 5.12, 1.76, 1.39, 1.26, 0.68, 1.13, 1.77, 2.92, 1.39, 1.86, 2.02, 0.51, 4.89, 1.05, 0.45, 0.72, 4.73, 0.46, 2.02, 0.18, 2.35, 1.13, 1.04, -0.36, 2.64, 0.91, 3.1, 0.63, 0.2, 1.41, 0.82, 0.65, 1.02, 0.69, 1.16]} \ No newline at end of file diff --git a/annotations_filtered/cNqSc_WsRJ4_filtered.json b/annotations_filtered/cNqSc_WsRJ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84258410ea225fce52aad66ea3ae8e04c30bee78 --- /dev/null +++ b/annotations_filtered/cNqSc_WsRJ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 17.17], [21.0, 22.94], [25.0, 25.35], [26.0, 27.62], [28.0, 28.63], [32.0, 32.98], [37.0, 37.44], [40.0, 40.93], [47.0, 49.42], [51.0, 51.81], [54.0, 55.39], [58.0, 57.84], [59.0, 59.59], [61.0, 61.84], [68.0, 68.61], [70.0, 70.17], [74.0, 74.41], [76.0, 78.76], [80.0, 80.43], [81.0, 81.4], [82.0, 84.65], [86.0, 88.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [54.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 82.07, 82.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.17, 1.94, 0.35, 1.62, 0.63, 0.98, 0.44, 0.93, 2.42, 0.81, 1.39, -0.16, 0.59, 0.84, 0.61, 0.17, 0.41, 2.76, 0.43, 0.4, 2.65, 2.62]} \ No newline at end of file diff --git a/annotations_filtered/cNqstBuw5ZY_filtered.json b/annotations_filtered/cNqstBuw5ZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..608276f95538671894e5ab0866ec899de7593118 --- /dev/null +++ b/annotations_filtered/cNqstBuw5ZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.09], [12.0, 12.16], [12.0, 21.83], [22.0, 23.21], [24.0, 76.65], [79.0, 98.49], [99.0, 99.76], [100.0, 103.55], [105.0, 105.06], [106.0, 106.34], [109.0, 112.31], [113.0, 119.37], [120.0, 120.78]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 58.47, 0.0, 0.0, 37.49, 0.0, 57.32, 0.0, 0.0, 100.0, 84.43, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["beatboxing", 29.11], ["wail, moan", 18.21], ["music", 8.74]], null, null, null, null, null, null, null], "duration": [0.09, 0.16, 9.83, 1.21, 52.65, 19.49, 0.76, 3.55, 0.06, 0.34, 3.31, 6.37, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/cOE2gQrXchk_filtered.json b/annotations_filtered/cOE2gQrXchk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83eb21409bb5c023c0e49a62ecd126cf16988f4a --- /dev/null +++ b/annotations_filtered/cOE2gQrXchk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 29.78], [30.0, 35.24], [36.0, 37.32], [39.0, 39.46], [40.0, 41.15], [42.0, 44.36], [46.0, 47.38], [48.0, 49.3], [50.0, 50.57], [51.0, 51.41], [52.0, 53.4], [56.0, 59.48], [60.0, 61.82], [62.0, 66.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 56.78, 0.0, 0.0, 0.0, 66.03, 0.0, 0.0, 0.0, 0.0, 0.0, 59.51, 0.0, 38.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 24.0], ["fly, housefly", 17.45], ["insect", 9.84]]], "duration": [0.78, 5.24, 1.32, 0.46, 1.15, 2.36, 1.38, 1.3, 0.57, 0.41, 1.4, 3.48, 1.82, 4.31]} \ No newline at end of file diff --git a/annotations_filtered/cOXVnmVPdtQ_filtered.json b/annotations_filtered/cOXVnmVPdtQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..353f86007e19b7ef7c45740d47b9cd0bbf18f1b3 --- /dev/null +++ b/annotations_filtered/cOXVnmVPdtQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.98], [5.0, 5.85], [8.0, 8.21], [9.0, 10.86], [13.0, 15.01], [16.0, 18.3], [21.0, 22.76], [26.0, 30.82], [34.0, 43.83], [45.0, 46.06], [48.0, 48.41], [49.0, 50.25], [54.0, 56.32], [59.0, 60.83], [62.0, 62.33], [64.0, 68.22], [69.0, 70.83], [72.0, 73.13], [74.0, 75.56], [77.0, 99.13], [100.0, 102.17], [103.0, 103.76], [106.0, 106.96], [107.0, 108.65], [109.0, 111.7], [112.0, 114.32], [115.0, 115.75], [117.0, 123.09], [123.0, 126.44], [127.0, 129.91], [130.0, 141.89], [142.0, 143.63], [145.0, 146.62], [150.0, 152.47]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.84, 35.93, 0.0, 31.74, 32.86, 0.0, 0.0, 0.0, 62.89, 0.0, 0.0, 48.19, 0.0, 0.0, 0.0, 95.64, 100.0, 0.0, 0.0, 0.0, 97.73, 99.93, 0.0, 98.99, 86.82, 97.54, 82.79, 0.0, 0.0, 92.97], "audiomae_on_audioset": [null, null, null, null, [["music", 68.77], ["guitar", 5.16], ["musical instrument", 4.97]], [["music", 47.69], ["speech", 13.17], ["musical instrument", 7.25]], null, [["music", 76.96], ["theremin", 5.9], ["synthesizer", 2.44]], [["music", 65.6], ["animal", 9.74], ["dog", 5.86]], null, null, null, null, null, null, [["music", 34.04], ["speech", 8.29], ["musical instrument", 7.83]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.02, 0.85, 0.21, 1.86, 2.01, 2.3, 1.76, 4.82, 9.83, 1.06, 0.41, 1.25, 2.32, 1.83, 0.33, 4.22, 1.83, 1.13, 1.56, 22.13, 2.17, 0.76, 0.96, 1.65, 2.7, 2.32, 0.75, 6.09, 3.44, 2.91, 11.89, 1.63, 1.62, 2.47]} \ No newline at end of file diff --git a/annotations_filtered/cOyt0_sRRvU_filtered.json b/annotations_filtered/cOyt0_sRRvU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96eb0a11b8364a0bf39dd3bb7f8c8e82be24a318 --- /dev/null +++ b/annotations_filtered/cOyt0_sRRvU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 12.83], [14.0, 13.93], [14.0, 18.39], [19.0, 19.7], [22.0, 23.23], [24.0, 25.19], [32.0, 32.02], [34.0, 34.84], [36.0, 37.44], [39.0, 40.14], [42.0, 46.38], [48.0, 47.95], [48.0, 48.05], [49.0, 50.52], [51.0, 52.76], [54.0, 59.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [68.54, 0.0, 68.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.1, 0.0, 0.0, 0.0, 0.0, 86.09], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.83, -0.07, 4.39, 0.7, 1.23, 1.19, 0.02, 0.84, 1.44, 1.14, 4.38, -0.05, 0.05, 1.52, 1.76, 5.07]} \ No newline at end of file diff --git a/annotations_filtered/cP4Q_O_ZKWA_filtered.json b/annotations_filtered/cP4Q_O_ZKWA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7d7555a941992c6b3b971e1d43b9800d8ddb217 --- /dev/null +++ b/annotations_filtered/cP4Q_O_ZKWA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.9], [10.0, 10.99], [12.0, 12.56], [13.0, 15.58], [16.0, 58.09], [60.0, 94.39], [100.0, 108.68], [111.0, 114.13]], "keep_status": [false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 92.97, 0.0, 0.0, 29.58, 30.78], "audiomae_on_audioset": [null, null, null, null, null, null, [["whack, thwack", 13.74], ["groan", 12.5], ["music", 7.58]], [["cattle, bovinae", 29.78], ["livestock, farm animals, working animals", 18.27], ["music", 18.07]]], "duration": [0.9, 0.99, 0.56, 2.58, 42.09, 34.39, 8.68, 3.13]} \ No newline at end of file diff --git a/annotations_filtered/cP63R4QwDFI_filtered.json b/annotations_filtered/cP63R4QwDFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c88e7e67d34e603efe0b6ad9aa38ccc79c459a10 --- /dev/null +++ b/annotations_filtered/cP63R4QwDFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.75], [6.0, 8.5], [10.0, 13.22], [15.0, 18.01], [21.0, 24.83], [29.0, 37.34], [40.0, 43.9], [46.0, 50.75], [52.0, 55.49]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.97, 91.81, 78.89, 66.63, 56.55, 38.94, 38.0, 59.86], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 62.71], ["timpani", 4.36], ["percussion", 4.21]], [["music", 39.4], ["rumble", 20.71], ["gong", 11.48]], null], "duration": [1.75, 2.5, 3.22, 3.01, 3.83, 8.34, 3.9, 4.75, 3.49]} \ No newline at end of file diff --git a/annotations_filtered/cP7WEGuVwig_filtered.json b/annotations_filtered/cP7WEGuVwig_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08971460c597a28dd6bcfe2aa31930286054d6d0 --- /dev/null +++ b/annotations_filtered/cP7WEGuVwig_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 48.54], [50.0, 71.39], [72.0, 87.66], [90.0, 163.22], [164.0, 165.54], [167.0, 167.64]], "keep_status": [false, false, false, false, false, false], "silence_prob": [31.21, 30.96, 30.5, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 40.62], ["speech", 34.56], ["throbbing", 2.93]], [["music", 32.17], ["hum", 28.75], ["throbbing", 10.8]], [["throbbing", 37.16], ["hum", 24.59], ["music", 17.57]], null, null, null], "duration": [27.54, 21.39, 15.66, 73.22, 1.54, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/cPVM14Bnf5I_filtered.json b/annotations_filtered/cPVM14Bnf5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5bcc8444a315fae40c02b637ae575d10c2088285 --- /dev/null +++ b/annotations_filtered/cPVM14Bnf5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.27], [12.0, 13.88], [17.0, 17.25], [21.0, 20.98], [23.0, 23.82], [26.0, 26.79], [33.0, 42.26], [46.0, 48.41], [55.0, 63.63], [67.0, 68.13], [68.0, 71.05], [79.0, 82.81], [85.0, 86.02], [87.0, 87.88], [90.0, 106.17], [107.0, 121.95], [122.0, 122.71], [124.0, 124.51], [138.0, 157.08], [161.0, 161.64]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.52, 34.14, 33.46, 0.0, 33.23, 30.71, 0.0, 0.0, 30.68, 30.73, 0.0, 0.0, 31.18, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 31.93], ["music", 8.28], ["explosion", 7.97]], [["music", 42.17], ["throbbing", 5.59], ["speech", 3.25]], [["speech", 54.65], ["music", 15.16], ["hum", 8.17]], null, [["music", 67.81], ["musical instrument", 3.11], ["didgeridoo", 3.08]], [["music", 44.89], ["speech", 7.31], ["musical instrument", 3.74]], null, null, [["cattle, bovinae", 39.41], ["moo", 32.64], ["music", 10.07]], [["music", 56.01], ["electronic music", 11.31], ["techno", 5.62]], null, null, [["music", 78.01], ["musical instrument", 2.45], ["theremin", 1.35]], null], "duration": [0.27, 1.88, 0.25, -0.02, 0.82, 0.79, 9.26, 2.41, 8.63, 1.13, 3.05, 3.81, 1.02, 0.88, 16.17, 14.95, 0.71, 0.51, 19.08, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/cPYdLs7RRRc_filtered.json b/annotations_filtered/cPYdLs7RRRc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bdcbee687126ada12fd0b17d3ed4158008e9b28c --- /dev/null +++ b/annotations_filtered/cPYdLs7RRRc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.32], [17.0, 20.07], [21.0, 22.74], [24.0, 26.91], [29.0, 32.91], [34.0, 39.65], [41.0, 42.8], [44.0, 45.93], [47.0, 49.28], [50.0, 58.35], [59.0, 90.32], [91.0, 91.47], [92.0, 93.07], [94.0, 94.59], [95.0, 96.35], [97.0, 102.44], [103.0, 102.79], [104.0, 110.74], [112.0, 115.89], [116.0, 117.36], [118.0, 119.21], [119.0, 124.7], [125.0, 125.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [87.55, 99.4, 0.0, 99.95, 100.0, 99.95, 0.0, 0.0, 99.98, 99.26, 0.0, 0.0, 0.0, 0.0, 0.0, 75.39, 0.0, 78.72, 99.87, 0.0, 0.0, 87.55, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.32, 3.07, 1.74, 2.91, 3.91, 5.65, 1.8, 1.93, 2.28, 8.35, 31.32, 0.47, 1.07, 0.59, 1.35, 5.44, -0.21, 6.74, 3.89, 1.36, 1.21, 5.7, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/cP_OM5VVcSo_filtered.json b/annotations_filtered/cP_OM5VVcSo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d02ce231d346bc572bb151dbff7dc22d57ddd574 --- /dev/null +++ b/annotations_filtered/cP_OM5VVcSo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.92], [14.0, 15.13], [18.0, 17.91], [32.0, 36.27], [39.0, 39.72], [43.0, 43.92], [44.0, 58.01], [61.0, 61.3], [63.0, 63.07], [65.0, 71.24], [76.0, 76.06], [80.0, 80.84], [85.0, 85.55], [86.0, 138.42], [146.0, 146.28], [149.0, 149.01], [150.0, 151.33], [152.0, 154.62]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.62, 0.0, 0.0, 30.42, 0.0, 0.0, 30.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.11], "audiomae_on_audioset": [null, null, null, [["speech", 21.95], ["fart", 12.63], ["music", 11.89]], null, null, [["music", 74.96], ["boing", 4.89], ["guitar", 2.04]], null, null, [["music", 75.57], ["musical instrument", 4.43], ["cacophony", 3.61]], null, null, null, null, null, null, null, [["moo", 26.35], ["cattle, bovinae", 24.57], ["livestock, farm animals, working animals", 19.47]]], "duration": [1.92, 1.13, -0.09, 4.27, 0.72, 0.92, 14.01, 0.3, 0.07, 6.24, 0.06, 0.84, 0.55, 52.42, 0.28, 0.01, 1.33, 2.62]} \ No newline at end of file diff --git a/annotations_filtered/cPfMxQLlirI_filtered.json b/annotations_filtered/cPfMxQLlirI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..614ffca2ff2f5acb7813840aabae8dfd0d68056a --- /dev/null +++ b/annotations_filtered/cPfMxQLlirI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.16], [25.0, 26.33], [30.0, 39.09], [41.0, 42.08], [43.0, 63.49], [69.0, 70.06], [71.0, 74.68], [76.0, 89.99], [93.0, 98.86], [100.0, 104.16], [105.0, 105.38], [107.0, 109.02], [112.0, 114.51], [119.0, 121.85], [123.0, 123.52], [126.0, 130.1], [132.0, 131.68]], "keep_status": [false, false, true, false, true, false, true, false, false, true, false, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 32.51, 0.0, 32.1, 0.0, 29.07, 29.83, 29.45, 29.17, 0.0, 41.62, 56.63, 38.64, 0.0, 56.33, 0.0], "audiomae_on_audioset": [null, null, [["hum", 23.49], ["mains hum", 20.91], ["music", 15.01]], null, [["music", 29.55], ["noise", 12.15], ["boing", 11.28]], null, [["hum", 34.72], ["mains hum", 14.81], ["music", 13.7]], [["music", 74.16], ["theremin", 4.84], ["hum", 3.38]], [["music", 54.88], ["hum", 8.43], ["mains hum", 7.02]], [["music", 41.69], ["explosion", 6.7], ["boom", 5.18]], null, [["speech", 33.34], ["hum", 16.45], ["music", 9.98]], null, [["thunk", 39.42], ["whack, thwack", 18.91], ["music", 6.76]], null, null, null], "duration": [1.16, 1.33, 9.09, 1.08, 20.49, 1.06, 3.68, 13.99, 5.86, 4.16, 0.38, 2.02, 2.51, 2.85, 0.52, 4.1, -0.32]} \ No newline at end of file diff --git a/annotations_filtered/cPooLABE6Js_filtered.json b/annotations_filtered/cPooLABE6Js_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5e04d5c2ab7764b7b475fe9b73b3cdad2e1b4d1 --- /dev/null +++ b/annotations_filtered/cPooLABE6Js_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.05], [11.0, 11.96], [13.0, 12.8], [14.0, 15.97], [18.0, 17.9], [21.0, 21.36], [26.0, 27.24], [28.0, 35.78], [54.0, 56.86], [65.0, 65.35], [76.0, 78.68], [79.0, 80.23], [82.0, 84.05], [88.0, 89.6], [91.0, 92.84], [96.0, 96.6], [104.0, 104.57], [108.0, 109.0], [111.0, 111.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.07, 51.88, 0.0, 97.54, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.05, 0.96, -0.2, 1.97, -0.1, 0.36, 1.24, 7.78, 2.86, 0.35, 2.68, 1.23, 2.05, 1.6, 1.84, 0.6, 0.57, 1.0, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/cPsIU9BTbcQ_filtered.json b/annotations_filtered/cPsIU9BTbcQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..345570b3c60ccd0019e02a111cd90f3c717fa875 --- /dev/null +++ b/annotations_filtered/cPsIU9BTbcQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.83], [15.0, 15.77], [17.0, 18.77], [21.0, 31.43], [33.0, 51.19], [53.0, 61.13], [64.0, 64.5], [66.0, 78.8]], "keep_status": [false, false, false, true, true, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 29.16, 32.51, 33.27, 0.0, 34.17], "audiomae_on_audioset": [null, null, null, [["vehicle", 31.49], ["music", 10.71], ["race car, auto racing", 8.39]], [["hum", 28.19], ["mains hum", 12.58], ["vehicle", 10.14]], [["music", 37.38], ["speech", 18.97], ["synthesizer", 13.05]], null, [["music", 35.43], ["throbbing", 6.22], ["hum", 6.08]]], "duration": [1.83, 0.77, 1.77, 10.43, 18.19, 8.13, 0.5, 12.8]} \ No newline at end of file diff --git a/annotations_filtered/cQ_dL_IMPP4_filtered.json b/annotations_filtered/cQ_dL_IMPP4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b5fdd6df7c9269fdbe46895dbd553577ae4e4b2 --- /dev/null +++ b/annotations_filtered/cQ_dL_IMPP4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.8], [1.0, 2.1], [6.0, 6.69], [12.0, 12.46], [14.0, 16.02], [16.0, 17.37], [24.0, 25.12], [26.0, 26.69], [30.0, 30.7], [35.0, 35.75], [58.0, 82.11], [86.0, 86.12], [87.0, 93.87], [97.0, 97.66], [98.0, 106.15], [107.0, 108.16], [111.0, 111.08], [115.0, 115.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 73.06, 0.0, 0.0, 0.0, 0.0, 0.0, 33.19, 0.0, 36.08, 0.0, 39.86, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 58.42], ["theremin", 14.78], ["musical instrument", 4.39]], null, [["music", 50.86], ["speech", 16.55], ["smash, crash", 4.69]], null, [["speech", 55.95], ["music", 16.02], ["didgeridoo", 5.79]], null, null, null], "duration": [-0.2, 1.1, 0.69, 0.46, 2.02, 1.37, 1.12, 0.69, 0.7, 0.75, 24.11, 0.12, 6.87, 0.66, 8.15, 1.16, 0.08, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/cRZ7bc3nqwA_filtered.json b/annotations_filtered/cRZ7bc3nqwA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56265cb3018d1f2a53ca4a47c9a75b25f9147d53 --- /dev/null +++ b/annotations_filtered/cRZ7bc3nqwA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 42.79], [50.0, 50.26], [51.0, 52.32], [54.0, 56.57], [60.0, 61.11], [66.0, 68.64], [69.0, 71.49], [72.0, 81.99], [85.0, 112.5], [121.0, 122.98], [125.0, 125.39], [135.0, 138.92], [139.0, 140.85], [147.0, 152.19], [165.0, 164.66], [167.0, 169.28], [170.0, 180.45], [181.0, 183.19]], "keep_status": [false, false, false, true, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.13, 0.0, 33.0, 64.75, 31.15, 33.61, 0.0, 0.0, 52.39, 0.0, 57.64, 0.0, 83.88, 37.15, 50.02], "audiomae_on_audioset": [null, null, null, [["hum", 29.24], ["music", 25.0], ["mains hum", 13.97]], null, [["speech", 69.37], ["hum", 8.07], ["music", 3.92]], null, [["music", 34.49], ["hum", 19.83], ["mains hum", 7.6]], [["music", 34.38], ["hum", 8.29], ["speech", 7.92]], null, null, null, null, null, null, null, [["music", 71.89], ["scary music", 7.09], ["ambient music", 3.94]], null], "duration": [1.79, 0.26, 1.32, 2.57, 1.11, 2.64, 2.49, 9.99, 27.5, 1.98, 0.39, 3.92, 1.85, 5.19, -0.34, 2.28, 10.45, 2.19]} \ No newline at end of file diff --git a/annotations_filtered/cRoIsrSzapo_filtered.json b/annotations_filtered/cRoIsrSzapo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8fc6e390466d1daaae70a889c466b5f70d7862a --- /dev/null +++ b/annotations_filtered/cRoIsrSzapo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.55], [6.0, 7.92], [10.0, 12.07], [14.0, 15.84], [17.0, 17.69], [18.0, 18.94], [24.0, 30.86], [32.0, 33.44], [35.0, 40.24], [43.0, 58.85], [61.0, 60.98], [62.0, 65.62], [67.0, 69.15], [73.0, 73.01], [75.0, 79.88], [81.0, 85.01], [87.0, 87.79], [89.0, 90.1], [91.0, 92.16], [93.0, 93.41], [96.0, 96.72], [98.0, 100.36], [102.0, 102.64], [104.0, 104.79], [106.0, 107.37], [109.0, 109.38], [110.0, 111.13], [112.0, 112.21], [113.0, 113.22], [115.0, 118.76]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 38.75, 0.0, 0.0, 0.0, 32.91, 0.0, 54.63, 30.65, 0.0, 58.81, 99.48, 0.0, 29.7, 31.71, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.85], "audiomae_on_audioset": [null, null, [["siren", 25.36], ["civil defense siren", 18.09], ["music", 5.79]], null, null, null, [["electric shaver, electric razor", 24.11], ["music", 20.81], ["speech", 10.7]], null, null, [["music", 58.62], ["didgeridoo", 22.7], ["sound effect", 1.61]], null, null, null, null, [["speech", 34.81], ["hum", 13.07], ["explosion", 9.78]], [["burping, eructation", 97.9], ["music", 0.25], ["throbbing", 0.23]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["sound effect", 51.42], ["boing", 8.51], ["whack, thwack", 5.26]]], "duration": [0.55, 1.92, 2.07, 1.84, 0.69, 0.94, 6.86, 1.44, 5.24, 15.85, -0.02, 3.62, 2.15, 0.01, 4.88, 4.01, 0.79, 1.1, 1.16, 0.41, 0.72, 2.36, 0.64, 0.79, 1.37, 0.38, 1.13, 0.21, 0.22, 3.76]} \ No newline at end of file diff --git a/annotations_filtered/cRpMdH1D55o_filtered.json b/annotations_filtered/cRpMdH1D55o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b901190dd83cd1d81433d87da4b87d07cbac3b7c --- /dev/null +++ b/annotations_filtered/cRpMdH1D55o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.64], [5.0, 6.66], [8.0, 33.56], [34.0, 35.33], [36.0, 37.05], [39.0, 38.91], [40.0, 40.93], [42.0, 42.74], [43.0, 44.31], [45.0, 50.45], [53.0, 52.86], [54.0, 58.02], [58.0, 58.24], [58.0, 60.93], [62.0, 65.91], [69.0, 73.09], [76.0, 79.27], [82.0, 96.94], [97.0, 99.57], [100.0, 102.47], [103.0, 113.07], [118.0, 120.53], [122.0, 128.65], [133.0, 137.98], [138.0, 150.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 75.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.44, 0.0, 28.56, 0.0, 28.64, 28.66, 28.24, 29.42, 29.06, 42.53, 42.93, 39.7, 37.68, 90.6, 57.48, 94.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 58.8], ["theremin", 11.55], ["ambient music", 3.96]], null, [["foghorn", 47.94], ["music", 23.86], ["gong", 8.35]], null, [["noise", 13.77], ["electric shaver, electric razor", 10.79], ["music", 7.16]], [["music", 26.62], ["foghorn", 7.11], ["hum", 3.96]], [["foghorn", 24.48], ["music", 22.73], ["trombone", 16.63]], [["theremin", 38.67], ["foghorn", 28.93], ["music", 10.83]], [["theremin", 58.48], ["music", 25.22], ["buzz", 5.43]], [["tabla", 33.63], ["music", 17.24], ["musical instrument", 7.81]], [["mains hum", 30.83], ["hum", 25.09], ["music", 18.1]], [["music", 27.25], ["mains hum", 23.89], ["hum", 22.45]], [["speech", 37.07], ["gong", 21.65], ["music", 8.37]], null, null, null], "duration": [1.64, 1.66, 25.56, 1.33, 1.05, -0.09, 0.93, 0.74, 1.31, 5.45, -0.14, 4.02, 0.24, 2.93, 3.91, 4.09, 3.27, 14.94, 2.57, 2.47, 10.07, 2.53, 6.65, 4.98, 12.28]} \ No newline at end of file diff --git a/annotations_filtered/cRsKzW5Fszc_filtered.json b/annotations_filtered/cRsKzW5Fszc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79c9aceaa944ec80a52e434bdebcb76b883ee2b3 --- /dev/null +++ b/annotations_filtered/cRsKzW5Fszc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.59], [12.0, 12.82], [13.0, 14.55], [17.0, 17.74], [18.0, 18.91], [19.0, 20.12], [21.0, 25.05], [26.0, 26.47], [27.0, 27.72], [28.0, 28.46], [29.0, 30.32], [32.0, 31.85], [36.0, 37.12], [38.0, 38.96], [40.0, 39.99], [40.0, 41.45], [42.0, 45.32], [46.0, 46.41], [47.0, 47.38], [48.0, 48.51], [49.0, 50.68], [52.0, 52.56], [54.0, 57.01], [58.0, 62.38], [68.0, 69.15], [69.0, 70.24], [70.0, 77.85], [78.0, 78.54], [83.0, 106.07], [106.0, 106.27], [106.0, 112.45], [112.0, 112.48], [113.0, 118.47], [120.0, 119.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.01, 0.0, 0.0, 0.0, 0.0, 0.0, 71.29, 38.55, 0.0, 0.0, 32.04, 0.0, 31.24, 0.0, 32.25, 0.0, 29.9, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["bouncing", 47.29], ["speech", 28.17], ["whack, thwack", 2.34]], null, null, [["speech", 80.59], ["clip-clop", 2.14], ["radio", 1.73]], null, [["music", 50.65], ["speech", 17.91], ["musical instrument", 6.79]], null, [["music", 69.66], ["musical instrument", 3.37], ["speech", 3.12]], null, [["music", 55.57], ["boing", 11.26], ["smash, crash", 8.5]], null], "duration": [1.59, 0.82, 1.55, 0.74, 0.91, 1.12, 4.05, 0.47, 0.72, 0.46, 1.32, -0.15, 1.12, 0.96, -0.01, 1.45, 3.32, 0.41, 0.38, 0.51, 1.68, 0.56, 3.01, 4.38, 1.15, 1.24, 7.85, 0.54, 23.07, 0.27, 6.45, 0.48, 5.47, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/cRuYB2gXpM8_filtered.json b/annotations_filtered/cRuYB2gXpM8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b210b65d989f447b83efd6c1aadb8e6afffc8957 --- /dev/null +++ b/annotations_filtered/cRuYB2gXpM8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.72], [8.0, 11.67], [12.0, 12.97], [15.0, 14.84], [15.0, 15.77], [17.0, 42.5], [44.0, 73.94], [76.0, 91.34], [93.0, 106.22], [111.0, 111.25], [112.0, 122.89], [124.0, 130.54], [131.0, 173.16], [174.0, 174.07]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.82, 0.0, 0.0, 0.0, 31.91, 33.53, 41.98, 46.26, 0.0, 41.22, 59.59, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 30.3], ["hum", 13.57], ["music", 10.12]], null, null, null, [["throbbing", 46.12], ["music", 34.84], ["hum", 13.09]], [["hum", 16.11], ["throbbing", 13.37], ["music", 9.37]], [["mains hum", 34.2], ["hum", 31.87], ["music", 14.35]], [["music", 39.24], ["hum", 18.36], ["mains hum", 15.59]], null, [["hum", 56.41], ["music", 15.29], ["mains hum", 12.6]], null, null, null], "duration": [0.72, 3.67, 0.97, -0.16, 0.77, 25.5, 29.94, 15.34, 13.22, 0.25, 10.89, 6.54, 42.16, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/cS3cT6vgiT4_filtered.json b/annotations_filtered/cS3cT6vgiT4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6fea9e4df1f062fc56fbe04e51fb4093320f4375 --- /dev/null +++ b/annotations_filtered/cS3cT6vgiT4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.76], [5.0, 6.03], [7.0, 7.96], [9.0, 9.83], [10.0, 10.67], [16.0, 16.9], [18.0, 18.35], [20.0, 23.33], [25.0, 26.27], [27.0, 27.85], [29.0, 29.42], [36.0, 36.49], [37.0, 37.99], [41.0, 41.55], [42.0, 42.74]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 49.69], ["speech", 8.7], ["radio", 5.53]], null, null, null, null, null, null, null], "duration": [0.76, 1.03, 0.96, 0.83, 0.67, 0.9, 0.35, 3.33, 1.27, 0.85, 0.42, 0.49, 0.99, 0.55, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/cSO2u-StPbY_filtered.json b/annotations_filtered/cSO2u-StPbY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30a9a63a5ecf773e526f8e0b9073d334d575b1a9 --- /dev/null +++ b/annotations_filtered/cSO2u-StPbY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 44.81], [70.0, 70.85], [75.0, 86.19]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 29.39], "audiomae_on_audioset": [null, null, [["hum", 30.18], ["music", 22.53], ["mains hum", 17.62]]], "duration": [-0.19, 0.85, 11.19]} \ No newline at end of file diff --git a/annotations_filtered/cSSYFjtc4SY_filtered.json b/annotations_filtered/cSSYFjtc4SY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ce2abf7987ad030441f46da459f63936bb87cf6 --- /dev/null +++ b/annotations_filtered/cSSYFjtc4SY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 18.59], [20.0, 20.78], [22.0, 22.45], [23.0, 23.28], [24.0, 35.23], [38.0, 43.28], [44.0, 103.01], [104.0, 104.82], [105.0, 105.46], [107.0, 107.27], [108.0, 108.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [53.34, 0.0, 0.0, 0.0, 85.72, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [13.59, 0.78, 0.45, 0.28, 11.23, 5.28, 59.01, 0.82, 0.46, 0.27, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/cSUVLAM8jx0_filtered.json b/annotations_filtered/cSUVLAM8jx0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ee87574cae486956851a5f8f2fdea807848d56a --- /dev/null +++ b/annotations_filtered/cSUVLAM8jx0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.13], [3.0, 2.91], [4.0, 5.37], [7.0, 7.4], [11.0, 11.43], [13.0, 14.32], [27.0, 27.62], [28.0, 28.59], [35.0, 36.44], [39.0, 44.81], [48.0, 48.51], [53.0, 53.82], [70.0, 71.56], [74.0, 74.83], [75.0, 75.66], [78.0, 78.48], [86.0, 85.95], [89.0, 88.8], [89.0, 90.39], [95.0, 95.2], [96.0, 96.63], [105.0, 105.33], [106.0, 124.31], [127.0, 130.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.08, 71.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.59], ["speech", 22.57], ["hum", 4.0]], null], "duration": [0.13, -0.09, 1.37, 0.4, 0.43, 1.32, 0.62, 0.59, 1.44, 5.81, 0.51, 0.82, 1.56, 0.83, 0.66, 0.48, -0.05, -0.2, 1.39, 0.2, 0.63, 0.33, 18.31, 3.79]} \ No newline at end of file diff --git a/annotations_filtered/cSWMU_rISfw_filtered.json b/annotations_filtered/cSWMU_rISfw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92c906df72c1b2c91ca1ab461a69e57f22c88db1 --- /dev/null +++ b/annotations_filtered/cSWMU_rISfw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 100.45], [101.0, 101.85], [102.0, 106.14]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 32.02], "audiomae_on_audioset": [null, null, [["fart", 42.83], ["fly, housefly", 13.73], ["mosquito", 13.67]]], "duration": [76.45, 0.85, 4.14]} \ No newline at end of file diff --git a/annotations_filtered/cT1iUwGGUAg_filtered.json b/annotations_filtered/cT1iUwGGUAg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52ce3858c3fc88a731294350d18d2414de9151a7 --- /dev/null +++ b/annotations_filtered/cT1iUwGGUAg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.11], [17.0, 17.19], [19.0, 19.25], [21.0, 21.05], [23.0, 23.38], [24.0, 24.78], [26.0, 27.24], [32.0, 32.48], [54.0, 54.58], [56.0, 57.75], [60.0, 60.02], [61.0, 61.18], [66.0, 66.83], [68.0, 68.22], [80.0, 80.91], [82.0, 82.39], [85.0, 85.02], [89.0, 89.53], [91.0, 91.37], [93.0, 93.41], [95.0, 95.4], [96.0, 97.07], [100.0, 100.57], [101.0, 101.43], [103.0, 103.55], [104.0, 104.33], [107.0, 107.01], [111.0, 111.74], [114.0, 116.73], [127.0, 128.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.17, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.11, 0.19, 0.25, 0.05, 0.38, 0.78, 1.24, 0.48, 0.58, 1.75, 0.02, 0.18, 0.83, 0.22, 0.91, 0.39, 0.02, 0.53, 0.37, 0.41, 0.4, 1.07, 0.57, 0.43, 0.55, 0.33, 0.01, 0.74, 2.73, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/cTQRH6MPV3A_filtered.json b/annotations_filtered/cTQRH6MPV3A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23a0e232eb2dfbe8cbb00d47e05226abcd20d1ed --- /dev/null +++ b/annotations_filtered/cTQRH6MPV3A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.71], [9.0, 8.87], [9.0, 9.64], [17.0, 17.56], [19.0, 20.07], [20.0, 21.42], [26.0, 26.22], [28.0, 30.01], [34.0, 38.75], [46.0, 46.16], [47.0, 46.99], [51.0, 51.29], [53.0, 57.47], [73.0, 76.74], [80.0, 83.25], [86.0, 86.9], [107.0, 106.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 81.71, 0.0, 0.0, 0.0, 99.98, 96.89, 99.9, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.71, -0.13, 0.64, 0.56, 1.07, 1.42, 0.22, 2.01, 4.75, 0.16, -0.01, 0.29, 4.47, 3.74, 3.25, 0.9, -0.04]} \ No newline at end of file diff --git a/annotations_filtered/cTR9Hnxfk7A_filtered.json b/annotations_filtered/cTR9Hnxfk7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d8463d6fe304ad9a03c7bda6ebef068a1f75e96 --- /dev/null +++ b/annotations_filtered/cTR9Hnxfk7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.43], [9.0, 9.85], [12.0, 13.12], [15.0, 15.21], [18.0, 18.96], [20.0, 20.83], [22.0, 23.21], [26.0, 27.75], [29.0, 29.74], [34.0, 34.94], [36.0, 36.63], [42.0, 45.5], [46.0, 49.67], [53.0, 53.67], [55.0, 58.13], [59.0, 62.65], [65.0, 65.16], [66.0, 67.34], [68.0, 68.74], [72.0, 71.98], [73.0, 73.7], [75.0, 75.74], [78.0, 78.09], [79.0, 80.13], [92.0, 93.65], [95.0, 95.79], [101.0, 101.9], [104.0, 107.25], [111.0, 112.53], [113.0, 114.39], [119.0, 121.09], [122.0, 122.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.27, 45.3, 0.0, 43.85, 44.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0, 99.56, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 50.9], ["sidetone", 22.27], ["busy signal", 7.36]], [["fart", 32.77], ["hum", 9.97], ["speech", 7.89]], null, [["stomach rumble", 69.63], ["speech", 14.41], ["fart", 1.67]], [["hum", 47.94], ["throbbing", 11.45], ["mains hum", 8.15]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.43, 0.85, 1.12, 0.21, 0.96, 0.83, 1.21, 1.75, 0.74, 0.94, 0.63, 3.5, 3.67, 0.67, 3.13, 3.65, 0.16, 1.34, 0.74, -0.02, 0.7, 0.74, 0.09, 1.13, 1.65, 0.79, 0.9, 3.25, 1.53, 1.39, 2.09, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/cUEc9ZF3G3M_filtered.json b/annotations_filtered/cUEc9ZF3G3M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8914b22e36c568f662307b4f17d1e656a668fe49 --- /dev/null +++ b/annotations_filtered/cUEc9ZF3G3M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.68], [21.0, 22.52], [24.0, 25.98], [29.0, 30.4], [33.0, 34.37], [35.0, 35.8], [38.0, 38.62], [39.0, 40.42], [43.0, 43.75], [45.0, 45.81], [47.0, 47.09], [50.0, 51.04], [53.0, 53.79], [56.0, 56.69], [59.0, 60.1], [65.0, 65.11], [67.0, 68.08], [69.0, 70.28], [72.0, 72.67], [76.0, 76.74], [84.0, 85.21], [86.0, 86.54], [89.0, 89.06], [90.0, 91.15], [92.0, 92.6], [94.0, 94.56], [96.0, 96.97], [100.0, 100.14], [102.0, 102.19], [103.0, 103.82], [107.0, 108.09], [111.0, 112.38], [114.0, 114.78], [116.0, 116.97], [120.0, 122.39], [126.0, 133.32], [135.0, 137.1], [140.0, 141.3], [143.0, 143.31], [144.0, 144.96], [146.0, 146.38], [147.0, 147.18], [149.0, 149.79], [150.0, 150.85], [151.0, 152.17], [153.0, 154.47], [155.0, 157.23], [158.0, 159.6], [161.0, 161.55], [163.0, 163.63], [165.0, 165.48], [167.0, 168.42], [171.0, 174.02], [175.0, 175.09], [176.0, 176.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.68, 1.52, 1.98, 1.4, 1.37, 0.8, 0.62, 1.42, 0.75, 0.81, 0.09, 1.04, 0.79, 0.69, 1.1, 0.11, 1.08, 1.28, 0.67, 0.74, 1.21, 0.54, 0.06, 1.15, 0.6, 0.56, 0.97, 0.14, 0.19, 0.82, 1.09, 1.38, 0.78, 0.97, 2.39, 7.32, 2.1, 1.3, 0.31, 0.96, 0.38, 0.18, 0.79, 0.85, 1.17, 1.47, 2.23, 1.6, 0.55, 0.63, 0.48, 1.42, 3.02, 0.09, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/cUQZVnerwI0_filtered.json b/annotations_filtered/cUQZVnerwI0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2b6f7b0d9f0decdba3eb504f662aca62d4af702 --- /dev/null +++ b/annotations_filtered/cUQZVnerwI0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 25.37], [27.0, 28.98], [29.0, 44.47], [45.0, 46.8], [49.0, 53.49], [54.0, 55.21], [57.0, 57.4], [58.0, 59.27], [61.0, 63.51], [66.0, 67.59], [69.0, 69.36], [72.0, 73.63], [78.0, 78.95], [84.0, 110.56], [117.0, 117.61], [118.0, 118.69], [120.0, 120.78], [124.0, 124.98], [126.0, 126.6]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.87, 0.0, 90.78, 0.0, 86.45, 0.0, 0.0, 0.0, 67.0, 0.0, 0.0, 0.0, 0.0, 38.84, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 33.83], ["hum", 13.55], ["synthesizer", 6.98]], null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 51.55], ["speech", 25.53], ["sine wave", 4.54]], null, null, null, null, null], "duration": [13.37, 1.98, 15.47, 1.8, 4.49, 1.21, 0.4, 1.27, 2.51, 1.59, 0.36, 1.63, 0.95, 26.56, 0.61, 0.69, 0.78, 0.98, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/cUT0WQ9cTrg_filtered.json b/annotations_filtered/cUT0WQ9cTrg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ab1b808bb3910f4f92894c60ba8b4f8ff33bd03 --- /dev/null +++ b/annotations_filtered/cUT0WQ9cTrg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.79], [3.0, 10.07], [17.0, 25.76], [30.0, 31.95], [42.0, 44.74], [48.0, 48.36], [49.0, 51.07], [57.0, 56.89], [62.0, 63.14], [79.0, 79.02], [85.0, 86.16], [89.0, 94.44], [100.0, 103.64], [104.0, 105.22], [106.0, 108.16]], "keep_status": [false, true, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.28, 31.12, 0.0, 32.75, 0.0, 33.83, 0.0, 0.0, 0.0, 0.0, 34.01, 74.44, 0.0, 91.47], "audiomae_on_audioset": [null, [["cattle, bovinae", 24.87], ["moo", 23.05], ["music", 11.62]], [["music", 35.02], ["hum", 24.34], ["throbbing", 12.26]], null, [["music", 40.82], ["speech", 8.96], ["sidetone", 6.11]], null, [["music", 39.19], ["electronic music", 10.38], ["dubstep", 5.06]], null, null, null, null, [["mosquito", 48.37], ["crushing", 13.7], ["music", 8.46]], null, null, null], "duration": [0.79, 7.07, 8.76, 1.95, 2.74, 0.36, 2.07, -0.11, 1.14, 0.02, 1.16, 5.44, 3.64, 1.22, 2.16]} \ No newline at end of file diff --git a/annotations_filtered/cUX2Mj4SN7o_filtered.json b/annotations_filtered/cUX2Mj4SN7o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c053d0ef26839c184c90ac2f86756f5969a5a43 --- /dev/null +++ b/annotations_filtered/cUX2Mj4SN7o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[71.0, 78.21], [81.0, 95.5], [100.0, 106.32], [108.0, 111.75], [113.0, 121.86], [122.0, 121.91], [123.0, 124.73]], "keep_status": [true, false, true, false, false, false, false], "silence_prob": [38.27, 32.15, 32.91, 45.72, 34.08, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 28.61], ["music", 19.05], ["hum", 4.24]], [["music", 69.54], ["throbbing", 3.44], ["hum", 3.19]], [["hum", 18.85], ["music", 17.99], ["vehicle", 11.05]], [["music", 78.13], ["mains hum", 3.42], ["synthesizer", 3.16]], [["music", 58.88], ["theremin", 19.39], ["synthesizer", 3.91]], null, null], "duration": [7.21, 14.5, 6.32, 3.75, 8.86, -0.09, 1.73]} \ No newline at end of file diff --git a/annotations_filtered/cV9dlsOzyVc_filtered.json b/annotations_filtered/cV9dlsOzyVc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ccde0266eb4da7a3559250514554a086330b0d0 --- /dev/null +++ b/annotations_filtered/cV9dlsOzyVc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.17], [14.0, 20.38], [25.0, 25.69], [27.0, 29.27], [31.0, 31.53], [33.0, 34.75], [38.0, 38.48], [50.0, 51.19], [52.0, 52.84], [61.0, 60.99], [62.0, 62.6], [64.0, 63.69], [67.0, 70.19], [74.0, 83.07], [83.0, 84.84], [85.0, 87.94], [89.0, 89.41], [91.0, 91.56], [92.0, 95.64], [97.0, 97.63], [100.0, 101.43], [104.0, 104.18], [107.0, 107.1], [111.0, 113.05], [119.0, 119.8], [130.0, 134.28], [136.0, 136.34], [139.0, 141.02], [145.0, 144.8], [149.0, 150.6], [151.0, 151.23], [152.0, 153.81], [155.0, 162.14]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [38.79, 32.76, 0.0, 34.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.66, 31.31, 0.0, 48.61, 0.0, 0.0, 99.26, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 99.68, 0.0, 37.75, 0.0, 0.0, 0.0, 0.0, 33.63], "audiomae_on_audioset": [[["music", 80.22], ["synthesizer", 3.98], ["musical instrument", 2.08]], [["music", 43.48], ["throbbing", 16.96], ["synthesizer", 11.44]], null, [["speech", 25.66], ["whale vocalization", 16.88], ["water", 12.91]], null, null, null, null, null, null, null, null, [["music", 40.75], ["speech", 16.15], ["scratching (performance technique)", 6.62]], [["music", 77.84], ["electronic music", 4.02], ["didgeridoo", 2.83]], null, [["speech", 27.01], ["sidetone", 14.98], ["music", 6.84]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.4], ["music", 30.22], ["inside, small room", 3.16]], null, null, null, null, [["music", 48.31], ["guitar", 11.15], ["effects unit", 10.23]]], "duration": [3.17, 6.38, 0.69, 2.27, 0.53, 1.75, 0.48, 1.19, 0.84, -0.01, 0.6, -0.31, 3.19, 9.07, 1.84, 2.94, 0.41, 0.56, 3.64, 0.63, 1.43, 0.18, 0.1, 2.05, 0.8, 4.28, 0.34, 2.02, -0.2, 1.6, 0.23, 1.81, 7.14]} \ No newline at end of file diff --git a/annotations_filtered/cVA4BO2v7zs_filtered.json b/annotations_filtered/cVA4BO2v7zs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65f5647e9c8e90faa038709d6212c52255293f5f --- /dev/null +++ b/annotations_filtered/cVA4BO2v7zs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 12.66], [14.0, 20.85], [22.0, 23.09], [24.0, 24.98], [25.0, 26.69], [27.0, 29.25], [30.0, 32.39], [34.0, 34.65], [35.0, 35.9], [38.0, 37.84], [46.0, 46.97], [48.0, 48.96], [50.0, 52.17], [52.0, 52.84], [54.0, 53.96], [55.0, 56.2], [57.0, 69.4], [70.0, 87.39]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [45.3, 63.96, 0.0, 0.0, 0.0, 95.23, 99.76, 0.0, 0.0, 0.0, 0.0, 0.0, 86.82, 0.0, 0.0, 0.0, 45.21, 29.71], "audiomae_on_audioset": [[["music", 39.5], ["hum", 11.94], ["throbbing", 5.72]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 68.18], ["synthesizer", 7.79], ["electronic music", 3.14]], [["music", 62.03], ["sound effect", 3.64], ["didgeridoo", 3.24]]], "duration": [6.66, 6.85, 1.09, 0.98, 1.69, 2.25, 2.39, 0.65, 0.9, -0.16, 0.97, 0.96, 2.17, 0.84, -0.04, 1.2, 12.4, 17.39]} \ No newline at end of file diff --git a/annotations_filtered/cVIS31ghLNQ_filtered.json b/annotations_filtered/cVIS31ghLNQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37d9829078a54a6317ed44483802009ec65d8de0 --- /dev/null +++ b/annotations_filtered/cVIS31ghLNQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 32.64], [36.0, 67.58], [70.0, 69.67], [70.0, 71.41], [74.0, 80.42], [83.0, 85.6], [89.0, 89.7], [100.0, 116.09], [119.0, 119.79], [120.0, 134.64], [138.0, 141.94], [150.0, 150.5], [151.0, 151.01], [152.0, 155.44], [156.0, 166.72], [168.0, 169.96]], "keep_status": [false, false, false, false, true, false, false, true, false, true, false, false, false, true, true, false], "silence_prob": [34.67, 0.0, 0.0, 0.0, 31.2, 30.68, 0.0, 30.34, 0.0, 30.83, 34.26, 0.0, 0.0, 31.13, 44.93, 0.0], "audiomae_on_audioset": [[["music", 73.01], ["musical instrument", 13.29], ["didgeridoo", 2.97]], null, null, null, [["music", 13.85], ["mosquito", 10.18], ["fly, housefly", 9.01]], [["whale vocalization", 35.18], ["speech", 18.14], ["music", 17.92]], null, [["music", 44.44], ["synthesizer", 7.15], ["cacophony", 5.54]], null, [["speech", 35.2], ["vehicle", 10.45], ["music", 8.57]], [["music", 36.54], ["speech", 26.72], ["throbbing", 10.11]], null, null, [["music", 43.64], ["speech", 12.67], ["sidetone", 4.36]], [["music", 23.57], ["throbbing", 17.49], ["hum", 16.86]], null], "duration": [3.64, 31.58, -0.33, 1.41, 6.42, 2.6, 0.7, 16.09, 0.79, 14.64, 3.94, 0.5, 0.01, 3.44, 10.72, 1.96]} \ No newline at end of file diff --git a/annotations_filtered/cVPTibn-ewI_filtered.json b/annotations_filtered/cVPTibn-ewI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13de3a72d5eca36df37ac54ff4f8ffdac3d6577d --- /dev/null +++ b/annotations_filtered/cVPTibn-ewI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[53.0, 53.62], [55.0, 62.61], [64.0, 64.02], [65.0, 65.91], [67.0, 68.03], [69.0, 69.26], [70.0, 70.46], [71.0, 73.94], [76.0, 79.84], [86.0, 104.97], [106.0, 106.86], [110.0, 112.48], [114.0, 129.19], [133.0, 137.57], [139.0, 139.82], [145.0, 145.47], [146.0, 147.48], [149.0, 150.04], [151.0, 152.76], [154.0, 161.54], [163.0, 163.9], [168.0, 212.21]], "keep_status": [false, true, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 45.82, 0.0, 0.0, 0.0, 0.0, 0.0, 36.8, 42.02, 35.05, 0.0, 55.81, 67.38, 59.86, 0.0, 0.0, 0.0, 0.0, 0.0, 51.28, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 45.48], ["sidetone", 8.68], ["hum", 5.02]], null, null, null, null, null, [["speech", 18.46], ["crowd", 15.82], ["run", 5.32]], [["speech", 43.83], ["whale vocalization", 5.42], ["hubbub, speech noise, speech babble", 4.56]], [["gunshot, gunfire", 29.24], ["artillery fire", 22.49], ["speech", 14.24]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 7.61, 0.02, 0.91, 1.03, 0.26, 0.46, 2.94, 3.84, 18.97, 0.86, 2.48, 15.19, 4.57, 0.82, 0.47, 1.48, 1.04, 1.76, 7.54, 0.9, 44.21]} \ No newline at end of file diff --git a/annotations_filtered/cW23WpOvC6A_filtered.json b/annotations_filtered/cW23WpOvC6A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f846b2d60cde779edbd979567e7219ccc9141a3 --- /dev/null +++ b/annotations_filtered/cW23WpOvC6A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.5], [21.0, 21.78], [28.0, 38.23], [40.0, 40.15], [40.0, 41.5], [42.0, 41.54], [44.0, 46.97], [47.0, 51.51], [55.0, 54.53], [55.0, 54.57], [55.0, 54.6], [55.0, 54.9], [55.0, 54.94], [58.0, 62.06], [72.0, 77.87], [82.0, 95.32]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 30.38, 0.0, 0.0, 0.0, 29.04, 29.26, 0.0, 0.0, 0.0, 0.0, 0.0, 28.9, 29.1, 28.67], "audiomae_on_audioset": [null, null, [["livestock, farm animals, working animals", 38.61], ["cattle, bovinae", 28.57], ["moo", 23.43]], null, null, null, [["music", 50.12], ["didgeridoo", 5.36], ["reverberation", 4.94]], [["music", 70.79], ["didgeridoo", 4.58], ["funk", 4.41]], null, null, null, null, null, [["music", 72.29], ["didgeridoo", 10.33], ["musical instrument", 2.69]], [["music", 87.77], ["theremin", 1.96], ["carnatic music", 1.86]], [["sheep", 20.78], ["music", 16.07], ["bleat", 14.05]]], "duration": [0.5, 0.78, 10.23, 0.15, 1.5, -0.46, 2.97, 4.51, -0.47, -0.43, -0.4, -0.1, -0.06, 4.06, 5.87, 13.32]} \ No newline at end of file diff --git a/annotations_filtered/cW7AkQihsa8_filtered.json b/annotations_filtered/cW7AkQihsa8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..314267814bd01d59661c247723bcdb4655fb22a4 --- /dev/null +++ b/annotations_filtered/cW7AkQihsa8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.32], [8.0, 8.41], [10.0, 11.45], [15.0, 16.04], [19.0, 25.44], [27.0, 27.82], [30.0, 30.55], [31.0, 49.17], [50.0, 50.9], [54.0, 54.31], [56.0, 57.03], [58.0, 58.83], [64.0, 64.15], [64.0, 64.96], [67.0, 67.24], [67.0, 68.15], [69.0, 70.73], [73.0, 73.3], [74.0, 75.03], [87.0, 87.72], [95.0, 96.25], [104.0, 104.97], [108.0, 108.23], [111.0, 110.94], [116.0, 116.28], [119.0, 119.87], [127.0, 127.58], [134.0, 133.62], [154.0, 154.5], [184.0, 183.79]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.57, 0.0, 0.0, 49.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 70.57], ["radio", 6.92], ["music", 5.66]], null, null, [["creak", 34.6], ["fart", 24.85], ["glass", 7.23]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.32, 0.41, 1.45, 1.04, 6.44, 0.82, 0.55, 18.17, 0.9, 0.31, 1.03, 0.83, 0.15, 0.96, 0.24, 1.15, 1.73, 0.3, 1.03, 0.72, 1.25, 0.97, 0.23, -0.06, 0.28, 0.87, 0.58, -0.38, 0.5, -0.21]} \ No newline at end of file diff --git a/annotations_filtered/cW7Q7UySxRA_filtered.json b/annotations_filtered/cW7Q7UySxRA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf0e21cc8ad07ec897d6b5aae2555045116c09cd --- /dev/null +++ b/annotations_filtered/cW7Q7UySxRA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 46.35], [54.0, 80.76], [81.0, 109.95], [110.0, 123.31], [124.0, 138.92]], "keep_status": [false, true, false, false, false], "silence_prob": [32.57, 35.41, 32.83, 29.78, 29.72], "audiomae_on_audioset": [[["music", 68.57], ["timpani", 4.65], ["musical instrument", 4.04]], [["music", 34.37], ["rumble", 7.1], ["hum", 6.04]], [["music", 51.8], ["timpani", 17.45], ["musical instrument", 5.09]], [["music", 59.8], ["brass instrument", 6.87], ["musical instrument", 6.11]], [["music", 81.56], ["musical instrument", 4.07], ["theremin", 4.02]]], "duration": [4.35, 26.76, 28.95, 13.31, 14.92]} \ No newline at end of file diff --git a/annotations_filtered/cWMP0aAueQY_filtered.json b/annotations_filtered/cWMP0aAueQY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b888bd3a4ab662cf51cdfb90bda451b5651b7c6 --- /dev/null +++ b/annotations_filtered/cWMP0aAueQY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.8], [4.0, 5.09], [6.0, 6.52], [11.0, 11.89], [14.0, 47.63], [49.0, 49.27], [51.0, 51.85], [56.0, 57.77], [58.0, 79.17], [86.0, 88.28], [90.0, 90.85], [91.0, 92.15], [94.0, 95.42], [102.0, 108.45], [113.0, 113.75], [115.0, 118.18], [128.0, 129.1], [133.0, 139.36], [139.0, 139.48], [140.0, 140.41], [141.0, 140.95], [142.0, 147.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.23, 86.27, 0.0, 0.0, 0.0, 46.4, 0.0, 36.59, 0.0, 48.19, 0.0, 0.0, 0.0, 54.23], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 58.47], ["thunk", 14.05], ["door", 6.51]], null, [["music", 42.2], ["speech", 23.88], ["boing", 12.64]], null, [["speech", 48.97], ["radio", 20.35], ["noise", 8.84]], null, null, null, null], "duration": [0.8, 1.09, 0.52, 0.89, 33.63, 0.27, 0.85, 1.77, 21.17, 2.28, 0.85, 1.15, 1.42, 6.45, 0.75, 3.18, 1.1, 6.36, 0.48, 0.41, -0.05, 5.07]} \ No newline at end of file diff --git a/annotations_filtered/cWYIlga8sas_filtered.json b/annotations_filtered/cWYIlga8sas_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f782e2714516f0412ee21bbc8bd8602275a46a15 --- /dev/null +++ b/annotations_filtered/cWYIlga8sas_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[161.0, 164.74]], "keep_status": [true], "silence_prob": [38.79], "audiomae_on_audioset": [[["sonar", 31.78], ["music", 26.05], ["sound effect", 5.8]]], "duration": [3.74]} \ No newline at end of file diff --git a/annotations_filtered/cWiljyh4NR4_filtered.json b/annotations_filtered/cWiljyh4NR4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c59e033d3e8581923e08d06e19030c96dabd142c --- /dev/null +++ b/annotations_filtered/cWiljyh4NR4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.27], [3.0, 3.35], [4.0, 4.04], [4.0, 4.7], [5.0, 5.97], [6.0, 7.62], [8.0, 8.75], [9.0, 12.14], [14.0, 14.17], [15.0, 15.89], [17.0, 17.05], [18.0, 19.8], [21.0, 21.83], [23.0, 105.31], [106.0, 107.45], [108.0, 111.43], [113.0, 113.44], [114.0, 116.78], [120.0, 120.58], [122.0, 122.89], [124.0, 126.74], [128.0, 128.51], [129.0, 130.52], [132.0, 132.31], [134.0, 134.86], [136.0, 136.83], [139.0, 139.04], [140.0, 148.14], [152.0, 157.05], [159.0, 166.56], [168.0, 173.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.58, 0.0, 55.11, 0.0, 0.0, 78.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.22, 68.02, 69.88, 66.39], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.27, 0.35, 0.04, 0.7, 0.97, 1.62, 0.75, 3.14, 0.17, 0.89, 0.05, 1.8, 0.83, 82.31, 1.45, 3.43, 0.44, 2.78, 0.58, 0.89, 2.74, 0.51, 1.52, 0.31, 0.86, 0.83, 0.04, 8.14, 5.05, 7.56, 5.52]} \ No newline at end of file diff --git a/annotations_filtered/cWj-sdxFiY4_filtered.json b/annotations_filtered/cWj-sdxFiY4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57ca7ab3c421af14502b6d43e69c3693d558cc7f --- /dev/null +++ b/annotations_filtered/cWj-sdxFiY4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.02], [9.0, 9.05], [9.0, 9.09], [9.0, 9.12], [9.0, 9.19], [9.0, 83.61], [86.0, 91.57], [92.0, 95.49], [100.0, 106.61], [111.0, 122.54]], "keep_status": [false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.61, 29.74, 29.6, 29.56], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 31.1], ["vehicle", 29.16], ["car", 19.02]], [["music", 39.05], ["throbbing", 15.75], ["hum", 11.26]], [["vehicle", 38.08], ["speech", 34.98], ["car", 11.61]], [["vehicle", 23.32], ["car", 17.74], ["race car, auto racing", 10.13]]], "duration": [0.02, 0.05, 0.09, 0.12, 0.19, 74.61, 5.57, 3.49, 6.61, 11.54]} \ No newline at end of file diff --git a/annotations_filtered/cWuFfrettMY_filtered.json b/annotations_filtered/cWuFfrettMY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c55c8bc929f80185cbd2d3d483eee871125077c --- /dev/null +++ b/annotations_filtered/cWuFfrettMY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 19.62], [21.0, 22.86], [25.0, 26.7], [27.0, 42.2], [44.0, 45.52], [47.0, 49.84], [51.0, 56.89], [59.0, 61.72], [63.0, 69.65], [70.0, 71.42], [73.0, 74.33], [75.0, 77.33], [80.0, 79.98], [83.0, 84.67], [86.0, 88.45]], "keep_status": [true, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [45.18, 0.0, 0.0, 62.37, 0.0, 84.07, 42.91, 88.83, 86.09, 0.0, 0.0, 34.9, 0.0, 0.0, 86.09], "audiomae_on_audioset": [[["frog", 47.27], ["fly, housefly", 10.8], ["speech", 7.62]], null, null, null, null, null, [["speech", 34.32], ["sine wave", 16.73], ["sidetone", 9.97]], null, null, null, null, [["cattle, bovinae", 33.04], ["moo", 24.49], ["livestock, farm animals, working animals", 20.39]], null, null, null], "duration": [7.62, 1.86, 1.7, 15.2, 1.52, 2.84, 5.89, 2.72, 6.65, 1.42, 1.33, 2.33, -0.02, 1.67, 2.45]} \ No newline at end of file diff --git a/annotations_filtered/cXCMz340CRg_filtered.json b/annotations_filtered/cXCMz340CRg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75010b83fee156f32ecfb24c02e693a75d458397 --- /dev/null +++ b/annotations_filtered/cXCMz340CRg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.05], [7.0, 8.16], [11.0, 17.19], [19.0, 20.38], [23.0, 23.92], [25.0, 26.96], [27.0, 44.73], [52.0, 54.23], [58.0, 58.09], [61.0, 63.41], [68.0, 68.01], [72.0, 88.82], [91.0, 115.33]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [59.24, 0.0, 61.87, 0.0, 0.0, 0.0, 43.71, 42.65, 0.0, 41.62, 0.0, 31.66, 33.71], "audiomae_on_audioset": [null, null, null, null, null, null, [["throbbing", 57.96], ["hum", 22.27], ["music", 6.0]], [["speech", 21.05], ["hum", 10.05], ["fly, housefly", 6.32]], null, [["hum", 41.54], ["throbbing", 38.06], ["mains hum", 4.82]], null, [["speech", 34.54], ["music", 23.1], ["explosion", 8.95]], [["music", 53.08], ["throbbing", 11.06], ["theremin", 7.16]]], "duration": [2.05, 1.16, 6.19, 1.38, 0.92, 1.96, 17.73, 2.23, 0.09, 2.41, 0.01, 16.82, 24.33]} \ No newline at end of file diff --git a/annotations_filtered/cXfD-Ai_QuA_filtered.json b/annotations_filtered/cXfD-Ai_QuA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ce519987b2a9a606b3f1bb3c5410a7207ea1d57 --- /dev/null +++ b/annotations_filtered/cXfD-Ai_QuA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 26.84], [29.0, 30.25], [32.0, 33.64], [35.0, 36.07], [38.0, 52.12], [54.0, 55.22], [57.0, 57.92], [60.0, 60.54], [62.0, 62.92], [64.0, 65.2], [69.0, 70.48], [72.0, 73.36], [74.0, 74.26], [78.0, 80.01], [80.0, 80.05], [81.0, 81.31], [85.0, 85.68], [90.0, 90.95], [94.0, 99.74], [100.0, 100.65], [101.0, 101.34], [103.0, 103.86], [104.0, 107.01], [109.0, 112.62], [114.0, 115.13], [117.0, 117.9], [120.0, 120.26], [128.0, 128.44], [134.0, 134.77], [139.0, 141.05], [142.0, 144.86], [145.0, 144.9], [145.0, 144.93], [145.0, 146.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 63.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.25, 0.0, 0.0, 0.0, 0.0, 45.95, 0.0, 0.0, 0.0, 64.29, 53.34, 0.0, 0.0, 0.0, 0.0, 0.0, 95.64, 85.17, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["dial tone", 23.3], ["sidetone", 22.37], ["sine wave", 21.93]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.84, 1.25, 1.64, 1.07, 14.12, 1.22, 0.92, 0.54, 0.92, 1.2, 1.48, 1.36, 0.26, 2.01, 0.05, 0.31, 0.68, 0.95, 5.74, 0.65, 0.34, 0.86, 3.01, 3.62, 1.13, 0.9, 0.26, 0.44, 0.77, 2.05, 2.86, -0.1, -0.07, 1.4]} \ No newline at end of file diff --git a/annotations_filtered/cXlRo6pJ9ig_filtered.json b/annotations_filtered/cXlRo6pJ9ig_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf3539815930ea86ea22f218bd30495cdd3813ac --- /dev/null +++ b/annotations_filtered/cXlRo6pJ9ig_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 24.87], [26.0, 26.45], [26.0, 39.41], [46.0, 47.44], [48.0, 48.24], [49.0, 50.52], [52.0, 53.65], [66.0, 66.8], [68.0, 68.77], [73.0, 76.15], [77.0, 78.29], [80.0, 82.73], [84.0, 85.95], [86.0, 88.03], [89.0, 88.6], [89.0, 90.34], [91.0, 93.16], [96.0, 95.59], [96.0, 96.7], [97.0, 98.71], [99.0, 128.01], [130.0, 131.33], [134.0, 136.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [50.21, 0.0, 86.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 0.0, 97.11, 0.0, 93.45, 0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 31.0, 0.0, 40.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 50.94], ["speech", 21.87], ["gunshot, gunfire", 4.38]], null, [["music", 30.02], ["gong", 10.22], ["ambient music", 9.77]]], "duration": [5.87, 0.45, 13.41, 1.44, 0.24, 1.52, 1.65, 0.8, 0.77, 3.15, 1.29, 2.73, 1.95, 2.03, -0.4, 1.34, 2.16, -0.41, 0.7, 1.71, 29.01, 1.33, 2.9]} \ No newline at end of file diff --git a/annotations_filtered/cXm_h4Zdwpc_filtered.json b/annotations_filtered/cXm_h4Zdwpc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..184f584d2d16f988ae7ee557429bd8caea9b06f4 --- /dev/null +++ b/annotations_filtered/cXm_h4Zdwpc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.13], [15.0, 16.9], [19.0, 19.85], [21.0, 21.3], [22.0, 23.28], [24.0, 25.74], [27.0, 33.07], [34.0, 35.18], [36.0, 36.56], [37.0, 42.38], [46.0, 46.95], [48.0, 49.77], [50.0, 51.98], [53.0, 53.38], [55.0, 56.03], [57.0, 58.18], [60.0, 63.04], [64.0, 67.41], [79.0, 80.25], [84.0, 90.64], [98.0, 98.9], [101.0, 101.02], [102.0, 104.08], [106.0, 108.21], [111.0, 120.01], [121.0, 121.85], [125.0, 126.33], [129.0, 129.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 46.9, 0.0, 0.0, 77.53, 46.26, 43.08, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 60.48], ["theremin", 9.79], ["musical instrument", 4.32]], null, null, null, [["foghorn", 36.94], ["music", 35.29], ["theremin", 3.26]], [["music", 51.68], ["synthesizer", 9.16], ["musical instrument", 6.86]], null, null, null], "duration": [2.13, 1.9, 0.85, 0.3, 1.28, 1.74, 6.07, 1.18, 0.56, 5.38, 0.95, 1.77, 1.98, 0.38, 1.03, 1.18, 3.04, 3.41, 1.25, 6.64, 0.9, 0.02, 2.08, 2.21, 9.01, 0.85, 1.33, 0.86]} \ No newline at end of file diff --git a/annotations_filtered/cY8yXitzluU_filtered.json b/annotations_filtered/cY8yXitzluU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8650d25509de7b3958d108fcba2f2806956b1442 --- /dev/null +++ b/annotations_filtered/cY8yXitzluU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.26], [5.0, 12.12], [17.0, 46.62], [48.0, 48.63], [49.0, 51.09], [53.0, 53.6], [55.0, 56.57], [57.0, 58.55], [60.0, 61.47], [63.0, 82.66], [83.0, 86.41], [88.0, 89.01], [90.0, 92.06], [93.0, 93.8], [97.0, 97.17], [103.0, 104.77], [106.0, 109.66], [111.0, 111.79], [114.0, 117.98], [122.0, 122.69], [125.0, 125.36], [126.0, 127.01], [128.0, 165.32], [166.0, 171.91], [172.0, 179.71], [180.0, 184.76]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 37.28, 42.13, 0.0, 51.18, 0.0, 0.0, 0.0, 0.0, 45.21, 62.37, 0.0, 89.54, 0.0, 0.0, 0.0, 69.07, 0.0, 52.05, 0.0, 0.0, 0.0, 0.0, 33.94, 39.6, 60.7], "audiomae_on_audioset": [null, [["music", 23.85], ["breaking", 19.13], ["speech", 15.24]], [["music", 69.5], ["didgeridoo", 5.72], ["throbbing", 4.94]], null, null, null, null, null, null, [["coin (dropping)", 20.01], ["music", 16.33], ["noise", 6.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.7], ["moo", 5.25], ["effects unit", 4.2]], [["speech", 22.65], ["music", 21.48], ["hum", 13.58]], null], "duration": [0.26, 7.12, 29.62, 0.63, 2.09, 0.6, 1.57, 1.55, 1.47, 19.66, 3.41, 1.01, 2.06, 0.8, 0.17, 1.77, 3.66, 0.79, 3.98, 0.69, 0.36, 1.01, 37.32, 5.91, 7.71, 4.76]} \ No newline at end of file diff --git a/annotations_filtered/cYGVkLGyGqE_filtered.json b/annotations_filtered/cYGVkLGyGqE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b23e4005a217e1ebba53f4430381010e1bd6b64a --- /dev/null +++ b/annotations_filtered/cYGVkLGyGqE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 73.33], [74.0, 76.03]], "keep_status": [false, true], "silence_prob": [0.0, 31.99], "audiomae_on_audioset": [null, [["music", 30.32], ["foghorn", 18.28], ["trombone", 17.26]]], "duration": [42.33, 2.03]} \ No newline at end of file diff --git a/annotations_filtered/cYdScH3BmBk_filtered.json b/annotations_filtered/cYdScH3BmBk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..baba292f32ffa90bcce1034b5252e00653527e99 --- /dev/null +++ b/annotations_filtered/cYdScH3BmBk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.53], [14.0, 14.27], [17.0, 26.18], [27.0, 27.06], [40.0, 41.57], [47.0, 60.32], [64.0, 64.22], [64.0, 64.25], [64.0, 64.29], [64.0, 64.66], [70.0, 70.66], [73.0, 72.99], [74.0, 74.24], [80.0, 83.64]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 42.6, 0.0, 0.0, 31.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.18], "audiomae_on_audioset": [null, null, [["moo", 41.99], ["cattle, bovinae", 31.92], ["livestock, farm animals, working animals", 18.67]], null, null, [["explosion", 37.83], ["burst, pop", 12.59], ["speech", 9.29]], null, null, null, null, null, null, null, null], "duration": [1.53, 0.27, 9.18, 0.06, 1.57, 13.32, 0.22, 0.25, 0.29, 0.66, 0.66, -0.01, 0.24, 3.64]} \ No newline at end of file diff --git a/annotations_filtered/cYjv9uWxW94_filtered.json b/annotations_filtered/cYjv9uWxW94_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27f256188c81f9e548d87f20d982069bb4cadd8e --- /dev/null +++ b/annotations_filtered/cYjv9uWxW94_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.35], [8.0, 8.16], [11.0, 12.72], [14.0, 16.17], [18.0, 18.93], [25.0, 26.57], [27.0, 27.62], [32.0, 35.09], [36.0, 37.94], [40.0, 41.89], [43.0, 45.3], [49.0, 48.78], [52.0, 53.84], [56.0, 56.96], [65.0, 64.86], [67.0, 67.29], [70.0, 70.36], [72.0, 73.33], [74.0, 75.05], [76.0, 78.07], [79.0, 79.81], [82.0, 83.19], [85.0, 85.48], [87.0, 87.84], [89.0, 91.52], [92.0, 95.89], [97.0, 99.06], [100.0, 100.95], [102.0, 103.08], [104.0, 106.29], [107.0, 107.79], [109.0, 111.57], [114.0, 117.51], [120.0, 122.03], [124.0, 124.11], [127.0, 127.84], [128.0, 134.45], [135.0, 136.7], [137.0, 136.88], [137.0, 139.89], [144.0, 144.61], [153.0, 159.7], [163.0, 164.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 59.33, 0.0, 0.0, 0.0, 65.67, 0.0, 0.0, 92.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 0.0, 0.0, 0.0, 50.16, 76.2, 73.51, 0.0, 0.0, 67.51, 0.0, 68.54, 45.62, 48.23, 0.0, 0.0, 38.9, 0.0, 0.0, 42.53, 0.0, 38.17, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 49.74], ["jingle bell", 6.29], ["tambourine", 5.67]], [["throbbing", 26.5], ["hum", 19.47], ["music", 11.88]], null, null, [["music", 33.49], ["speech", 32.79], ["throbbing", 8.26]], null, null, [["music", 63.22], ["musical instrument", 7.18], ["guitar", 6.85]], null, [["music", 49.11], ["speech", 21.81], ["musical instrument", 6.86]], null], "duration": [0.35, 0.16, 1.72, 2.17, 0.93, 1.57, 0.62, 3.09, 1.94, 1.89, 2.3, -0.22, 1.84, 0.96, -0.14, 0.29, 0.36, 1.33, 1.05, 2.07, 0.81, 1.19, 0.48, 0.84, 2.52, 3.89, 2.06, 0.95, 1.08, 2.29, 0.79, 2.57, 3.51, 2.03, 0.11, 0.84, 6.45, 1.7, -0.12, 2.89, 0.61, 6.7, 1.51]} \ No newline at end of file diff --git a/annotations_filtered/cZKYcRqPh-o_filtered.json b/annotations_filtered/cZKYcRqPh-o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..238240f0d85a6c1ccc872606a8dcadbb20643b29 --- /dev/null +++ b/annotations_filtered/cZKYcRqPh-o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.3], [12.0, 13.36], [15.0, 17.66], [20.0, 21.46], [24.0, 28.43], [31.0, 32.48], [34.0, 42.62], [47.0, 48.36], [51.0, 52.42], [60.0, 60.61], [62.0, 63.22], [65.0, 65.45], [68.0, 68.66], [70.0, 71.24], [74.0, 74.6], [81.0, 86.68], [91.0, 91.86], [97.0, 98.85], [105.0, 106.84], [109.0, 111.97], [115.0, 119.4], [123.0, 124.75], [126.0, 128.98], [133.0, 134.77], [143.0, 144.31], [149.0, 150.99], [151.0, 152.58], [154.0, 155.28], [157.0, 158.73], [161.0, 165.43], [166.0, 168.05], [170.0, 171.15], [173.0, 173.25]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 80.11, 0.0, 99.73, 0.0, 45.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.0, 0.0, 0.0, 0.0, 80.82, 91.98, 0.0, 97.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 96.04, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["whale vocalization", 14.25], ["throat clearing", 13.82], ["cough", 13.73]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.3, 1.36, 2.66, 1.46, 4.43, 1.48, 8.62, 1.36, 1.42, 0.61, 1.22, 0.45, 0.66, 1.24, 0.6, 5.68, 0.86, 1.85, 1.84, 2.97, 4.4, 1.75, 2.98, 1.77, 1.31, 1.99, 1.58, 1.28, 1.73, 4.43, 2.05, 1.15, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/cZP4yFO6l78_filtered.json b/annotations_filtered/cZP4yFO6l78_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e16b9068a6aef9015351f07413e09298055b675a --- /dev/null +++ b/annotations_filtered/cZP4yFO6l78_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 28.14], [28.0, 28.17], [31.0, 31.53], [39.0, 39.65], [110.0, 110.76]], "keep_status": [false, false, false, false, false], "silence_prob": [33.07, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 45.18], ["music", 30.47], ["sidetone", 2.71]], null, null, null, null], "duration": [2.14, 0.17, 0.53, 0.65, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/cZumS81KSw8_filtered.json b/annotations_filtered/cZumS81KSw8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ced5f8360e7da02ef8a3f618293924d64f9af38a --- /dev/null +++ b/annotations_filtered/cZumS81KSw8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.1], [10.0, 10.12], [16.0, 16.19], [17.0, 19.6], [40.0, 42.7], [44.0, 44.34], [53.0, 52.71], [59.0, 59.7], [84.0, 86.22], [86.0, 87.99], [105.0, 105.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 99.96, 54.23, 0.0, 0.0, 0.0, 59.86, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [2.1, 0.12, 0.19, 2.6, 2.7, 0.34, -0.29, 0.7, 2.22, 1.99, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/cZwdCa0ynEw_filtered.json b/annotations_filtered/cZwdCa0ynEw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06df865b50033f2716ece235fa929a0f97649ba1 --- /dev/null +++ b/annotations_filtered/cZwdCa0ynEw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.75], [9.0, 11.47], [13.0, 24.17], [28.0, 28.98], [29.0, 32.49], [34.0, 34.77], [47.0, 51.33], [52.0, 53.42], [58.0, 58.75], [59.0, 59.64], [61.0, 62.02], [62.0, 62.33], [62.0, 64.76], [65.0, 68.34], [69.0, 71.51], [74.0, 77.72], [81.0, 81.33], [86.0, 85.75], [86.0, 86.29], [88.0, 88.65], [90.0, 93.66], [99.0, 102.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 99.26, 90.08, 0.0, 94.81, 0.0, 51.55, 0.0, 0.0, 0.0, 0.0, 0.0, 73.82, 52.33, 74.76, 66.15, 0.0, 0.0, 0.0, 0.0, 34.15, 52.8], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 25.01], ["fly, housefly", 9.79], ["mosquito", 3.4]], null], "duration": [-0.25, 2.47, 11.17, 0.98, 3.49, 0.77, 4.33, 1.42, 0.75, 0.64, 1.02, 0.33, 2.76, 3.34, 2.51, 3.72, 0.33, -0.25, 0.29, 0.65, 3.66, 3.64]} \ No newline at end of file diff --git a/annotations_filtered/cZy7qSG8RHQ_filtered.json b/annotations_filtered/cZy7qSG8RHQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d80275d55eda7bfc6a1c5e4bb9374534fbfad3d --- /dev/null +++ b/annotations_filtered/cZy7qSG8RHQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.97], [22.0, 22.25], [27.0, 27.9], [29.0, 29.96], [32.0, 31.82], [32.0, 33.0], [33.0, 34.11], [36.0, 42.21], [49.0, 50.48], [69.0, 69.7], [73.0, 73.85], [74.0, 75.46], [78.0, 78.54], [86.0, 86.98], [90.0, 95.59], [104.0, 104.79], [106.0, 106.66], [119.0, 119.52], [129.0, 128.75], [131.0, 132.07]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.77, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["moo", 18.64], ["speech", 18.6], ["cattle, bovinae", 18.07]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.97, 0.25, 0.9, 0.96, -0.18, 1.0, 1.11, 6.21, 1.48, 0.7, 0.85, 1.46, 0.54, 0.98, 5.59, 0.79, 0.66, 0.52, -0.25, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/c_69KA0PKYI_filtered.json b/annotations_filtered/c_69KA0PKYI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a62205bc8f5a6821e8d04c2785e713be5264034 --- /dev/null +++ b/annotations_filtered/c_69KA0PKYI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.11], [23.0, 23.79], [25.0, 24.66], [25.0, 26.37], [27.0, 39.77], [48.0, 48.03]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 36.48, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 72.31], ["speech", 9.43], ["boing", 2.93]], null], "duration": [1.11, 0.79, -0.34, 1.37, 12.77, 0.03]} \ No newline at end of file diff --git a/annotations_filtered/c_6SIVs_M5Q_filtered.json b/annotations_filtered/c_6SIVs_M5Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a6d3f8f9887adf004eb968a8ab6ed18e08d3604 --- /dev/null +++ b/annotations_filtered/c_6SIVs_M5Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.08], [12.0, 11.87], [13.0, 15.04], [16.0, 16.04], [27.0, 27.31], [30.0, 30.81], [31.0, 31.14], [33.0, 33.47], [34.0, 35.95], [36.0, 55.34], [65.0, 69.04], [74.0, 76.94], [84.0, 89.06], [90.0, 98.71], [100.0, 148.44], [150.0, 157.71]], "keep_status": [true, false, true, false, false, false, false, false, false, true, true, true, false, true, false, true], "silence_prob": [32.06, 0.0, 32.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.66, 46.19, 39.52, 32.57, 29.44, 0.0, 33.0], "audiomae_on_audioset": [[["hum", 26.82], ["throbbing", 23.36], ["speech", 14.86]], null, [["music", 47.67], ["foghorn", 4.97], ["musical instrument", 4.69]], null, null, null, null, null, null, [["music", 48.61], ["rumble", 14.7], ["hum", 5.74]], [["speech", 27.51], ["music", 25.33], ["sidetone", 12.75]], [["music", 57.45], ["throbbing", 4.67], ["timpani", 3.14]], [["music", 54.36], ["speech", 16.59], ["throbbing", 6.79]], [["music", 29.69], ["mains hum", 15.01], ["hum", 9.83]], null, [["speech", 18.36], ["buzz", 12.08], ["cattle, bovinae", 7.56]]], "duration": [2.08, -0.13, 2.04, 0.04, 0.31, 0.81, 0.14, 0.47, 1.95, 19.34, 4.04, 2.94, 5.06, 8.71, 48.44, 7.71]} \ No newline at end of file diff --git a/annotations_filtered/c_7V6VgIvTY_filtered.json b/annotations_filtered/c_7V6VgIvTY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..828ed569bef2e9aa9dc78d3fc44cf888f54f9a0e --- /dev/null +++ b/annotations_filtered/c_7V6VgIvTY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.26], [7.0, 8.14], [11.0, 11.87], [15.0, 18.57], [20.0, 20.49], [30.0, 33.35], [35.0, 35.75], [37.0, 38.55], [40.0, 40.83], [45.0, 44.81], [50.0, 51.12], [53.0, 53.6], [55.0, 55.7], [56.0, 57.55], [58.0, 66.46], [68.0, 71.31], [73.0, 73.47], [78.0, 78.88], [80.0, 80.08], [82.0, 84.99], [85.0, 86.85], [88.0, 93.65], [105.0, 109.46], [110.0, 118.25], [119.0, 120.95]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.9, 0.0, 92.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.95, 52.62, 0.0, 0.0, 0.0, 98.59, 0.0, 31.42, 40.99, 58.22, 0.0], "audiomae_on_audioset": [null, null, null, [["frog", 24.8], ["speech", 22.14], ["mosquito", 17.76]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.33], ["thunk", 6.78], ["livestock, farm animals, working animals", 5.88]], [["noise", 28.05], ["hum", 20.98], ["mains hum", 13.77]], null, null], "duration": [1.26, 1.14, 0.87, 3.57, 0.49, 3.35, 0.75, 1.55, 0.83, -0.19, 1.12, 0.6, 0.7, 1.55, 8.46, 3.31, 0.47, 0.88, 0.08, 2.99, 1.85, 5.65, 4.46, 8.25, 1.95]} \ No newline at end of file diff --git a/annotations_filtered/c_GNsQnPdi4_filtered.json b/annotations_filtered/c_GNsQnPdi4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb9899e229606e86b1901d86a908497b42051359 --- /dev/null +++ b/annotations_filtered/c_GNsQnPdi4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.21], [7.0, 6.93], [7.0, 7.53], [8.0, 8.92], [9.0, 9.31], [10.0, 11.45], [14.0, 29.44], [31.0, 39.06], [41.0, 41.79], [42.0, 49.08], [50.0, 49.94], [50.0, 56.37], [58.0, 61.35], [68.0, 69.25], [75.0, 75.1], [76.0, 84.28], [85.0, 93.09], [98.0, 98.76]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 60.32, 0.0, 48.27, 0.0, 42.98, 58.64, 0.0, 0.0, 43.1, 57.09, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 38.77], ["speech", 13.12], ["animal", 7.04]], null, [["animal", 33.36], ["whale vocalization", 17.0], ["wild animals", 13.61]], null, null, null, [["music", 20.75], ["noise", 7.9], ["mains hum", 6.52]], null, null], "duration": [0.21, -0.07, 0.53, 0.92, 0.31, 1.45, 15.44, 8.06, 0.79, 7.08, -0.06, 6.37, 3.35, 1.25, 0.1, 8.28, 8.09, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/c_SJMeRltkA_filtered.json b/annotations_filtered/c_SJMeRltkA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..084c3c8902445fce1459e9dc422347ab9e866427 --- /dev/null +++ b/annotations_filtered/c_SJMeRltkA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[69.0, 88.06]], "keep_status": [false], "silence_prob": [29.38], "audiomae_on_audioset": [[["speech", 67.53], ["whack, thwack", 3.32], ["fart", 2.51]]], "duration": [19.06]} \ No newline at end of file diff --git a/annotations_filtered/c_TXof1C-OI_filtered.json b/annotations_filtered/c_TXof1C-OI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ca7d23444d3ce40f56ef276eb329fe70752a192 --- /dev/null +++ b/annotations_filtered/c_TXof1C-OI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 39.51], [44.0, 87.94], [89.0, 90.12], [93.0, 93.55], [95.0, 105.33]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.9], "audiomae_on_audioset": [null, null, null, null, [["music", 60.09], ["hum", 9.57], ["throbbing", 7.66]]], "duration": [1.51, 43.94, 1.12, 0.55, 10.33]} \ No newline at end of file diff --git a/annotations_filtered/c__26Uyp5eU_filtered.json b/annotations_filtered/c__26Uyp5eU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b202aa433617f2a426d761cefb5d68f3cfc2a603 --- /dev/null +++ b/annotations_filtered/c__26Uyp5eU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.32], [6.0, 8.63], [12.0, 12.41], [13.0, 13.66], [15.0, 17.09], [19.0, 20.07], [24.0, 26.23], [27.0, 27.78], [38.0, 38.89], [40.0, 41.23], [43.0, 91.64], [94.0, 101.36], [105.0, 106.37], [107.0, 107.42], [115.0, 115.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [62.47, 99.59, 0.0, 0.0, 91.47, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0, 32.49, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 73.57], ["electronic music", 5.32], ["throbbing", 4.67]], null, null, null], "duration": [4.32, 2.63, 0.41, 0.66, 2.09, 1.07, 2.23, 0.78, 0.89, 1.23, 48.64, 7.36, 1.37, 0.42, 0.01]} \ No newline at end of file diff --git a/annotations_filtered/c_a5Y18mdLo_filtered.json b/annotations_filtered/c_a5Y18mdLo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34e8f081f8275ac7368bb86599d6d5526b63af74 --- /dev/null +++ b/annotations_filtered/c_a5Y18mdLo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.68], [5.0, 5.97], [6.0, 9.14], [10.0, 10.27], [11.0, 11.26], [12.0, 16.31], [18.0, 19.09], [30.0, 50.41], [52.0, 51.98], [53.0, 53.89], [55.0, 54.85], [55.0, 55.83], [59.0, 59.29], [60.0, 60.3], [61.0, 62.07], [62.0, 63.44], [68.0, 70.04], [71.0, 72.59], [73.0, 74.53], [78.0, 79.0], [81.0, 82.16], [83.0, 82.97], [92.0, 93.19], [95.0, 96.13], [98.0, 98.51], [99.0, 100.2], [101.0, 103.05]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 49.31, 0.0, 0.0, 61.37, 0.0, 50.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.0], "audiomae_on_audioset": [null, null, [["speech", 40.14], ["insect", 5.09], ["sidetone", 3.73]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 28.48], ["sidetone", 16.92], ["hum", 15.88]], null, null, null, null, null, null, null, null, null, null], "duration": [0.68, 0.97, 3.14, 0.27, 0.26, 4.31, 1.09, 20.41, -0.02, 0.89, -0.15, 0.83, 0.29, 0.3, 1.07, 1.44, 2.04, 1.59, 1.53, 1.0, 1.16, -0.03, 1.19, 1.13, 0.51, 1.2, 2.05]} \ No newline at end of file diff --git a/annotations_filtered/c_u4oXd_Lfo_filtered.json b/annotations_filtered/c_u4oXd_Lfo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87302d030e820917c9867396d4b2b7d19d252733 --- /dev/null +++ b/annotations_filtered/c_u4oXd_Lfo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 115.3], [118.0, 121.73], [123.0, 136.93], [138.0, 155.63], [156.0, 176.86]], "keep_status": [false, true, false, true, true], "silence_prob": [0.0, 36.18, 34.88, 33.04, 33.34], "audiomae_on_audioset": [null, [["speech", 37.31], ["music", 19.27], ["boat, water vehicle", 7.17]], [["music", 35.65], ["speech", 30.31], ["boat, water vehicle", 6.0]], [["hum", 39.17], ["music", 15.34], ["mains hum", 14.36]], [["vehicle", 28.4], ["speech", 16.22], ["car", 10.95]]], "duration": [90.3, 3.73, 13.93, 17.63, 20.86]} \ No newline at end of file diff --git a/annotations_filtered/cacjl7UwuVU_filtered.json b/annotations_filtered/cacjl7UwuVU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1727d58a13623c74dcc12f483636dcdb635a852 --- /dev/null +++ b/annotations_filtered/cacjl7UwuVU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.51], [4.0, 4.26], [9.0, 9.48], [11.0, 11.37], [27.0, 26.94], [30.0, 31.83], [35.0, 36.07]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.51, 0.26, 0.48, 0.37, -0.06, 1.83, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/cagsLW2dKTI_filtered.json b/annotations_filtered/cagsLW2dKTI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97414557b7ad1fa81e29ac739bf0aeb7081e1aed --- /dev/null +++ b/annotations_filtered/cagsLW2dKTI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[54.0, 90.71], [91.0, 91.74], [93.0, 98.78], [99.0, 99.6], [100.0, 99.82]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 73.21, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [36.71, 0.74, 5.78, 0.6, -0.18]} \ No newline at end of file diff --git a/annotations_filtered/caypUMEoKf8_filtered.json b/annotations_filtered/caypUMEoKf8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c06639dcd7638878590c5b53fb206e80f6c1cda2 --- /dev/null +++ b/annotations_filtered/caypUMEoKf8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.67], [8.0, 8.5], [10.0, 10.1], [14.0, 13.78], [17.0, 17.25], [18.0, 20.6], [21.0, 21.56], [23.0, 46.58], [47.0, 54.4], [58.0, 66.31], [66.0, 76.79], [77.0, 77.87], [79.0, 82.54], [86.0, 89.88], [90.0, 93.23], [96.0, 95.82]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 46.61, 0.0, 35.91, 31.5, 73.97, 33.48, 0.0, 80.46, 82.61, 75.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 69.97], ["sidetone", 8.37], ["radio", 5.35]], null, [["hum", 55.71], ["mains hum", 16.41], ["music", 11.9]], [["speech", 25.37], ["noise", 19.74], ["livestock, farm animals, working animals", 6.84]], null, [["speech", 29.35], ["animal", 10.69], ["livestock, farm animals, working animals", 7.22]], null, null, null, null, null], "duration": [0.67, 0.5, 0.1, -0.22, 0.25, 2.6, 0.56, 23.58, 7.4, 8.31, 10.79, 0.87, 3.54, 3.88, 3.23, -0.18]} \ No newline at end of file diff --git a/annotations_filtered/cb4dxubPYEs_filtered.json b/annotations_filtered/cb4dxubPYEs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57bff4fcad30fdbe37b380063d77581369a2048f --- /dev/null +++ b/annotations_filtered/cb4dxubPYEs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.8], [8.0, 7.96], [8.0, 8.56], [13.0, 13.27], [14.0, 14.15], [15.0, 15.65], [17.0, 18.94], [20.0, 21.29], [22.0, 22.62], [23.0, 23.26], [24.0, 24.54], [27.0, 28.21], [29.0, 30.1], [31.0, 32.98], [33.0, 33.34], [34.0, 33.86], [35.0, 35.09], [36.0, 36.49], [37.0, 37.32], [39.0, 39.31], [40.0, 41.12], [44.0, 44.25], [45.0, 45.18], [46.0, 46.87], [49.0, 50.14], [50.0, 53.79], [55.0, 55.7], [58.0, 59.29], [61.0, 61.55], [63.0, 63.48], [64.0, 65.62], [66.0, 67.49], [68.0, 76.35], [77.0, 77.25], [79.0, 79.34], [82.0, 83.1], [84.0, 97.6], [98.0, 99.67], [101.0, 101.9], [103.0, 103.65], [105.0, 106.68], [107.0, 111.87], [113.0, 114.64], [115.0, 115.37], [116.0, 116.18], [116.0, 116.58], [118.0, 118.83], [119.0, 120.7], [122.0, 122.93], [125.0, 126.2], [128.0, 129.22], [130.0, 150.35], [151.0, 152.61], [154.0, 161.64], [162.0, 164.0], [166.0, 166.19], [167.0, 168.24], [169.0, 175.15], [177.0, 178.39], [179.0, 179.25], [181.0, 181.57], [183.0, 186.39], [189.0, 190.05], [192.0, 192.08], [193.0, 193.87], [198.0, 216.41], [220.0, 228.06], [229.0, 229.78], [230.0, 233.41], [235.0, 236.61], [237.0, 238.54], [241.0, 243.03], [245.0, 245.44], [247.0, 251.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 75.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.23, 0.0, 100.0, 100.0, 0.0, 0.0, 99.87, 0.0, 0.0, 0.0, 71.0, 0.0, 0.0, 0.0, 98.01, 71.87, 0.0, 97.11, 0.0, 0.0, 78.21, 0.0, 77.2], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.8, -0.04, 0.56, 0.27, 0.15, 0.65, 1.94, 1.29, 0.62, 0.26, 0.54, 1.21, 1.1, 1.98, 0.34, -0.14, 0.09, 0.49, 0.32, 0.31, 1.12, 0.25, 0.18, 0.87, 1.14, 3.79, 0.7, 1.29, 0.55, 0.48, 1.62, 1.49, 8.35, 0.25, 0.34, 1.1, 13.6, 1.67, 0.9, 0.65, 1.68, 4.87, 1.64, 0.37, 0.18, 0.58, 0.83, 1.7, 0.93, 1.2, 1.22, 20.35, 1.61, 7.64, 2.0, 0.19, 1.24, 6.15, 1.39, 0.25, 0.57, 3.39, 1.05, 0.08, 0.87, 18.41, 8.06, 0.78, 3.41, 1.61, 1.54, 2.03, 0.44, 4.33]} \ No newline at end of file diff --git a/annotations_filtered/cbEbCrrgWiA_filtered.json b/annotations_filtered/cbEbCrrgWiA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27d95ae216563d723cb2d63795cd5f79e0db183a --- /dev/null +++ b/annotations_filtered/cbEbCrrgWiA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.99], [12.0, 13.64], [15.0, 15.9], [17.0, 18.77], [24.0, 24.7], [39.0, 38.87], [47.0, 47.97], [54.0, 53.94], [54.0, 55.61], [58.0, 62.36], [63.0, 64.02], [69.0, 75.41], [78.0, 78.56], [79.0, 81.77], [85.0, 96.45], [100.0, 100.14], [101.0, 101.22], [102.0, 102.42], [111.0, 111.69], [112.0, 113.09], [114.0, 116.63], [123.0, 124.51], [125.0, 125.19], [127.0, 126.74], [127.0, 126.96], [128.0, 128.24], [131.0, 131.33], [132.0, 132.27], [135.0, 138.67], [139.0, 140.12], [144.0, 145.3], [151.0, 150.96], [155.0, 166.53], [168.0, 172.03], [173.0, 173.87], [175.0, 176.0], [177.0, 180.81], [181.0, 183.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.17, 0.0, 36.86, 0.0, 42.86, 75.55, 0.0, 0.0, 0.0, 0.0, 0.0, 90.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.78, 0.0, 0.0, 0.0, 37.31, 84.62, 0.0, 0.0, 68.54, 46.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["hum", 26.23], ["mains hum", 16.28], ["speech", 16.15]], null, [["music", 28.69], ["hum", 14.43], ["didgeridoo", 10.37]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 62.13], ["didgeridoo", 9.28], ["musical instrument", 3.84]], null, null, null, null, [["speech", 32.79], ["busy signal", 26.07], ["sine wave", 5.9]]], "duration": [0.99, 1.64, 0.9, 1.77, 0.7, -0.13, 0.97, -0.06, 1.61, 4.36, 1.02, 6.41, 0.56, 2.77, 11.45, 0.14, 0.22, 0.42, 0.69, 1.09, 2.63, 1.51, 0.19, -0.26, -0.04, 0.24, 0.33, 0.27, 3.67, 1.12, 1.3, -0.04, 11.53, 4.03, 0.87, 1.0, 3.81, 2.05]} \ No newline at end of file diff --git a/annotations_filtered/cbH10o2VTXI_filtered.json b/annotations_filtered/cbH10o2VTXI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3ff32dc6b72acfc962b2ecba07909f70246a5d9 --- /dev/null +++ b/annotations_filtered/cbH10o2VTXI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.68], [6.0, 7.52], [9.0, 11.53], [29.0, 31.6], [36.0, 35.94], [39.0, 39.02], [42.0, 42.94], [48.0, 52.66], [64.0, 63.76], [66.0, 65.82], [66.0, 74.31], [78.0, 78.12], [80.0, 90.26], [92.0, 95.12], [117.0, 118.18], [121.0, 121.54], [129.0, 129.14], [140.0, 140.98], [143.0, 145.05], [146.0, 147.23], [150.0, 149.96], [154.0, 157.22], [161.0, 173.53]], "keep_status": [false, false, true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 39.58, 38.08, 0.0, 0.0, 0.0, 33.2, 0.0, 0.0, 41.58, 0.0, 40.93, 40.95, 0.0, 0.0, 0.0, 0.0, 46.02, 0.0, 0.0, 50.71, 33.64], "audiomae_on_audioset": [null, null, [["music", 45.54], ["hum", 14.1], ["throbbing", 8.02]], [["speech", 30.87], ["music", 19.75], ["mains hum", 12.68]], null, null, null, [["livestock, farm animals, working animals", 39.89], ["moo", 25.82], ["cattle, bovinae", 25.6]], null, null, [["music", 49.25], ["synthesizer", 7.95], ["theremin", 3.14]], null, [["speech", 38.34], ["music", 33.58], ["grunt", 8.21]], [["music", 71.97], ["speech", 7.01], ["electronic music", 1.54]], null, null, null, null, [["music", 68.72], ["ambient music", 7.23], ["hum", 4.23]], null, null, null, [["music", 65.77], ["theremin", 5.85], ["throbbing", 2.85]]], "duration": [1.68, 1.52, 2.53, 2.6, -0.06, 0.02, 0.94, 4.66, -0.24, -0.18, 8.31, 0.12, 10.26, 3.12, 1.18, 0.54, 0.14, 0.98, 2.05, 1.23, -0.04, 3.22, 12.53]} \ No newline at end of file diff --git a/annotations_filtered/cbN7TQSGYlI_filtered.json b/annotations_filtered/cbN7TQSGYlI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff8492802812db3ea1c2a5a17542c791c183b98d --- /dev/null +++ b/annotations_filtered/cbN7TQSGYlI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.12], [16.0, 16.31], [19.0, 19.6], [22.0, 23.06], [31.0, 33.67], [35.0, 37.84], [61.0, 85.56], [87.0, 124.11], [127.0, 132.63], [133.0, 133.56], [137.0, 137.05], [139.0, 144.49], [146.0, 146.99], [148.0, 152.41], [153.0, 154.5], [155.0, 158.21], [158.0, 162.19], [165.0, 166.21], [168.0, 169.48], [170.0, 170.28], [183.0, 183.74]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.76, 34.07, 32.61, 0.0, 43.69, 0.0, 0.0, 39.75, 0.0, 56.33, 0.0, 87.55, 72.9, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 34.0], ["boing", 8.67], ["whale vocalization", 6.32]], [["music", 69.93], ["boing", 16.41], ["throbbing", 1.28]], null, [["music", 83.8], ["electronic music", 1.89], ["musical instrument", 1.54]], null, null, [["music", 48.95], ["pour", 6.78], ["speech", 4.77]], null, null, null, null, null, null, null, null, null], "duration": [1.12, 0.31, 0.6, 1.06, 2.67, 2.84, 24.56, 37.11, 5.63, 0.56, 0.05, 5.49, 0.99, 4.41, 1.5, 3.21, 4.19, 1.21, 1.48, 0.28, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/cbQZ8GK2usU_filtered.json b/annotations_filtered/cbQZ8GK2usU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70274eb445bfc99839df78ec15bfeb1242599ad4 --- /dev/null +++ b/annotations_filtered/cbQZ8GK2usU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.42], [5.0, 22.79], [26.0, 29.71], [30.0, 31.36], [33.0, 42.75], [43.0, 45.03], [46.0, 65.57], [66.0, 66.6], [67.0, 67.66], [68.0, 70.63], [71.0, 70.66], [73.0, 79.39], [80.0, 82.46]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 34.6, 36.15, 0.0, 34.78, 40.62, 31.76, 0.0, 0.0, 46.79, 0.0, 51.94, 100.0], "audiomae_on_audioset": [null, [["music", 50.02], ["speech", 20.2], ["synthesizer", 8.54]], [["speech", 52.88], ["music", 16.6], ["noise", 2.17]], null, [["music", 46.03], ["throbbing", 16.61], ["hum", 12.75]], [["speech", 23.08], ["electric shaver, electric razor", 18.03], ["mains hum", 9.19]], [["music", 51.51], ["synthesizer", 10.8], ["theremin", 8.65]], null, null, [["music", 52.17], ["theremin", 9.73], ["hum", 4.78]], null, null, null], "duration": [0.42, 17.79, 3.71, 1.36, 9.75, 2.03, 19.57, 0.6, 0.66, 2.63, -0.34, 6.39, 2.46]} \ No newline at end of file diff --git a/annotations_filtered/cbzBwleJnLY_filtered.json b/annotations_filtered/cbzBwleJnLY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd621aebbaaedf272b497f0da41bb652d745dbcf --- /dev/null +++ b/annotations_filtered/cbzBwleJnLY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.48], [14.0, 17.73], [25.0, 26.37], [30.0, 31.8], [33.0, 33.12], [33.0, 34.69], [35.0, 35.41], [37.0, 37.62], [39.0, 40.1], [43.0, 43.09], [47.0, 47.31], [48.0, 58.6], [59.0, 68.82], [73.0, 73.58], [76.0, 76.54], [80.0, 81.89], [85.0, 85.4], [86.0, 86.86], [91.0, 98.56], [100.0, 102.22], [104.0, 104.06], [105.0, 105.22], [110.0, 113.75], [117.0, 125.56], [129.0, 138.7], [139.0, 155.83], [158.0, 159.73], [161.0, 164.05], [164.0, 166.02], [167.0, 167.66], [168.0, 169.59], [171.0, 172.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 55.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.94, 54.04, 0.0, 0.0, 0.0, 0.0, 0.0, 69.88, 100.0, 0.0, 0.0, 69.34, 97.92, 33.23, 73.82, 0.0, 60.7, 50.71, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.69], ["thunk", 21.42], ["explosion", 12.35]], null, null, null, null, null, null, null], "duration": [0.48, 3.73, 1.37, 1.8, 0.12, 1.69, 0.41, 0.62, 1.1, 0.09, 0.31, 10.6, 9.82, 0.58, 0.54, 1.89, 0.4, 0.86, 7.56, 2.22, 0.06, 0.22, 3.75, 8.56, 9.7, 16.83, 1.73, 3.05, 2.02, 0.66, 1.59, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/cbzkmMaYSNg_filtered.json b/annotations_filtered/cbzkmMaYSNg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3fb974746ef71a2e3050d2cd927f589325dccaf7 --- /dev/null +++ b/annotations_filtered/cbzkmMaYSNg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 18.69], [19.0, 20.33], [24.0, 25.57], [32.0, 32.9], [35.0, 38.8], [40.0, 41.77], [43.0, 43.9], [46.0, 46.38], [48.0, 48.29], [51.0, 59.22], [63.0, 63.51], [68.0, 68.69], [71.0, 71.86], [72.0, 73.84], [76.0, 78.73], [84.0, 85.23], [86.0, 87.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [66.63, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 0.0, 0.0, 53.22, 0.0, 0.0, 0.0, 0.0, 57.09, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.69, 1.33, 1.57, 0.9, 3.8, 1.77, 0.9, 0.38, 0.29, 8.22, 0.51, 0.69, 0.86, 1.84, 2.73, 1.23, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/ccH057kbWTg_filtered.json b/annotations_filtered/ccH057kbWTg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01513aa5ef606d0b0e72d407f9c05e194c436120 --- /dev/null +++ b/annotations_filtered/ccH057kbWTg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.88], [9.0, 9.69], [11.0, 12.73], [15.0, 15.5], [19.0, 22.22], [32.0, 33.61], [40.0, 42.45], [46.0, 45.99], [46.0, 47.26], [50.0, 52.37], [57.0, 57.18], [57.0, 62.34], [66.0, 67.12], [69.0, 72.86], [78.0, 80.18], [81.0, 92.47], [94.0, 96.89], [99.0, 116.77], [117.0, 116.97], [117.0, 118.45], [120.0, 131.45], [133.0, 142.03], [143.0, 144.29], [148.0, 148.24], [151.0, 152.52], [154.0, 155.8], [163.0, 164.08], [167.0, 167.66], [173.0, 173.25], [174.0, 178.12], [180.0, 180.08], [183.0, 199.42], [202.0, 203.07]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.39, 0.0, 31.61, 0.0, 0.0, 33.47, 0.0, 32.48, 0.0, 31.75, 38.9, 38.79, 44.57, 43.87, 0.0, 0.0, 30.06, 40.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.61, 0.0, 30.87, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 61.16], ["ambient music", 5.53], ["singing", 3.23]], null, [["music", 74.43], ["singing", 2.37], ["carnatic music", 2.14]], null, null, [["music", 44.46], ["double bass", 6.56], ["humming", 5.82]], null, [["music", 67.21], ["singing", 6.7], ["electronic tuner", 2.63]], null, [["music", 66.85], ["singing", 4.67], ["musical instrument", 2.7]], [["music", 42.93], ["carnatic music", 27.26], ["musical instrument", 3.34]], [["music", 56.46], ["flute", 12.95], ["theremin", 6.13]], [["music", 30.34], ["speech", 14.59], ["singing bowl", 13.34]], [["music", 64.51], ["synthesizer", 6.78], ["musical instrument", 3.63]], null, null, [["music", 45.72], ["cello", 5.69], ["theremin", 3.54]], [["music", 30.64], ["singing bowl", 16.57], ["theremin", 6.15]], null, null, null, null, null, null, null, [["music", 44.99], ["speech", 19.14], ["hum", 7.25]], null, [["music", 40.46], ["speech", 16.37], ["fly, housefly", 5.74]], null], "duration": [0.88, 0.69, 1.73, 0.5, 3.22, 1.61, 2.45, -0.01, 1.26, 2.37, 0.18, 5.34, 1.12, 3.86, 2.18, 11.47, 2.89, 17.77, -0.03, 1.45, 11.45, 9.03, 1.29, 0.24, 1.52, 1.8, 1.08, 0.66, 0.25, 4.12, 0.08, 16.42, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/ccU8NJFeBSA_filtered.json b/annotations_filtered/ccU8NJFeBSA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c4f6722a9b380f4b5a714dc2a3d29507c2bb804 --- /dev/null +++ b/annotations_filtered/ccU8NJFeBSA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[76.0, 98.54], [100.0, 101.43], [105.0, 108.33], [109.0, 112.38]], "keep_status": [true, false, false, true], "silence_prob": [32.82, 0.0, 31.97, 33.35], "audiomae_on_audioset": [[["music", 40.39], ["didgeridoo", 15.85], ["hum", 4.56]], null, [["fly, housefly", 46.08], ["insect", 26.66], ["fart", 9.27]], [["speech", 26.17], ["didgeridoo", 11.19], ["frog", 6.68]]], "duration": [22.54, 1.43, 3.33, 3.38]} \ No newline at end of file diff --git a/annotations_filtered/ccX1d19hmc8_filtered.json b/annotations_filtered/ccX1d19hmc8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bfe01ca57be69936de03ceedfde1bbf6f813cb1f --- /dev/null +++ b/annotations_filtered/ccX1d19hmc8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 45.27], [46.0, 48.68], [49.0, 50.26], [52.0, 52.51], [53.0, 53.91], [55.0, 56.24], [58.0, 58.16], [73.0, 73.23], [81.0, 82.46], [87.0, 87.42], [94.0, 100.68], [102.0, 101.95], [104.0, 104.19], [104.0, 106.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.7, 85.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92, 0.0, 0.0, 78.38], "audiomae_on_audioset": [[["music", 69.02], ["speech", 10.17], ["guitar", 2.77]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.27, 2.68, 1.26, 0.51, 0.91, 1.24, 0.16, 0.23, 1.46, 0.42, 6.68, -0.05, 0.19, 2.56]} \ No newline at end of file diff --git a/annotations_filtered/ccr0gfJ5q0I_filtered.json b/annotations_filtered/ccr0gfJ5q0I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f96600fbd0151dc867315dba717f71eca7f9e4a5 --- /dev/null +++ b/annotations_filtered/ccr0gfJ5q0I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[81.0, 82.16], [83.0, 83.54], [90.0, 94.9], [97.0, 98.96], [100.0, 100.74], [101.0, 102.52], [104.0, 104.77], [106.0, 106.07], [112.0, 113.48], [114.0, 114.71], [115.0, 115.84], [122.0, 125.52], [127.0, 127.79], [129.0, 129.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 82.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.82, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 0.54, 4.9, 1.96, 0.74, 1.52, 0.77, 0.07, 1.48, 0.71, 0.84, 3.52, 0.79, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/ccyYHEuCHKE_filtered.json b/annotations_filtered/ccyYHEuCHKE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..636791daeb714cec6413d2f56fae48d5af70a1cf --- /dev/null +++ b/annotations_filtered/ccyYHEuCHKE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 43.65], [62.0, 63.76], [88.0, 88.47], [89.0, 98.0]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.9], "audiomae_on_audioset": [null, null, null, null], "duration": [0.65, 1.76, 0.47, 9.0]} \ No newline at end of file diff --git a/annotations_filtered/cdFiubg8UnQ_filtered.json b/annotations_filtered/cdFiubg8UnQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25061066fedcace4f0c5b4305104a8cea4e8327c --- /dev/null +++ b/annotations_filtered/cdFiubg8UnQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.32], [6.0, 6.39], [6.0, 6.45], [11.0, 12.38], [19.0, 19.79], [22.0, 23.25], [26.0, 27.21], [28.0, 28.93], [31.0, 32.29], [34.0, 37.84], [42.0, 42.26], [44.0, 45.44], [49.0, 50.94], [55.0, 60.17], [63.0, 63.73], [64.0, 68.91], [70.0, 70.92], [74.0, 75.83], [81.0, 82.58], [84.0, 89.28], [92.0, 95.35], [96.0, 97.65], [100.0, 105.53], [106.0, 108.53], [109.0, 122.91], [124.0, 124.6], [130.0, 131.18], [134.0, 137.67], [140.0, 142.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [66.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.8, 0.0, 0.0, 0.0, 79.59, 0.0, 86.64, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 85.72, 96.04, 45.69, 0.0, 0.0, 68.15, 99.16], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 56.87], ["speech", 7.19], ["hum", 4.68]], null, null, null, null], "duration": [4.32, 0.39, 0.45, 1.38, 0.79, 1.25, 1.21, 0.93, 1.29, 3.84, 0.26, 1.44, 1.94, 5.17, 0.73, 4.91, 0.92, 1.83, 1.58, 5.28, 3.35, 1.65, 5.53, 2.53, 13.91, 0.6, 1.18, 3.67, 2.25]} \ No newline at end of file diff --git a/annotations_filtered/cdVMT44nWzk_filtered.json b/annotations_filtered/cdVMT44nWzk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29ce9ac2e338e38b0ace51002d18682cd5e1641b --- /dev/null +++ b/annotations_filtered/cdVMT44nWzk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.6], [22.0, 27.97], [29.0, 29.07], [30.0, 30.43], [31.0, 34.08], [40.0, 41.81], [52.0, 52.22], [60.0, 61.35], [66.0, 67.71], [68.0, 69.69], [71.0, 72.0], [73.0, 73.6], [75.0, 75.14], [76.0, 76.49], [78.0, 79.39], [80.0, 80.81], [88.0, 89.11], [90.0, 98.15], [101.0, 101.55], [104.0, 105.04], [109.0, 109.68]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 38.94, 0.0, 0.0, 37.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.43, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["breaking", 30.41], ["crack", 10.9], ["rumble", 6.45]], null, null, [["hum", 7.32], ["cattle, bovinae", 7.19], ["speech", 7.18]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 29.98], ["groan", 13.39], ["explosion", 11.99]], null, null, null], "duration": [1.6, 5.97, 0.07, 0.43, 3.08, 1.81, 0.22, 1.35, 1.71, 1.69, 1.0, 0.6, 0.14, 0.49, 1.39, 0.81, 1.11, 8.15, 0.55, 1.04, 0.68]} \ No newline at end of file diff --git a/annotations_filtered/cdaDQcs-XNQ_filtered.json b/annotations_filtered/cdaDQcs-XNQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eea8da595c00a11b0294aac03bb8d8b6236f0306 --- /dev/null +++ b/annotations_filtered/cdaDQcs-XNQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.18], [15.0, 16.07], [17.0, 20.8], [25.0, 26.59], [29.0, 30.25], [35.0, 35.29], [39.0, 40.47], [46.0, 49.1], [52.0, 55.95], [58.0, 58.85], [67.0, 71.93], [73.0, 84.92], [86.0, 88.8], [90.0, 94.95], [96.0, 98.27], [99.0, 109.21], [110.0, 111.15], [111.0, 112.01], [112.0, 118.18], [120.0, 124.95], [125.0, 127.36], [129.0, 129.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.94, 0.0, 0.0, 0.0, 0.0, 100.0, 99.99, 0.0, 47.12, 100.0, 100.0, 100.0, 100.0, 91.13, 0.0, 0.0, 99.48, 83.16, 69.34, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 75.25], ["dial tone", 6.44], ["inside, small room", 3.89]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.18, 1.07, 3.8, 1.59, 1.25, 0.29, 1.47, 3.1, 3.95, 0.85, 4.93, 11.92, 2.8, 4.95, 2.27, 10.21, 1.15, 1.01, 6.18, 4.95, 2.36, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/cdkS0TgEG30_filtered.json b/annotations_filtered/cdkS0TgEG30_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b7e8eb9e891dc84f1cb777e3cea445fbbf2cd16 --- /dev/null +++ b/annotations_filtered/cdkS0TgEG30_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[94.0, 96.01], [100.0, 103.69], [104.0, 107.81], [108.0, 114.47], [116.0, 117.02], [118.0, 118.93], [120.0, 123.79], [125.0, 127.52]], "keep_status": [false, false, true, false, false, false, false, false], "silence_prob": [35.77, 72.46, 48.48, 53.53, 0.0, 0.0, 62.07, 67.13], "audiomae_on_audioset": [[["speech", 83.89], ["telephone", 3.92], ["inside, small room", 3.33]], null, [["whale vocalization", 53.33], ["stomach rumble", 6.2], ["squish", 3.93]], null, null, null, null, null], "duration": [2.01, 3.69, 3.81, 6.47, 1.02, 0.93, 3.79, 2.52]} \ No newline at end of file diff --git a/annotations_filtered/ce5cnb_5dVk_filtered.json b/annotations_filtered/ce5cnb_5dVk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48ba0ac3e0e9d482ca9bdb93512cc72488443fee --- /dev/null +++ b/annotations_filtered/ce5cnb_5dVk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 15.09], [18.0, 22.33], [24.0, 40.76], [42.0, 45.0], [49.0, 50.16], [51.0, 54.4], [56.0, 58.19], [61.0, 61.18], [62.0, 62.43], [63.0, 63.68], [68.0, 68.59], [70.0, 71.29], [72.0, 79.86], [80.0, 80.42], [80.0, 80.45], [80.0, 80.49], [81.0, 80.52], [82.0, 81.82], [82.0, 86.7], [90.0, 90.69], [91.0, 95.22], [97.0, 99.08], [100.0, 100.72], [104.0, 104.63], [108.0, 108.63], [120.0, 120.72], [121.0, 127.3], [128.0, 131.03], [135.0, 135.84], [136.0, 138.05], [138.0, 141.52], [142.0, 142.05], [142.0, 142.1], [143.0, 146.37], [149.0, 149.42], [153.0, 155.16]], "keep_status": [true, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [49.45, 78.55, 43.05, 46.05, 0.0, 34.82, 50.71, 0.0, 0.0, 0.0, 0.0, 0.0, 49.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.67, 0.0, 64.75, 77.36, 0.0, 0.0, 0.0, 0.0, 44.2, 33.81, 0.0, 34.47, 33.22, 0.0, 0.0, 35.57, 0.0, 58.72], "audiomae_on_audioset": [[["music", 14.74], ["livestock, farm animals, working animals", 10.18], ["sidetone", 9.64]], null, [["music", 44.97], ["radio", 5.39], ["hum", 3.94]], [["hum", 36.74], ["mains hum", 32.66], ["buzz", 7.0]], null, [["music", 23.31], ["hum", 20.51], ["pulse", 8.63]], null, null, null, null, null, null, [["music", 33.24], ["hum", 25.84], ["mains hum", 13.38]], null, null, null, null, null, [["music", 32.14], ["hum", 23.77], ["throbbing", 14.73]], null, null, null, null, null, null, null, [["music", 46.75], ["didgeridoo", 35.98], ["theremin", 2.7]], [["music", 43.09], ["carnatic music", 10.0], ["musical instrument", 4.23]], null, [["music", 33.88], ["speech", 21.22], ["theremin", 11.76]], [["speech", 34.1], ["theremin", 26.89], ["music", 16.63]], null, null, [["music", 41.57], ["speech", 30.83], ["musical instrument", 3.34]], null, null], "duration": [9.09, 4.33, 16.76, 3.0, 1.16, 3.4, 2.19, 0.18, 0.43, 0.68, 0.59, 1.29, 7.86, 0.42, 0.45, 0.49, -0.48, -0.18, 4.7, 0.69, 4.22, 2.08, 0.72, 0.63, 0.63, 0.72, 6.3, 3.03, 0.84, 2.05, 3.52, 0.05, 0.1, 3.37, 0.42, 2.16]} \ No newline at end of file diff --git a/annotations_filtered/ceTBcVLeUtI_filtered.json b/annotations_filtered/ceTBcVLeUtI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb4f52c1b0a9de1dd93cfc6355f79dc804bdd53f --- /dev/null +++ b/annotations_filtered/ceTBcVLeUtI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.85], [6.0, 6.99], [9.0, 10.76], [12.0, 12.19], [16.0, 16.75], [18.0, 18.0], [18.0, 19.7], [21.0, 22.77], [23.0, 25.0], [27.0, 36.51], [44.0, 43.97], [45.0, 46.13], [48.0, 51.93], [54.0, 54.09], [56.0, 58.45], [59.0, 60.02], [61.0, 62.51], [69.0, 71.04], [72.0, 73.09], [75.0, 77.09], [82.0, 83.56], [87.0, 87.91], [90.0, 90.8], [99.0, 101.41], [102.0, 110.12]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.12, 46.61, 0.0, 0.0, 47.58, 0.0, 49.64, 0.0, 0.0, 53.28, 0.0, 52.16, 0.0, 0.0, 0.0, 50.16, 43.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 43.97], ["didgeridoo", 11.45], ["throbbing", 5.27]], [["throbbing", 47.42], ["hum", 36.42], ["music", 7.89]], null, null, [["music", 60.81], ["theremin", 17.9], ["didgeridoo", 2.77]], null, [["music", 49.67], ["hum", 21.4], ["throbbing", 10.55]], null, null, null, null, null, null, null, null, null, [["music", 59.67], ["throbbing", 13.27], ["didgeridoo", 6.03]]], "duration": [0.85, 0.99, 1.76, 0.19, 0.75, 0.0, 1.7, 1.77, 2.0, 9.51, -0.03, 1.13, 3.93, 0.09, 2.45, 1.02, 1.51, 2.04, 1.09, 2.09, 1.56, 0.91, 0.8, 2.41, 8.12]} \ No newline at end of file diff --git a/annotations_filtered/ceWNY5eNSWY_filtered.json b/annotations_filtered/ceWNY5eNSWY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10469844e7e03983aaf538fb42cc3f338b396103 --- /dev/null +++ b/annotations_filtered/ceWNY5eNSWY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.61], [11.0, 11.13], [20.0, 20.22], [22.0, 22.37], [24.0, 25.34], [28.0, 29.59], [30.0, 32.37], [40.0, 41.13], [42.0, 42.03], [50.0, 52.32], [53.0, 53.23], [55.0, 56.47], [58.0, 60.93], [64.0, 65.28], [71.0, 71.32], [73.0, 72.82], [76.0, 77.67], [96.0, 98.24], [100.0, 102.95], [105.0, 106.71], [107.0, 107.92], [112.0, 112.13], [113.0, 114.03], [117.0, 119.64], [122.0, 130.23], [131.0, 132.02], [132.0, 133.61]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 44.84, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 0.0, 37.75, 99.78, 0.0, 0.0, 0.0, 0.0, 71.29, 67.38, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 29.22], ["sine wave", 27.82], ["chirp tone", 11.34]], null, null, null, null, null, null, null, [["speech", 20.08], ["sine wave", 19.86], ["chirp tone", 11.81]], null, null, null, null, null, null, null, null, null], "duration": [1.61, 0.13, 0.22, 0.37, 1.34, 1.59, 2.37, 1.13, 0.03, 2.32, 0.23, 1.47, 2.93, 1.28, 0.32, -0.18, 1.67, 2.24, 2.95, 1.71, 0.92, 0.13, 1.03, 2.64, 8.23, 1.02, 1.61]} \ No newline at end of file diff --git a/annotations_filtered/cfB1QaweRKU_filtered.json b/annotations_filtered/cfB1QaweRKU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9c7959228ee2e1345934965b8bf5fdf2bf18ff1 --- /dev/null +++ b/annotations_filtered/cfB1QaweRKU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.53], [2.0, 1.8], [2.0, 2.0], [2.0, 3.64], [5.0, 6.72], [8.0, 9.86], [12.0, 13.2], [17.0, 19.84], [21.0, 23.36], [24.0, 64.13], [64.0, 64.96], [68.0, 75.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.82, 64.75, 0.0, 0.0, 34.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["hum", 60.16], ["throbbing", 16.5], ["mains hum", 5.22]]], "duration": [0.53, -0.2, 0.0, 1.64, 1.72, 1.86, 1.2, 2.84, 2.36, 40.13, 0.96, 7.91]} \ No newline at end of file diff --git a/annotations_filtered/cfB9siDjpLk_filtered.json b/annotations_filtered/cfB9siDjpLk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f01db1437c2e37883330a40090ce18d08bd2685 --- /dev/null +++ b/annotations_filtered/cfB9siDjpLk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.64], [4.0, 5.05], [12.0, 12.8], [14.0, 14.72], [16.0, 16.68], [18.0, 18.5], [34.0, 33.78], [34.0, 33.81], [34.0, 33.84], [34.0, 34.21], [35.0, 35.01], [40.0, 40.05], [41.0, 41.54], [43.0, 43.73], [45.0, 45.59], [47.0, 47.68], [57.0, 59.9], [64.0, 64.34], [93.0, 98.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.26, 0.0, 30.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 32.22], ["grunt", 7.67], ["animal", 7.21]], null, [["breaking", 20.0], ["whack, thwack", 17.33], ["clang", 11.48]]], "duration": [1.64, 1.05, 0.8, 0.72, 0.68, 0.5, -0.22, -0.19, -0.16, 0.21, 0.01, 0.05, 0.54, 0.73, 0.59, 0.68, 2.9, 0.34, 5.73]} \ No newline at end of file diff --git a/annotations_filtered/cfDwQbxRoEo_filtered.json b/annotations_filtered/cfDwQbxRoEo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f2558a627b1cc77918544d94f6520ddc3c94a53 --- /dev/null +++ b/annotations_filtered/cfDwQbxRoEo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.62], [30.0, 30.33], [30.0, 31.6], [36.0, 36.1], [38.0, 39.63], [44.0, 44.64], [46.0, 51.85], [58.0, 87.67], [89.0, 91.34], [98.0, 107.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.04, 39.58, 33.81, 34.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 63.15], ["theremin", 16.72], ["ambient music", 5.94]], [["music", 56.31], ["theremin", 21.29], ["musical instrument", 2.22]], [["music", 68.09], ["musical instrument", 8.95], ["clarinet", 3.73]]], "duration": [0.62, 0.33, 1.6, 0.1, 1.63, 0.64, 5.85, 29.67, 2.34, 9.77]} \ No newline at end of file diff --git a/annotations_filtered/cfILhtwu9S0_filtered.json b/annotations_filtered/cfILhtwu9S0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22ad15ce4bcf7e298434ec14c01995e293424b67 --- /dev/null +++ b/annotations_filtered/cfILhtwu9S0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 14.99], [17.0, 18.15], [19.0, 19.68], [21.0, 21.84], [22.0, 22.22], [25.0, 28.65], [30.0, 30.28], [38.0, 38.85], [42.0, 44.17], [45.0, 45.17], [46.0, 47.61], [51.0, 52.62], [54.0, 55.27], [57.0, 57.84], [58.0, 58.83], [63.0, 65.84], [67.0, 68.42], [70.0, 71.74], [74.0, 74.46], [77.0, 86.76], [88.0, 88.65], [91.0, 91.67], [95.0, 97.97], [100.0, 100.57], [107.0, 107.23], [111.0, 111.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [35.05, 0.0, 0.0, 0.0, 0.0, 84.62, 0.0, 0.0, 35.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.18, 0.0, 0.0, 0.0, 34.89, 0.0, 0.0, 31.29, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 62.84], ["musical instrument", 9.29], ["guitar", 5.53]], null, null, null, null, null, null, null, [["speech", 45.67], ["sine wave", 30.6], ["chirp tone", 5.07]], null, null, null, null, null, null, [["music", 64.48], ["synthesizer", 7.62], ["electronic music", 5.0]], null, null, null, [["music", 72.24], ["synthesizer", 9.38], ["musical instrument", 5.26]], null, null, [["vehicle", 27.37], ["race car, auto racing", 14.81], ["car", 12.56]], null, null, null], "duration": [12.99, 1.15, 0.68, 0.84, 0.22, 3.65, 0.28, 0.85, 2.17, 0.17, 1.61, 1.62, 1.27, 0.84, 0.83, 2.84, 1.42, 1.74, 0.46, 9.76, 0.65, 0.67, 2.97, 0.57, 0.23, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/cfM9_PduF3M_filtered.json b/annotations_filtered/cfM9_PduF3M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..110df285f81c19770a9963356f1666a38d093e96 --- /dev/null +++ b/annotations_filtered/cfM9_PduF3M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.8], [5.0, 4.83], [8.0, 10.03], [11.0, 13.49], [20.0, 26.72], [29.0, 67.91], [70.0, 84.47], [85.0, 86.29], [88.0, 90.98], [94.0, 98.93], [100.0, 102.57]], "keep_status": [false, false, true, true, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 43.77, 30.82, 29.84, 0.0, 29.77, 0.0, 45.3, 72.16, 75.07], "audiomae_on_audioset": [null, null, [["music", 27.47], ["fly, housefly", 6.8], ["bee, wasp, etc.", 5.8]], [["cattle, bovinae", 30.05], ["moo", 22.04], ["speech", 16.1]], [["speech", 29.62], ["music", 13.16], ["hum", 8.46]], null, [["explosion", 37.55], ["speech", 19.47], ["burst, pop", 14.62]], null, [["speech", 51.58], ["throbbing", 5.51], ["hum", 4.05]], null, null], "duration": [0.8, -0.17, 2.03, 2.49, 6.72, 38.91, 14.47, 1.29, 2.98, 4.93, 2.57]} \ No newline at end of file diff --git a/annotations_filtered/cfNzZre-sIU_filtered.json b/annotations_filtered/cfNzZre-sIU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cdce43905e9608680e4473c02054d3b932e2d2f0 --- /dev/null +++ b/annotations_filtered/cfNzZre-sIU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 26.25], [26.0, 26.28], [32.0, 32.7], [33.0, 34.57], [36.0, 36.51], [38.0, 40.22], [44.0, 47.21], [48.0, 49.3], [50.0, 50.41], [52.0, 52.32], [58.0, 58.63], [59.0, 60.44], [61.0, 61.47], [64.0, 64.32], [68.0, 69.03], [69.0, 72.94], [79.0, 83.25], [86.0, 86.41], [88.0, 88.45], [92.0, 91.83], [92.0, 105.31], [107.0, 114.81], [119.0, 130.94], [132.0, 131.94], [132.0, 138.82], [140.0, 139.97], [141.0, 142.05], [146.0, 146.87], [150.0, 154.41], [155.0, 155.58], [161.0, 161.38]], "keep_status": [true, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, true, false, false, false, true, false, false], "silence_prob": [43.51, 0.0, 0.0, 0.0, 0.0, 46.94, 40.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.76, 37.04, 0.0, 0.0, 0.0, 38.63, 37.92, 38.76, 0.0, 39.09, 0.0, 0.0, 0.0, 37.49, 0.0, 0.0], "audiomae_on_audioset": [[["music", 16.09], ["throbbing", 12.03], ["hum", 9.15]], null, null, null, null, [["speech", 20.01], ["hum", 17.36], ["music", 12.7]], [["music", 27.7], ["hum", 20.04], ["mains hum", 14.7]], null, null, null, null, null, null, null, null, [["music", 62.06], ["musical instrument", 4.38], ["guitar", 3.72]], [["music", 25.57], ["hum", 24.31], ["mains hum", 15.01]], null, null, null, [["music", 82.94], ["crackle", 3.44], ["throbbing", 1.13]], [["music", 42.46], ["hum", 11.28], ["mains hum", 9.07]], [["music", 68.63], ["theremin", 6.86], ["musical instrument", 4.08]], null, [["music", 30.98], ["mains hum", 20.2], ["hum", 17.65]], null, null, null, [["music", 45.99], ["speech", 12.1], ["musical instrument", 2.67]], null, null], "duration": [21.25, 0.28, 0.7, 1.57, 0.51, 2.22, 3.21, 1.3, 0.41, 0.32, 0.63, 1.44, 0.47, 0.32, 1.03, 3.94, 4.25, 0.41, 0.45, -0.17, 13.31, 7.81, 11.94, -0.06, 6.82, -0.03, 1.05, 0.87, 4.41, 0.58, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/cfnBcA2ckeQ_filtered.json b/annotations_filtered/cfnBcA2ckeQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1453ce3e4c869e453fe6db860e84ab6056df80fc --- /dev/null +++ b/annotations_filtered/cfnBcA2ckeQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 117.32], [123.0, 123.67], [126.0, 125.96]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [106.32, 0.67, -0.04]} \ No newline at end of file diff --git a/annotations_filtered/cg-wxqxxWs4_filtered.json b/annotations_filtered/cg-wxqxxWs4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d1bb8fa9687ee7b76cedda55a7bfbd1a55eb63b --- /dev/null +++ b/annotations_filtered/cg-wxqxxWs4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.33], [7.0, 7.69], [15.0, 15.03], [17.0, 17.51], [27.0, 27.9], [31.0, 35.6], [37.0, 38.92], [40.0, 40.71], [44.0, 45.33], [48.0, 51.0], [55.0, 55.22], [57.0, 59.83], [62.0, 64.42], [71.0, 70.85], [79.0, 89.95], [91.0, 93.18]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, true, true, false, false, false], "silence_prob": [44.46, 0.0, 0.0, 0.0, 0.0, 48.87, 0.0, 0.0, 0.0, 53.84, 0.0, 45.27, 33.5, 0.0, 31.49, 30.97], "audiomae_on_audioset": [[["music", 34.63], ["hum", 12.54], ["synthesizer", 10.07]], null, null, null, null, [["hum", 37.98], ["throbbing", 12.26], ["music", 11.74]], null, null, null, null, null, [["fart", 9.6], ["music", 8.35], ["rumble", 7.97]], [["music", 44.92], ["synthesizer", 7.19], ["hum", 5.55]], null, [["music", 52.45], ["theremin", 11.84], ["hum", 5.77]], [["music", 65.13], ["synthesizer", 5.84], ["hum", 5.41]]], "duration": [3.33, 0.69, 0.03, 0.51, 0.9, 4.6, 1.92, 0.71, 1.33, 3.0, 0.22, 2.83, 2.42, -0.15, 10.95, 2.18]} \ No newline at end of file diff --git a/annotations_filtered/cg49Y3jpZsQ_filtered.json b/annotations_filtered/cg49Y3jpZsQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2b6b0d519c05ebf829472cfd51fbc00efae5f2b --- /dev/null +++ b/annotations_filtered/cg49Y3jpZsQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.44], [10.0, 10.15], [13.0, 13.2], [18.0, 19.85], [28.0, 28.93], [31.0, 31.92], [35.0, 35.58], [37.0, 53.6], [55.0, 57.38], [58.0, 60.12], [62.0, 64.25], [71.0, 75.81], [76.0, 77.23], [78.0, 78.14], [87.0, 87.35], [90.0, 108.45], [112.0, 121.68]], "keep_status": [true, false, false, false, false, false, false, true, false, true, false, true, false, false, false, false, true], "silence_prob": [38.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.45, 31.16, 30.75, 30.0, 30.12, 0.0, 0.0, 0.0, 29.36, 37.36], "audiomae_on_audioset": [[["speech", 26.97], ["music", 21.0], ["outside, rural or natural", 4.22]], null, null, null, null, null, null, [["hum", 33.14], ["throbbing", 18.08], ["mains hum", 15.64]], [["music", 63.06], ["speech", 18.42], ["scary music", 4.1]], [["music", 31.48], ["speech", 16.01], ["moo", 6.4]], [["hum", 34.94], ["mains hum", 32.7], ["music", 12.62]], [["vehicle", 40.18], ["car", 12.17], ["race car, auto racing", 5.74]], null, null, null, [["buzz", 59.74], ["music", 23.83], ["speech", 1.99]], [["hum", 21.93], ["boing", 12.59], ["music", 10.07]]], "duration": [3.44, 0.15, 0.2, 1.85, 0.93, 0.92, 0.58, 16.6, 2.38, 2.12, 2.25, 4.81, 1.23, 0.14, 0.35, 18.45, 9.68]} \ No newline at end of file diff --git a/annotations_filtered/cg7wSv4ALRo_filtered.json b/annotations_filtered/cg7wSv4ALRo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0bff40abea282add81898e3aaddb565e0a5e8c71 --- /dev/null +++ b/annotations_filtered/cg7wSv4ALRo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.99], [15.0, 27.16], [29.0, 35.04], [35.0, 48.0]], "keep_status": [false, false, false, true], "silence_prob": [0.0, 31.71, 44.6, 34.53], "audiomae_on_audioset": [null, [["music", 64.37], ["hum", 5.72], ["throbbing", 2.55]], [["music", 38.02], ["theremin", 29.66], ["hum", 4.52]], [["music", 46.89], ["noise", 10.8], ["hum", 8.25]]], "duration": [0.99, 12.16, 6.04, 13.0]} \ No newline at end of file diff --git a/annotations_filtered/cgBAJefErZY_filtered.json b/annotations_filtered/cgBAJefErZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b573d2c07df6bd66d8af00bd56d26a1373e036d --- /dev/null +++ b/annotations_filtered/cgBAJefErZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.51], [11.0, 19.43], [21.0, 21.54], [32.0, 32.07], [33.0, 54.18], [56.0, 56.86]], "keep_status": [false, true, false, false, true, false], "silence_prob": [0.0, 30.6, 0.0, 0.0, 30.17, 0.0], "audiomae_on_audioset": [null, [["speech", 34.0], ["music", 17.19], ["hum", 16.32]], null, null, [["hum", 26.63], ["mains hum", 19.42], ["music", 13.62]], null], "duration": [0.51, 8.43, 0.54, 0.07, 21.18, 0.86]} \ No newline at end of file diff --git a/annotations_filtered/cgBz4BKSLRQ_filtered.json b/annotations_filtered/cgBz4BKSLRQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41326aa27e1feb144378a10b2e12434f7d2507e0 --- /dev/null +++ b/annotations_filtered/cgBz4BKSLRQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.48], [5.0, 6.3], [14.0, 20.22], [22.0, 22.2], [29.0, 29.49], [30.0, 31.78], [33.0, 55.81], [62.0, 61.96], [62.0, 69.7], [74.0, 76.1], [80.0, 120.31], [121.0, 123.01], [124.0, 123.94], [129.0, 129.9], [131.0, 133.12], [134.0, 134.91], [136.0, 166.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.78, 0.0, 34.51, 0.0, 0.0, 0.0, 32.15, 0.0, 32.34, 31.6, 0.0, 40.55, 0.0, 0.0, 32.26, 0.0, 0.0], "audiomae_on_audioset": [[["music", 81.77], ["throbbing", 2.94], ["synthesizer", 2.72]], null, [["music", 42.26], ["speech", 26.65], ["tabla", 3.46]], null, null, null, [["music", 63.54], ["didgeridoo", 11.72], ["speech", 2.92]], null, [["music", 76.27], ["musical instrument", 3.0], ["synthesizer", 2.97]], [["music", 47.9], ["didgeridoo", 23.93], ["speech", 12.93]], null, [["music", 40.05], ["speech", 37.47], ["sidetone", 2.79]], null, null, [["music", 44.79], ["sidetone", 22.28], ["speech", 7.14]], null, null], "duration": [2.48, 1.3, 6.22, 0.2, 0.49, 1.78, 22.81, -0.04, 7.7, 2.1, 40.31, 2.01, -0.06, 0.9, 2.12, 0.91, 30.68]} \ No newline at end of file diff --git a/annotations_filtered/cgLMSMIU124_filtered.json b/annotations_filtered/cgLMSMIU124_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a3b4ec029badd09a079aff800a700f04ca90cf8 --- /dev/null +++ b/annotations_filtered/cgLMSMIU124_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 88.57], [89.0, 90.42], [91.0, 92.5], [93.0, 96.8], [103.0, 103.44], [115.0, 114.89], [123.0, 123.94], [129.0, 129.61]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.01, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["breaking", 36.4], ["whack, thwack", 24.95], ["speech", 11.0]], null, null, null, null], "duration": [64.57, 1.42, 1.5, 3.8, 0.44, -0.11, 0.94, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/cgXTRSSX3cc_filtered.json b/annotations_filtered/cgXTRSSX3cc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13e34c088dc91b72d2a91fa86dec6992b4022a56 --- /dev/null +++ b/annotations_filtered/cgXTRSSX3cc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [6.0, 7.48], [10.0, 10.83], [13.0, 27.09], [29.0, 29.19], [37.0, 37.39], [38.0, 39.18], [42.0, 41.96], [42.0, 47.16], [48.0, 49.06], [50.0, 51.27], [52.0, 53.11], [54.0, 55.93], [56.0, 56.47], [57.0, 64.56], [68.0, 68.66], [70.0, 70.29], [76.0, 76.45], [79.0, 79.62], [81.0, 82.51], [86.0, 87.51], [89.0, 92.26], [94.0, 93.9], [97.0, 100.23], [101.0, 101.95], [107.0, 107.45], [110.0, 110.34], [116.0, 117.39]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.61, 0.0, 0.0, 0.0, 0.0, 40.82, 0.0, 0.0, 0.0, 0.0, 0.0, 37.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.08, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 52.43], ["musical instrument", 5.62], ["echo", 5.28]], null, null, null, null, [["speech", 76.76], ["hum", 10.61], ["mains hum", 2.88]], null, null, null, null, null, [["speech", 78.54], ["sidetone", 2.56], ["thunk", 2.54]], null, null, null, null, null, null, [["throbbing", 15.15], ["hum", 12.73], ["music", 11.59]], null, null, null, null, null, null], "duration": [0.5, 1.48, 0.83, 14.09, 0.19, 0.39, 1.18, -0.04, 5.16, 1.06, 1.27, 1.11, 1.93, 0.47, 7.56, 0.66, 0.29, 0.45, 0.62, 1.51, 1.51, 3.26, -0.1, 3.23, 0.95, 0.45, 0.34, 1.39]} \ No newline at end of file diff --git a/annotations_filtered/cgg9byUy-V4_filtered.json b/annotations_filtered/cgg9byUy-V4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c6a82a272a95d586522b661d980750f4df01913 --- /dev/null +++ b/annotations_filtered/cgg9byUy-V4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.14], [6.0, 6.94], [7.0, 8.14], [11.0, 12.29], [16.0, 16.11], [21.0, 22.11], [38.0, 39.68], [41.0, 41.79], [44.0, 44.79], [46.0, 46.03], [47.0, 47.53], [50.0, 51.38], [58.0, 58.33], [59.0, 59.37], [60.0, 60.37], [70.0, 70.56], [89.0, 89.97], [93.0, 93.68], [97.0, 99.13], [104.0, 104.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [55.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.16, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.14, 0.94, 1.14, 1.29, 0.11, 1.11, 1.68, 0.79, 0.79, 0.03, 0.53, 1.38, 0.33, 0.37, 0.37, 0.56, 0.97, 0.68, 2.13, 0.18]} \ No newline at end of file diff --git a/annotations_filtered/cglsMVVevx8_filtered.json b/annotations_filtered/cglsMVVevx8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f1a2c8c1b7f4e11e44b4a9889d33446d3c9c6a3 --- /dev/null +++ b/annotations_filtered/cglsMVVevx8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.38], [6.0, 9.19], [10.0, 10.0], [10.0, 11.75], [13.0, 13.0], [15.0, 14.88], [17.0, 17.42], [32.0, 32.73], [35.0, 35.24], [41.0, 42.21], [46.0, 53.05], [54.0, 67.66], [70.0, 71.73], [74.0, 75.69], [78.0, 78.54], [82.0, 84.35], [87.0, 148.22], [152.0, 154.47], [157.0, 177.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, true], "silence_prob": [0.0, 72.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.07, 39.58, 0.0, 0.0, 0.0, 34.78, 0.0, 34.12, 34.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 44.68], ["whack, thwack", 13.09], ["echo", 5.28]], null, null, null, [["music", 38.52], ["didgeridoo", 15.2], ["speech", 11.82]], null, [["trombone", 49.48], ["music", 15.02], ["brass instrument", 12.12]], [["music", 25.22], ["brass instrument", 13.64], ["trombone", 10.51]]], "duration": [0.38, 3.19, 0.0, 1.75, 0.0, -0.12, 0.42, 0.73, 0.24, 1.21, 7.05, 13.66, 1.73, 1.69, 0.54, 2.35, 61.22, 2.47, 20.06]} \ No newline at end of file diff --git a/annotations_filtered/cgoMJXAmLdc_filtered.json b/annotations_filtered/cgoMJXAmLdc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96855a8343c74b7d4c7785f72d6e971b23ae8f4f --- /dev/null +++ b/annotations_filtered/cgoMJXAmLdc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.82], [10.0, 10.52], [11.0, 11.77], [12.0, 25.83], [26.0, 27.13], [31.0, 33.62], [36.0, 36.31], [39.0, 39.83], [44.0, 45.18]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [69.2, 0.0, 0.0, 81.89, 0.0, 75.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [2.82, 0.52, 0.77, 13.83, 1.13, 2.62, 0.31, 0.83, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/cgogH0SylMc_filtered.json b/annotations_filtered/cgogH0SylMc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c18d3587e9572a12a0e15743dd65d28d11113da3 --- /dev/null +++ b/annotations_filtered/cgogH0SylMc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.34], [24.0, 24.41], [29.0, 29.44], [33.0, 33.62], [34.0, 36.56], [37.0, 40.29], [44.0, 44.0], [48.0, 63.37], [64.0, 64.15], [64.0, 64.25], [65.0, 65.99], [67.0, 67.41], [68.0, 69.92], [73.0, 74.76], [77.0, 79.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 83.34, 89.36, 0.0, 98.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.34, 0.41, 0.44, 0.62, 2.56, 3.29, 0.0, 15.37, 0.15, 0.25, 0.99, 0.41, 1.92, 1.76, 2.22]} \ No newline at end of file diff --git a/annotations_filtered/ch6zVPr6lWM_filtered.json b/annotations_filtered/ch6zVPr6lWM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de35c44a350033d252cab520b5312af90a4ae094 --- /dev/null +++ b/annotations_filtered/ch6zVPr6lWM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.16], [23.0, 25.24], [26.0, 27.01], [28.0, 29.47], [31.0, 32.16], [33.0, 39.83], [47.0, 49.96], [57.0, 57.52], [63.0, 63.21], [67.0, 68.93], [70.0, 71.29], [72.0, 81.16], [85.0, 86.0], [92.0, 94.85], [97.0, 97.92], [100.0, 99.87], [101.0, 104.65], [107.0, 107.15], [108.0, 109.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 87.0, 0.0, 0.0, 0.0, 64.29, 48.39, 0.0, 0.0, 0.0, 0.0, 76.2, 0.0, 97.54, 0.0, 0.0, 95.78, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 63.88], ["eruption", 8.1], ["hum", 3.5]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.16, 2.24, 1.01, 1.47, 1.16, 6.83, 2.96, 0.52, 0.21, 1.93, 1.29, 9.16, 1.0, 2.85, 0.92, -0.13, 3.65, 0.15, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/chBVj94zYDM_filtered.json b/annotations_filtered/chBVj94zYDM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..afc0d12afe292027bca23d46e8bdee1804a1f06a --- /dev/null +++ b/annotations_filtered/chBVj94zYDM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.66], [16.0, 17.14], [24.0, 24.04], [25.0, 26.35], [34.0, 35.14], [36.0, 36.41], [36.0, 48.98], [50.0, 51.33], [54.0, 54.89], [57.0, 57.69], [61.0, 61.91], [63.0, 63.36], [65.0, 66.12], [69.0, 70.36], [74.0, 75.57], [78.0, 78.68], [81.0, 82.83], [88.0, 89.06], [89.0, 89.5], [90.0, 91.03], [95.0, 95.0], [101.0, 101.28], [106.0, 105.95], [114.0, 116.53], [117.0, 118.42], [119.0, 119.25], [123.0, 124.19], [126.0, 126.54], [128.0, 128.7]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [40.5, 0.0, 0.0, 0.0, 0.0, 0.0, 75.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 32.44], ["speech", 16.46], ["noise", 5.47]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.66, 1.14, 0.04, 1.35, 1.14, 0.41, 12.98, 1.33, 0.89, 0.69, 0.91, 0.36, 1.12, 1.36, 1.57, 0.68, 1.83, 1.06, 0.5, 1.03, 0.0, 0.28, -0.05, 2.53, 1.42, 0.25, 1.19, 0.54, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/ch_JeDyNaFM_filtered.json b/annotations_filtered/ch_JeDyNaFM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9ccd4a7ecca2b4560cd47dafa263a68a59b1e1d --- /dev/null +++ b/annotations_filtered/ch_JeDyNaFM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 21.59], [23.0, 38.06], [39.0, 176.57], [177.0, 178.41], [180.0, 184.6], [185.0, 191.71], [193.0, 196.01], [197.0, 198.93], [202.0, 202.53], [206.0, 227.37], [230.0, 233.58], [235.0, 235.38], [237.0, 237.52], [242.0, 243.4]], "keep_status": [false, false, false, false, false, true, false, false, false, true, true, false, false, false], "silence_prob": [29.58, 29.64, 0.0, 0.0, 40.07, 39.07, 53.28, 0.0, 0.0, 30.31, 38.76, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 47.54], ["throbbing", 34.45], ["mains hum", 8.52]], [["hum", 45.1], ["speech", 19.74], ["mains hum", 10.4]], null, null, [["hum", 35.0], ["throbbing", 18.06], ["mains hum", 17.11]], [["speech", 28.21], ["livestock, farm animals, working animals", 22.33], ["rumble", 8.05]], null, null, null, [["hum", 18.13], ["mains hum", 17.85], ["scary music", 16.32]], [["grunt", 20.06], ["music", 10.28], ["groan", 10.14]], null, null, null], "duration": [19.59, 15.06, 137.57, 1.41, 4.6, 6.71, 3.01, 1.93, 0.53, 21.37, 3.58, 0.38, 0.52, 1.4]} \ No newline at end of file diff --git a/annotations_filtered/chlwxs2dfVA_filtered.json b/annotations_filtered/chlwxs2dfVA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd05bb4932315b09423144a103b0606b926c62e5 --- /dev/null +++ b/annotations_filtered/chlwxs2dfVA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 9.53], [11.0, 12.43], [13.0, 16.11], [17.0, 17.74], [19.0, 20.11], [21.0, 23.41], [25.0, 28.92], [30.0, 30.97], [33.0, 35.01], [36.0, 35.83], [36.0, 37.05], [39.0, 39.29], [40.0, 41.23], [43.0, 42.97], [44.0, 44.9], [46.0, 46.68], [49.0, 49.84], [51.0, 53.67], [55.0, 58.92], [60.0, 60.47], [61.0, 61.82], [63.0, 64.44], [65.0, 66.41], [69.0, 70.24], [73.0, 74.76], [76.0, 77.45], [78.0, 80.47], [81.0, 82.76], [84.0, 85.19], [86.0, 87.3], [89.0, 90.34], [91.0, 93.14], [95.0, 96.79], [98.0, 99.47], [100.0, 102.74], [104.0, 119.08], [120.0, 142.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [54.23, 0.0, 88.64, 0.0, 0.0, 95.78, 83.16, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.43, 96.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.23, 0.0, 0.0, 0.0, 0.0, 92.15, 0.0, 0.0, 96.77, 38.93, 36.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 38.41], ["theremin", 37.57], ["gong", 2.49]], [["music", 48.75], ["theremin", 39.21], ["musical instrument", 3.81]]], "duration": [9.53, 1.43, 3.11, 0.74, 1.11, 2.41, 3.92, 0.97, 2.01, -0.17, 1.05, 0.29, 1.23, -0.03, 0.9, 0.68, 0.84, 2.67, 3.92, 0.47, 0.82, 1.44, 1.41, 1.24, 1.76, 1.45, 2.47, 1.76, 1.19, 1.3, 1.34, 2.14, 1.79, 1.47, 2.74, 15.08, 22.2]} \ No newline at end of file diff --git a/annotations_filtered/chvjkV0jRh8_filtered.json b/annotations_filtered/chvjkV0jRh8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d159e311fc1b6335f3ce17cba084a6676cf363cc --- /dev/null +++ b/annotations_filtered/chvjkV0jRh8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.21], [13.0, 21.02], [23.0, 28.24], [29.0, 31.16], [33.0, 47.01], [48.0, 68.35], [70.0, 69.9], [70.0, 70.97], [72.0, 72.28], [75.0, 75.42], [76.0, 78.9], [80.0, 81.65], [84.0, 83.94], [87.0, 88.01], [92.0, 94.83], [95.0, 97.46], [98.0, 98.58], [100.0, 99.81], [101.0, 100.99], [101.0, 105.39], [106.0, 112.55], [114.0, 114.32], [115.0, 117.58], [120.0, 123.33], [124.0, 125.27], [127.0, 127.08], [128.0, 129.36], [130.0, 131.38], [132.0, 143.99], [145.0, 146.31], [147.0, 148.39], [149.0, 150.42], [153.0, 171.48]], "keep_status": [true, true, false, true, false, true, false, false, false, false, true, false, false, false, true, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [33.01, 35.77, 38.45, 37.16, 33.71, 48.61, 0.0, 0.0, 0.0, 0.0, 45.65, 0.0, 0.0, 0.0, 35.57, 32.18, 0.0, 0.0, 0.0, 33.54, 31.84, 0.0, 31.59, 29.47, 0.0, 0.0, 0.0, 0.0, 32.84, 0.0, 0.0, 0.0, 30.98], "audiomae_on_audioset": [[["music", 46.29], ["theremin", 17.0], ["double bass", 6.44]], [["music", 45.33], ["double bass", 9.05], ["musical instrument", 7.2]], [["music", 61.69], ["theremin", 9.15], ["guitar", 4.02]], [["music", 50.01], ["foghorn", 10.19], ["ambient music", 3.74]], [["music", 83.31], ["musical instrument", 2.97], ["theremin", 2.81]], [["music", 45.03], ["double bass", 10.93], ["cello", 8.92]], null, null, null, null, [["music", 47.78], ["didgeridoo", 8.99], ["musical instrument", 7.88]], null, null, null, [["music", 50.77], ["theremin", 9.6], ["synthesizer", 5.18]], [["double bass", 28.89], ["music", 25.71], ["cello", 17.05]], null, null, null, [["music", 51.2], ["cello", 8.52], ["double bass", 8.22]], [["music", 38.13], ["cello", 25.3], ["double bass", 12.31]], null, [["cello", 33.88], ["music", 26.16], ["double bass", 12.63]], [["music", 46.98], ["musical instrument", 12.14], ["bowed string instrument", 10.4]], null, null, null, null, [["music", 58.56], ["musical instrument", 6.18], ["violin, fiddle", 5.83]], null, null, null, [["music", 64.28], ["throbbing", 5.87], ["hum", 5.13]]], "duration": [8.21, 8.02, 5.24, 2.16, 14.01, 20.35, -0.1, 0.97, 0.28, 0.42, 2.9, 1.65, -0.06, 1.01, 2.83, 2.46, 0.58, -0.19, -0.01, 4.39, 6.55, 0.32, 2.58, 3.33, 1.27, 0.08, 1.36, 1.38, 11.99, 1.31, 1.39, 1.42, 18.48]} \ No newline at end of file diff --git a/annotations_filtered/ciL0tWi56tM_filtered.json b/annotations_filtered/ciL0tWi56tM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c99c2eb2788e89cbadc12cbc4c95590f494602f --- /dev/null +++ b/annotations_filtered/ciL0tWi56tM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.6], [10.0, 20.07], [22.0, 23.7], [25.0, 90.19], [100.0, 118.99], [120.0, 120.56], [123.0, 141.57], [143.0, 149.25], [149.0, 150.6], [157.0, 165.4], [167.0, 168.59], [169.0, 180.03]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 43.77, 0.0, 0.0, 31.37, 0.0, 46.09, 30.0, 0.0, 31.28, 0.0, 31.94], "audiomae_on_audioset": [null, [["speech", 38.05], ["sheep", 9.52], ["bleat", 6.84]], null, null, [["music", 45.56], ["speech", 28.14], ["boing", 1.84]], null, [["whale vocalization", 99.52], ["gurgling", 0.12], ["music", 0.05]], [["speech", 43.69], ["music", 21.36], ["vehicle", 7.0]], null, [["speech", 38.32], ["music", 30.56], ["hubbub, speech noise, speech babble", 3.9]], null, [["speech", 48.37], ["foghorn", 18.95], ["music", 14.66]]], "duration": [1.6, 10.07, 1.7, 65.19, 18.99, 0.56, 18.57, 6.25, 1.6, 8.4, 1.59, 11.03]} \ No newline at end of file diff --git a/annotations_filtered/ciWBzhmOC_o_filtered.json b/annotations_filtered/ciWBzhmOC_o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1f1a611c3178f5bd8c310e548b57ddec72b3941 --- /dev/null +++ b/annotations_filtered/ciWBzhmOC_o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.86], [12.0, 13.15], [15.0, 15.4], [18.0, 18.35], [19.0, 20.46], [23.0, 23.48], [36.0, 36.75], [43.0, 43.83], [45.0, 45.6], [47.0, 47.7], [56.0, 58.75], [62.0, 63.88], [68.0, 69.47], [70.0, 70.28], [70.0, 71.51], [73.0, 76.82], [81.0, 85.19], [94.0, 101.87], [104.0, 105.34], [112.0, 111.65], [112.0, 112.43], [115.0, 117.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.01, 0.0, 0.0, 0.0, 0.0, 66.15, 62.27, 61.87, 0.0, 0.0, 0.0, 62.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.86, 1.15, 0.4, 0.35, 1.46, 0.48, 0.75, 0.83, 0.6, 0.7, 2.75, 1.88, 1.47, 0.28, 1.51, 3.82, 4.19, 7.87, 1.34, -0.35, 0.43, 2.41]} \ No newline at end of file diff --git a/annotations_filtered/cibZY1GwVQg_filtered.json b/annotations_filtered/cibZY1GwVQg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba5e9254cb788e8ece7fe313a8eea6e6704bad3a --- /dev/null +++ b/annotations_filtered/cibZY1GwVQg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.99], [6.0, 6.51], [9.0, 8.9], [14.0, 14.64], [19.0, 19.26], [25.0, 26.05], [27.0, 28.38], [30.0, 36.09], [38.0, 38.96], [43.0, 44.64], [51.0, 51.12], [53.0, 53.03], [53.0, 54.38], [55.0, 58.13], [59.0, 60.81], [61.0, 62.88], [63.0, 63.02], [63.0, 63.36], [64.0, 64.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.37, 0.0, 0.0, 0.0, 0.0, 0.0, 68.54, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.01, 0.51, -0.1, 0.64, 0.26, 1.05, 1.38, 6.09, 0.96, 1.64, 0.12, 0.03, 1.38, 3.13, 1.81, 1.88, 0.02, 0.36, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/cigrbhwjTnI_filtered.json b/annotations_filtered/cigrbhwjTnI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/cigrbhwjTnI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/cil6HFXlccw_filtered.json b/annotations_filtered/cil6HFXlccw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..204b4007982dd2cc4ef30ed6b729e1b952173c26 --- /dev/null +++ b/annotations_filtered/cil6HFXlccw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 41.39]], "keep_status": [true], "silence_prob": [32.94], "audiomae_on_audioset": [[["music", 34.72], ["speech", 12.69], ["vehicle", 10.06]]], "duration": [20.39]} \ No newline at end of file diff --git a/annotations_filtered/cio6rIbCs-I_filtered.json b/annotations_filtered/cio6rIbCs-I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba4a15b5fce4223112f50ad5a693afa52d330a5d --- /dev/null +++ b/annotations_filtered/cio6rIbCs-I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.32], [10.0, 10.61], [11.0, 12.41], [15.0, 15.69], [17.0, 22.64], [23.0, 24.38], [25.0, 27.08], [29.0, 29.56], [31.0, 31.58], [33.0, 33.47], [35.0, 36.26], [37.0, 37.61], [39.0, 39.41], [40.0, 45.74], [47.0, 47.53], [48.0, 49.06], [50.0, 50.5], [51.0, 53.47], [54.0, 54.4], [55.0, 55.95], [57.0, 64.52], [69.0, 69.42], [71.0, 72.17], [73.0, 75.36], [76.0, 81.6], [87.0, 87.47], [91.0, 95.54], [96.0, 108.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false], "silence_prob": [50.36, 0.0, 0.0, 0.0, 49.5, 0.0, 42.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.18, 0.0, 0.0, 0.0, 84.43, 0.0, 0.0, 45.05, 0.0, 0.0, 35.94, 46.79, 0.0, 58.13, 98.01], "audiomae_on_audioset": [null, null, null, null, [["mains hum", 66.63], ["hum", 16.37], ["clang", 1.12]], null, [["sidetone", 67.92], ["speech", 17.44], ["dial tone", 2.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.48], ["didgeridoo", 23.61], ["noise", 4.98]], null, null, [["speech", 34.53], ["sidetone", 19.53], ["music", 12.33]], [["sidetone", 24.85], ["noise", 21.9], ["mains hum", 11.23]], null, null, null], "duration": [2.32, 0.61, 1.41, 0.69, 5.64, 1.38, 2.08, 0.56, 0.58, 0.47, 1.26, 0.61, 0.41, 5.74, 0.53, 1.06, 0.5, 2.47, 0.4, 0.95, 7.52, 0.42, 1.17, 2.36, 5.6, 0.47, 4.54, 12.94]} \ No newline at end of file diff --git a/annotations_filtered/cj5Mp68u2tY_filtered.json b/annotations_filtered/cj5Mp68u2tY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f2804ae57f68028ac4becb48832afac311f2bb2 --- /dev/null +++ b/annotations_filtered/cj5Mp68u2tY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[109.0, 108.94], [110.0, 110.61], [111.0, 125.31]], "keep_status": [false, false, true], "silence_prob": [0.0, 0.0, 30.55], "audiomae_on_audioset": [null, null, [["music", 52.73], ["livestock, farm animals, working animals", 9.23], ["cattle, bovinae", 5.87]]], "duration": [-0.06, 0.61, 14.31]} \ No newline at end of file diff --git a/annotations_filtered/cjFIi3PC2cI_filtered.json b/annotations_filtered/cjFIi3PC2cI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f3b1b2e9ca48b016401f744291beab709e5c36e --- /dev/null +++ b/annotations_filtered/cjFIi3PC2cI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.16]], "keep_status": [false], "silence_prob": [83.52], "audiomae_on_audioset": [null], "duration": [3.16]} \ No newline at end of file diff --git a/annotations_filtered/cjS-Y6WsWMg_filtered.json b/annotations_filtered/cjS-Y6WsWMg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8f65f735daa0e61271dd3c067ff0b07ea6d53e1 --- /dev/null +++ b/annotations_filtered/cjS-Y6WsWMg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.65], [4.0, 15.96], [18.0, 18.37], [22.0, 27.14], [27.0, 28.29], [33.0, 33.13], [34.0, 54.01], [55.0, 63.17], [67.0, 67.69], [75.0, 77.46], [81.0, 124.28], [127.0, 127.84], [129.0, 131.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [80.29, 68.67, 0.0, 80.64, 0.0, 0.0, 69.2, 70.02, 0.0, 92.8, 0.0, 0.0, 44.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 43.03], ["speech", 28.43], ["snicker", 3.6]]], "duration": [2.65, 11.96, 0.37, 5.14, 1.29, 0.13, 20.01, 8.17, 0.69, 2.46, 43.28, 0.84, 2.04]} \ No newline at end of file diff --git a/annotations_filtered/cjkkKO5Gsno_filtered.json b/annotations_filtered/cjkkKO5Gsno_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd4fc1e469d97fa522e8d0de0ae8a73ed3ff9390 --- /dev/null +++ b/annotations_filtered/cjkkKO5Gsno_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 28.49], [30.0, 30.27], [34.0, 45.03]], "keep_status": [false, false, true], "silence_prob": [30.24, 0.0, 30.95], "audiomae_on_audioset": [[["mains hum", 27.22], ["speech", 26.37], ["hum", 16.91]], null, [["speech", 38.16], ["hum", 10.59], ["electric shaver, electric razor", 9.36]]], "duration": [9.49, 0.27, 11.03]} \ No newline at end of file diff --git a/annotations_filtered/cjy-8dXBljk_filtered.json b/annotations_filtered/cjy-8dXBljk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0dc239f8981bba2ae5eed6949420c3df986adef --- /dev/null +++ b/annotations_filtered/cjy-8dXBljk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[108.0, 118.13], [120.0, 123.3], [126.0, 126.98], [129.0, 132.16], [133.0, 133.95], [136.0, 143.46], [144.0, 146.3], [147.0, 147.6], [149.0, 149.84]], "keep_status": [true, true, false, true, false, true, true, false, false], "silence_prob": [29.26, 30.66, 0.0, 29.09, 0.0, 29.54, 33.85, 0.0, 0.0], "audiomae_on_audioset": [[["music", 11.76], ["vehicle", 11.51], ["air horn, truck horn", 9.85]], [["mains hum", 30.28], ["hum", 19.42], ["throbbing", 18.45]], null, [["mains hum", 20.0], ["speech", 17.53], ["buzz", 10.84]], null, [["fly, housefly", 9.89], ["music", 6.55], ["electric shaver, electric razor", 6.46]], [["speech", 41.68], ["music", 8.78], ["vehicle", 6.68]], null, null], "duration": [10.13, 3.3, 0.98, 3.16, 0.95, 7.46, 2.3, 0.6, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/cjyqWsrpQAA_filtered.json b/annotations_filtered/cjyqWsrpQAA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c4080b768bbb3a0b04eddf8e34d58d90b4fcbd2 --- /dev/null +++ b/annotations_filtered/cjyqWsrpQAA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.94], [9.0, 10.12], [11.0, 11.6], [13.0, 22.08], [24.0, 24.63], [27.0, 28.76], [30.0, 30.97], [32.0, 32.37], [34.0, 37.72], [44.0, 44.95], [47.0, 48.2]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 38.45, 0.0, 0.0, 0.0, 0.0, 33.43, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["whip", 63.87], ["speech", 11.17], ["slap, smack", 4.0]], null, null, null, null, [["crushing", 30.35], ["door", 9.77], ["smash, crash", 5.85]], null, null], "duration": [0.94, 1.12, 0.6, 9.08, 0.63, 1.76, 0.97, 0.37, 3.72, 0.95, 1.2]} \ No newline at end of file diff --git a/annotations_filtered/ckAD2sg5SxQ_filtered.json b/annotations_filtered/ckAD2sg5SxQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc335eeee6efd4e378473f1987adf3cd17ffd38e --- /dev/null +++ b/annotations_filtered/ckAD2sg5SxQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.17], [6.0, 5.93], [8.0, 8.31], [14.0, 14.74], [26.0, 28.73], [29.0, 29.86], [40.0, 39.8], [41.0, 41.1], [43.0, 44.17], [52.0, 52.61], [54.0, 54.45], [55.0, 56.07], [56.0, 57.16], [58.0, 58.24], [60.0, 60.61], [62.0, 62.8], [64.0, 65.16], [67.0, 67.68], [73.0, 73.31], [75.0, 75.95], [87.0, 87.25], [88.0, 88.33], [89.0, 90.54], [91.0, 91.88], [93.0, 93.55], [95.0, 95.22], [97.0, 97.55], [100.0, 99.96], [103.0, 103.45], [106.0, 105.95], [107.0, 107.67], [110.0, 110.66], [112.0, 111.84], [113.0, 113.24], [115.0, 115.25], [117.0, 117.54], [118.0, 119.06], [120.0, 121.1], [122.0, 122.64], [123.0, 123.69], [125.0, 125.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 69.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.17, -0.07, 0.31, 0.74, 2.73, 0.86, -0.2, 0.1, 1.17, 0.61, 0.45, 1.07, 1.16, 0.24, 0.61, 0.8, 1.16, 0.68, 0.31, 0.95, 0.25, 0.33, 1.54, 0.88, 0.55, 0.22, 0.55, -0.04, 0.45, -0.05, 0.67, 0.66, -0.16, 0.24, 0.25, 0.54, 1.06, 1.1, 0.64, 0.69, 0.86]} \ No newline at end of file diff --git a/annotations_filtered/ckjDSzjU-cQ_filtered.json b/annotations_filtered/ckjDSzjU-cQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d928f20d53336cb0d450ecfbf5a6a6f0ea2988c5 --- /dev/null +++ b/annotations_filtered/ckjDSzjU-cQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.8], [7.0, 7.86], [9.0, 12.29], [13.0, 16.34], [17.0, 21.39], [23.0, 25.05], [27.0, 34.74], [35.0, 37.29], [39.0, 40.86], [41.0, 49.54], [51.0, 54.67], [55.0, 59.0], [60.0, 67.14], [71.0, 88.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 87.74, 82.25, 94.52, 55.04, 69.34, 59.42, 0.0, 50.66, 81.35, 47.74, 47.08, 29.76], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 41.71], ["theremin", 12.71], ["synthesizer", 5.28]], [["music", 50.76], ["speech", 30.7], ["caw", 2.36]], [["music", 34.31], ["ding", 10.35], ["doorbell", 9.52]]], "duration": [1.8, 0.86, 3.29, 3.34, 4.39, 2.05, 7.74, 2.29, 1.86, 8.54, 3.67, 4.0, 7.14, 17.28]} \ No newline at end of file diff --git a/annotations_filtered/cku1N8eCUlo_filtered.json b/annotations_filtered/cku1N8eCUlo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8e9b48acc3ad5f27d6ff61bfb63f5f0efa864ae --- /dev/null +++ b/annotations_filtered/cku1N8eCUlo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.11], [10.0, 13.24], [23.0, 66.24]], "keep_status": [false, false, false], "silence_prob": [83.52, 75.07, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [2.11, 3.24, 43.24]} \ No newline at end of file diff --git a/annotations_filtered/clDZPzwANeE_filtered.json b/annotations_filtered/clDZPzwANeE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..687d557bcb88540b969fa05884c7474c21cfd4a9 --- /dev/null +++ b/annotations_filtered/clDZPzwANeE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.91], [11.0, 10.88], [11.0, 19.63], [22.0, 28.92], [33.0, 33.45], [34.0, 36.41], [36.0, 38.33], [41.0, 46.99], [48.0, 50.25], [52.0, 55.32], [57.0, 59.31], [60.0, 61.37], [68.0, 68.67], [71.0, 71.69], [73.0, 78.07], [81.0, 82.38], [84.0, 86.44], [89.0, 93.46], [96.0, 98.76], [111.0, 118.35]], "keep_status": [false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 46.5, 74.13, 0.0, 45.85, 43.45, 47.31, 62.68, 94.52, 70.44, 0.0, 0.0, 0.0, 39.28, 0.0, 76.2, 83.16, 97.54, 37.69], "audiomae_on_audioset": [null, null, [["speech", 77.13], ["hum", 3.05], ["whale vocalization", 1.87]], null, null, [["music", 25.88], ["hum", 16.26], ["throbbing", 11.31]], [["speech", 57.13], ["music", 5.12], ["inside, small room", 3.65]], [["sidetone", 26.77], ["speech", 23.75], ["dishes, pots, and pans", 6.38]], null, null, null, null, null, null, [["speech", 69.31], ["synthesizer", 6.61], ["music", 5.06]], null, null, null, null, [["thunk", 35.81], ["crushing", 14.65], ["hum", 5.17]]], "duration": [0.91, -0.12, 8.63, 6.92, 0.45, 2.41, 2.33, 5.99, 2.25, 3.32, 2.31, 1.37, 0.67, 0.69, 5.07, 1.38, 2.44, 4.46, 2.76, 7.35]} \ No newline at end of file diff --git a/annotations_filtered/clTG6sYtJig_filtered.json b/annotations_filtered/clTG6sYtJig_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e5b43340a704214a1aafbd1cf43e4768e99324f --- /dev/null +++ b/annotations_filtered/clTG6sYtJig_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.87], [19.0, 21.34], [23.0, 24.12], [26.0, 28.0], [33.0, 35.56], [37.0, 38.08], [41.0, 41.99], [48.0, 50.77], [52.0, 53.64], [55.0, 57.0], [58.0, 64.27], [66.0, 66.7], [68.0, 69.42], [71.0, 72.84], [74.0, 75.88], [77.0, 81.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 96.29, 0.0, 99.71, 100.0, 0.0, 0.0, 99.8, 0.0, 99.99, 99.8, 0.0, 0.0, 0.0, 0.0, 99.71], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.87, 2.34, 1.12, 2.0, 2.56, 1.08, 0.99, 2.77, 1.64, 2.0, 6.27, 0.7, 1.42, 1.84, 1.88, 4.95]} \ No newline at end of file diff --git a/annotations_filtered/clr6zsehoTg_filtered.json b/annotations_filtered/clr6zsehoTg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a6924f3d988a3c3183f39a0a42c4149342e524a --- /dev/null +++ b/annotations_filtered/clr6zsehoTg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.35], [11.0, 11.03], [14.0, 14.76], [15.0, 15.63], [24.0, 23.73], [29.0, 30.47], [31.0, 32.81], [36.0, 38.48], [43.0, 43.9], [53.0, 54.18], [54.0, 55.38], [65.0, 65.48], [66.0, 66.85], [74.0, 74.51], [79.0, 79.07], [86.0, 85.85], [88.0, 88.42], [91.0, 91.4], [92.0, 93.43], [94.0, 96.21], [98.0, 100.65], [102.0, 103.94], [104.0, 106.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.97, 49.36, 0.0, 36.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 23.03], ["hum", 18.05], ["music", 12.42]], [["music", 37.9], ["speech", 11.76], ["hum", 7.5]], null, [["speech", 34.29], ["music", 25.69], ["hum", 5.41]]], "duration": [0.35, 0.03, 0.76, 0.63, -0.27, 1.47, 1.81, 2.48, 0.9, 1.18, 1.38, 0.48, 0.85, 0.51, 0.07, -0.15, 0.42, 0.4, 1.43, 2.21, 2.65, 1.94, 2.35]} \ No newline at end of file diff --git a/annotations_filtered/cm1NBLlRxy0_filtered.json b/annotations_filtered/cm1NBLlRxy0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..062e3cf24b90a569a4bc6c64b90ecaae24b77bd4 --- /dev/null +++ b/annotations_filtered/cm1NBLlRxy0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.71], [24.0, 27.16], [27.0, 27.24], [27.0, 30.0], [42.0, 42.53], [45.0, 45.28], [46.0, 46.79], [68.0, 68.37], [72.0, 72.39], [77.0, 87.89], [96.0, 96.3], [97.0, 104.45], [105.0, 105.46], [120.0, 120.33], [121.0, 122.1], [122.0, 151.97], [167.0, 167.21], [171.0, 180.77], [193.0, 194.51], [195.0, 197.9], [206.0, 207.17], [208.0, 213.66], [217.0, 217.17], [219.0, 226.4]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.16, 30.33, 0.0, 30.5, 0.0, 0.0, 0.0, 0.0, 0.0, 33.98, 0.0, 30.88, 0.0, 0.0, 0.0, 29.52, 0.0, 29.55, 0.0, 30.09, 0.0, 30.4, 0.0, 30.76], "audiomae_on_audioset": [[["music", 43.12], ["speech", 19.45], ["didgeridoo", 5.13]], [["moo", 23.47], ["cattle, bovinae", 22.23], ["music", 17.13]], null, [["music", 63.54], ["speech", 6.33], ["didgeridoo", 5.39]], null, null, null, null, null, [["music", 70.66], ["didgeridoo", 7.98], ["speech", 5.99]], null, [["music", 36.34], ["speech", 25.7], ["cattle, bovinae", 3.82]], null, null, null, [["cattle, bovinae", 31.2], ["moo", 28.85], ["livestock, farm animals, working animals", 14.51]], null, [["cattle, bovinae", 30.2], ["moo", 27.6], ["music", 15.16]], null, [["didgeridoo", 43.92], ["music", 26.04], ["musical instrument", 4.6]], null, [["music", 61.19], ["musical instrument", 4.88], ["didgeridoo", 4.49]], null, [["music", 55.89], ["didgeridoo", 12.62], ["synthesizer", 5.62]]], "duration": [4.71, 3.16, 0.24, 3.0, 0.53, 0.28, 0.79, 0.37, 0.39, 10.89, 0.3, 7.45, 0.46, 0.33, 1.1, 29.97, 0.21, 9.77, 1.51, 2.9, 1.17, 5.66, 0.17, 7.4]} \ No newline at end of file diff --git a/annotations_filtered/cmBN-X701Gg_filtered.json b/annotations_filtered/cmBN-X701Gg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f70e4de6f8eed9cec1c911d80bb49eeab547010 --- /dev/null +++ b/annotations_filtered/cmBN-X701Gg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.49], [11.0, 13.42], [15.0, 15.96], [18.0, 20.11], [22.0, 24.29], [27.0, 34.91], [36.0, 36.26], [38.0, 38.8], [40.0, 41.4], [44.0, 44.14], [46.0, 46.35], [50.0, 50.65], [53.0, 53.52], [56.0, 56.89], [58.0, 58.51], [60.0, 63.51], [66.0, 72.54], [76.0, 76.54], [77.0, 77.48], [80.0, 81.43], [82.0, 85.16], [86.0, 86.24], [89.0, 89.83], [91.0, 92.55], [93.0, 94.58], [97.0, 97.87], [108.0, 109.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [90.78, 99.31, 0.0, 100.0, 99.97, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.21, 86.09, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.49, 2.42, 0.96, 2.11, 2.29, 7.91, 0.26, 0.8, 1.4, 0.14, 0.35, 0.65, 0.52, 0.89, 0.51, 3.51, 6.54, 0.54, 0.48, 1.43, 3.16, 0.24, 0.83, 1.55, 1.58, 0.87, 1.73]} \ No newline at end of file diff --git a/annotations_filtered/cmYsRcLMvO8_filtered.json b/annotations_filtered/cmYsRcLMvO8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..908a12c837024a3e549963d519835e1c84886f37 --- /dev/null +++ b/annotations_filtered/cmYsRcLMvO8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 23.95], [25.0, 73.97], [75.0, 90.51], [91.0, 91.64], [93.0, 95.74], [96.0, 96.79], [98.0, 101.02], [106.0, 108.06], [109.0, 110.05], [111.0, 118.18], [121.0, 152.71], [153.0, 153.87], [158.0, 179.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 99.48, 0.0, 99.96, 0.0, 98.99, 81.71, 0.0, 99.93, 0.0, 0.0, 81.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.95, 48.97, 15.51, 0.64, 2.74, 0.79, 3.02, 2.06, 1.05, 7.18, 31.71, 0.87, 21.68]} \ No newline at end of file diff --git a/annotations_filtered/cmgeSY8YdO4_filtered.json b/annotations_filtered/cmgeSY8YdO4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c812e170d18137ddb1634f77761dc29b4b76bc7d --- /dev/null +++ b/annotations_filtered/cmgeSY8YdO4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.25], [16.0, 16.36], [21.0, 22.03], [25.0, 25.76], [35.0, 34.82], [37.0, 40.15], [46.0, 48.15], [49.0, 50.23], [52.0, 52.73], [59.0, 59.98], [62.0, 62.78], [64.0, 63.9], [79.0, 78.87], [80.0, 81.24], [83.0, 84.18], [85.0, 86.31], [87.0, 87.1], [88.0, 90.09], [104.0, 107.42], [108.0, 108.38], [112.0, 112.62], [113.0, 113.7], [115.0, 116.13], [117.0, 119.64], [123.0, 137.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 38.09, 90.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.56, 38.49, 0.0, 0.0, 0.0, 0.0, 97.92, 50.61], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 60.43], ["dishes, pots, and pans", 8.02], ["sidetone", 5.77]], null, null, null, null, null, null, null, null, null, null, null, [["music", 33.15], ["speech", 27.88], ["guitar", 2.38]], [["speech", 17.02], ["fart", 14.88], ["fireworks", 6.54]], null, null, null, null, null, null], "duration": [1.25, 0.36, 1.03, 0.76, -0.18, 3.15, 2.15, 1.23, 0.73, 0.98, 0.78, -0.1, -0.13, 1.24, 1.18, 1.31, 0.1, 2.09, 3.42, 0.38, 0.62, 0.7, 1.13, 2.64, 14.46]} \ No newline at end of file diff --git a/annotations_filtered/cmkZeTX5fq0_filtered.json b/annotations_filtered/cmkZeTX5fq0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..15d1b7f01fd5e913adcd902d3a5cf91ec6fd6bf8 --- /dev/null +++ b/annotations_filtered/cmkZeTX5fq0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.5], [21.0, 22.62], [31.0, 35.58], [40.0, 41.84], [62.0, 170.61], [174.0, 174.12], [177.0, 179.39], [185.0, 188.52], [190.0, 190.49], [191.0, 191.57], [192.0, 192.64], [195.0, 197.68], [198.0, 199.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.8, 0.0, 0.0, 0.0, 99.96, 89.72, 0.0, 0.0, 0.0, 98.8, 0.0], "audiomae_on_audioset": [null, null, [["music", 63.97], ["didgeridoo", 13.24], ["electronic music", 1.79]], null, null, null, null, null, null, null, null, null, null], "duration": [1.5, 1.62, 4.58, 1.84, 108.61, 0.12, 2.39, 3.52, 0.49, 0.57, 0.64, 2.68, 1.84]} \ No newline at end of file diff --git a/annotations_filtered/cmlELkvVPeQ_filtered.json b/annotations_filtered/cmlELkvVPeQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de697dafdebe46f643f4c4dcfe94b700b29769bd --- /dev/null +++ b/annotations_filtered/cmlELkvVPeQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.13], [5.0, 5.14], [9.0, 9.39], [11.0, 11.94], [33.0, 33.05], [39.0, 39.82], [49.0, 48.64], [49.0, 51.14], [51.0, 53.43], [54.0, 55.71], [66.0, 66.55], [68.0, 67.85], [72.0, 74.71], [75.0, 75.68], [80.0, 81.11], [86.0, 87.08], [89.0, 88.74], [94.0, 94.44], [100.0, 99.91], [122.0, 123.35], [127.0, 127.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.77, 89.72, 0.0, 0.0, 0.0, 51.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.13, 0.14, 0.39, 0.94, 0.05, 0.82, -0.36, 2.14, 2.43, 1.71, 0.55, -0.15, 2.71, 0.68, 1.11, 1.08, -0.26, 0.44, -0.09, 1.35, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/cmtXA6x6Jm4_filtered.json b/annotations_filtered/cmtXA6x6Jm4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa5564cf0bf71b6d69b1264f909de8c2493afd03 --- /dev/null +++ b/annotations_filtered/cmtXA6x6Jm4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 17.37], [19.0, 19.62], [20.0, 20.66], [21.0, 24.66], [27.0, 27.51], [28.0, 35.9], [38.0, 39.66], [41.0, 40.88], [47.0, 48.59], [51.0, 51.31], [52.0, 52.08], [54.0, 69.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.3, 0.0, 0.0, 99.8, 0.0, 95.37, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.37, 0.62, 0.66, 3.66, 0.51, 7.9, 1.66, -0.12, 1.59, 0.31, 0.08, 15.09]} \ No newline at end of file diff --git a/annotations_filtered/cn35LhT9zBg_filtered.json b/annotations_filtered/cn35LhT9zBg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..337ebe0c0ccf71547bb07143e20f525a1352afcc --- /dev/null +++ b/annotations_filtered/cn35LhT9zBg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 31.6], [32.0, 59.16], [60.0, 61.1], [65.0, 78.65], [82.0, 82.44], [83.0, 83.51], [84.0, 91.25], [94.0, 95.1], [97.0, 98.71], [102.0, 105.81], [109.0, 111.18], [114.0, 117.04]], "keep_status": [true, true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [35.31, 29.49, 0.0, 30.4, 0.0, 0.0, 33.08, 0.0, 0.0, 39.5, 99.99, 30.02], "audiomae_on_audioset": [[["music", 31.28], ["electric shaver, electric razor", 11.27], ["livestock, farm animals, working animals", 5.55]], [["speech", 34.45], ["music", 21.04], ["gong", 3.54]], null, [["hum", 37.88], ["throbbing", 28.06], ["music", 15.15]], null, null, [["speech", 39.61], ["music", 6.74], ["theremin", 6.54]], null, null, [["speech", 52.81], ["beatboxing", 16.77], ["music", 2.37]], null, [["explosion", 44.99], ["burst, pop", 22.74], ["breaking", 4.75]]], "duration": [14.6, 27.16, 1.1, 13.65, 0.44, 0.51, 7.25, 1.1, 1.71, 3.81, 2.18, 3.04]} \ No newline at end of file diff --git a/annotations_filtered/cnM9pdjp5o4_filtered.json b/annotations_filtered/cnM9pdjp5o4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ceba763c3ba280bab7f5c2cfcb4ddd4f481b0d1 --- /dev/null +++ b/annotations_filtered/cnM9pdjp5o4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.22], [4.0, 5.76], [6.0, 6.59], [14.0, 21.1], [30.0, 37.25], [45.0, 52.89], [54.0, 61.08], [62.0, 65.4], [69.0, 76.86], [79.0, 79.32], [86.0, 85.9], [90.0, 91.1]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.45, 31.55, 36.11, 33.11, 32.23, 37.5, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["ding", 55.17], ["music", 15.44], ["speech", 15.02]], [["music", 81.36], ["boing", 1.52], ["funny music", 1.1]], [["music", 80.27], ["funk", 2.14], ["singing", 1.08]], [["music", 75.09], ["firecracker", 4.18], ["speech", 2.57]], [["music", 26.43], ["mosquito", 22.62], ["cattle, bovinae", 8.23]], [["music", 80.94], ["speech", 7.24], ["boing", 1.83]], null, null, null], "duration": [0.22, 1.76, 0.59, 7.1, 7.25, 7.89, 7.08, 3.4, 7.86, 0.32, -0.1, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/cnQEo4bazIo_filtered.json b/annotations_filtered/cnQEo4bazIo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7111919e3aa90e09b64cbf8109fe07a73b9ce938 --- /dev/null +++ b/annotations_filtered/cnQEo4bazIo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.07], [9.0, 17.12], [20.0, 20.07], [20.0, 20.11], [20.0, 20.14], [20.0, 30.57], [31.0, 34.18], [36.0, 37.03], [38.0, 75.17], [84.0, 91.34]], "keep_status": [false, false, false, false, false, false, true, false, false, true], "silence_prob": [95.51, 57.17, 0.0, 0.0, 0.0, 39.63, 31.2, 0.0, 0.0, 35.44], "audiomae_on_audioset": [null, null, null, null, null, [["music", 49.68], ["snicker", 29.27], ["chuckle, chortle", 2.61]], [["music", 40.03], ["speech", 10.56], ["whack, thwack", 7.03]], null, null, [["music", 38.74], ["speech", 22.76], ["foghorn", 3.93]]], "duration": [2.07, 8.12, 0.07, 0.11, 0.14, 10.57, 3.18, 1.03, 37.17, 7.34]} \ No newline at end of file diff --git a/annotations_filtered/cneoNgk9dhM_filtered.json b/annotations_filtered/cneoNgk9dhM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85d9784ac934578d8f459a8723f0fa690481b597 --- /dev/null +++ b/annotations_filtered/cneoNgk9dhM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 18.82], [21.0, 36.41], [40.0, 63.49], [64.0, 66.46], [68.0, 99.37]], "keep_status": [true, false, false, false, false], "silence_prob": [28.63, 28.88, 28.66, 28.8, 0.0], "audiomae_on_audioset": [[["music", 36.76], ["theremin", 6.0], ["mains hum", 5.56]], [["hum", 39.01], ["mains hum", 37.4], ["music", 8.37]], [["noise", 48.4], ["music", 22.07], ["mains hum", 2.86]], [["zipper (clothing)", 34.3], ["music", 31.36], ["didgeridoo", 5.4]], null], "duration": [9.82, 15.41, 23.49, 2.46, 31.37]} \ No newline at end of file diff --git a/annotations_filtered/cniwN1YsUW8_filtered.json b/annotations_filtered/cniwN1YsUW8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..859d9a13bd7f3ac5ab5acc174c3901cb73758b1e --- /dev/null +++ b/annotations_filtered/cniwN1YsUW8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 34.08], [37.0, 45.6], [48.0, 57.33], [60.0, 70.5], [82.0, 86.02], [87.0, 87.74], [92.0, 113.59], [115.0, 117.0], [120.0, 131.41], [136.0, 136.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.08, 29.95, 28.97, 29.09, 30.84, 0.0, 29.3, 31.49, 29.24, 0.0], "audiomae_on_audioset": [[["speech", 39.1], ["music", 26.85], ["hum", 8.23]], [["music", 45.02], ["speech", 31.16], ["vehicle", 3.23]], [["music", 73.3], ["throbbing", 4.3], ["electronic music", 3.88]], [["speech", 49.51], ["music", 29.46], ["hum", 4.15]], [["music", 35.53], ["speech", 30.96], ["hum", 6.18]], null, [["music", 62.21], ["hum", 8.48], ["mains hum", 7.21]], [["music", 36.56], ["throbbing", 24.67], ["hum", 19.88]], [["music", 63.07], ["electronic music", 6.96], ["trance music", 6.1]], null], "duration": [6.08, 8.6, 9.33, 10.5, 4.02, 0.74, 21.59, 2.0, 11.41, 0.02]} \ No newline at end of file diff --git a/annotations_filtered/cnvdC5TGc3g_filtered.json b/annotations_filtered/cnvdC5TGc3g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/cnvdC5TGc3g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/cnwddNSgakk_filtered.json b/annotations_filtered/cnwddNSgakk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1631a2ffab3b25ce518046fcba444b3c9926d880 --- /dev/null +++ b/annotations_filtered/cnwddNSgakk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.85], [21.0, 21.69], [25.0, 26.03], [28.0, 36.1], [38.0, 37.96], [50.0, 52.54], [56.0, 72.13], [74.0, 74.55], [75.0, 76.0], [81.0, 81.62], [89.0, 89.26], [91.0, 94.8], [104.0, 104.53], [115.0, 115.8], [130.0, 141.4], [143.0, 143.43], [144.0, 145.49], [149.0, 157.82], [161.0, 166.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.3, 0.0, 45.43, 30.07, 0.0, 0.0, 0.0, 0.0, 30.65, 0.0, 0.0, 30.27, 0.0, 0.0, 33.08, 31.21], "audiomae_on_audioset": [null, null, null, [["music", 62.36], ["synthesizer", 9.93], ["musical instrument", 4.73]], null, [["music", 52.67], ["synthesizer", 19.51], ["musical instrument", 10.73]], [["music", 55.38], ["synthesizer", 15.71], ["theremin", 13.32]], null, null, null, null, [["sidetone", 19.04], ["music", 12.08], ["speech", 11.06]], null, null, [["music", 49.04], ["hum", 12.63], ["theremin", 6.2]], null, null, [["music", 76.7], ["synthesizer", 5.44], ["sampler", 3.25]], [["music", 69.01], ["synthesizer", 8.99], ["musical instrument", 8.38]]], "duration": [1.85, 0.69, 1.03, 8.1, -0.04, 2.54, 16.13, 0.55, 1.0, 0.62, 0.26, 3.8, 0.53, 0.8, 11.4, 0.43, 1.49, 8.82, 5.09]} \ No newline at end of file diff --git a/annotations_filtered/coDtzN6bXAM_filtered.json b/annotations_filtered/coDtzN6bXAM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08691b7051f9386cab7dc54ee605633536411573 --- /dev/null +++ b/annotations_filtered/coDtzN6bXAM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.43], [9.0, 16.9], [18.0, 22.0], [25.0, 27.92], [28.0, 34.43], [36.0, 37.44], [39.0, 39.9], [43.0, 43.38], [54.0, 56.84], [58.0, 58.36], [67.0, 67.46], [69.0, 69.87], [77.0, 81.5], [82.0, 82.88], [86.0, 86.32], [92.0, 92.85], [96.0, 97.39], [98.0, 98.96], [103.0, 107.32], [110.0, 112.04], [115.0, 116.31], [122.0, 123.96], [126.0, 126.67], [128.0, 130.3], [131.0, 138.59]], "keep_status": [true, false, true, true, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [46.22, 54.43, 36.23, 33.67, 38.74, 0.0, 0.0, 0.0, 42.02, 0.0, 0.0, 0.0, 43.15, 0.0, 0.0, 0.0, 0.0, 0.0, 35.94, 44.52, 0.0, 0.0, 0.0, 36.72, 39.04], "audiomae_on_audioset": [[["music", 23.17], ["speech", 12.37], ["hum", 11.89]], null, [["hum", 25.23], ["mains hum", 13.02], ["chirp tone", 9.5]], [["speech", 26.64], ["howl", 24.66], ["animal", 12.37]], [["speech", 56.99], ["music", 7.74], ["animal", 7.42]], null, null, null, [["music", 24.72], ["sidetone", 13.59], ["throbbing", 12.59]], null, null, null, [["music", 51.39], ["whale vocalization", 6.63], ["musical instrument", 6.24]], null, null, null, null, null, [["music", 57.93], ["speech", 13.26], ["synthesizer", 6.07]], [["music", 55.31], ["synthesizer", 10.34], ["hum", 4.09]], null, null, null, [["music", 58.93], ["speech", 17.8], ["mains hum", 5.47]], [["music", 36.84], ["hum", 14.97], ["throbbing", 10.09]]], "duration": [2.43, 7.9, 4.0, 2.92, 6.43, 1.44, 0.9, 0.38, 2.84, 0.36, 0.46, 0.87, 4.5, 0.88, 0.32, 0.85, 1.39, 0.96, 4.32, 2.04, 1.31, 1.96, 0.67, 2.3, 7.59]} \ No newline at end of file diff --git a/annotations_filtered/coOguh0UhcY_filtered.json b/annotations_filtered/coOguh0UhcY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca29262d248fba21bc3427db131b9e85f4936cb5 --- /dev/null +++ b/annotations_filtered/coOguh0UhcY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 72.42], [73.0, 73.41], [74.0, 74.21], [75.0, 75.17], [76.0, 78.92], [80.0, 82.95], [84.0, 85.01], [86.0, 91.96], [94.0, 94.09], [95.0, 95.72], [98.0, 98.54], [101.0, 101.65], [104.0, 105.24], [108.0, 108.09], [108.0, 108.6], [109.0, 110.66], [111.0, 111.97], [113.0, 130.2], [133.0, 133.51], [135.0, 134.79], [136.0, 136.44], [137.0, 141.78]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 41.07, 99.96, 0.0, 55.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.66, 0.0, 0.0, 0.0, 33.62], "audiomae_on_audioset": [null, null, null, null, [["fart", 38.5], ["creak", 20.85], ["sound effect", 10.43]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 19.07], ["sidetone", 13.07], ["didgeridoo", 11.39]], null, null, null, [["speech", 19.31], ["roar", 10.88], ["animal", 5.82]]], "duration": [53.42, 0.41, 0.21, 0.17, 2.92, 2.95, 1.01, 5.96, 0.09, 0.72, 0.54, 0.65, 1.24, 0.09, 0.6, 1.66, 0.97, 17.2, 0.51, -0.21, 0.44, 4.78]} \ No newline at end of file diff --git a/annotations_filtered/coWFeBI9XoQ_filtered.json b/annotations_filtered/coWFeBI9XoQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da6d8ed68810a3fca4862b74da968d1db72e429c --- /dev/null +++ b/annotations_filtered/coWFeBI9XoQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 28.22], [33.0, 89.36]], "keep_status": [false, false], "silence_prob": [59.96, 0.0], "audiomae_on_audioset": [null, null], "duration": [3.22, 56.36]} \ No newline at end of file diff --git a/annotations_filtered/coeU38xEhVU_filtered.json b/annotations_filtered/coeU38xEhVU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcd4daa81f0210beca14faa82235d2ad3cba4ad4 --- /dev/null +++ b/annotations_filtered/coeU38xEhVU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.67], [6.0, 5.8], [9.0, 9.12], [11.0, 12.61], [13.0, 13.76], [23.0, 24.12], [25.0, 26.72], [37.0, 38.2], [40.0, 47.41], [49.0, 76.28], [77.0, 113.81], [115.0, 120.46], [126.0, 137.93], [139.0, 143.78], [144.0, 145.57], [147.0, 148.26], [149.0, 151.07]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.21, 30.95, 0.0, 31.49, 30.48, 38.03, 0.0, 0.0, 47.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 45.23], ["speech", 21.56], ["theremin", 13.6]], [["cattle, bovinae", 32.44], ["music", 16.22], ["moo", 12.98]], null, [["music", 53.5], ["didgeridoo", 10.14], ["speech", 6.77]], [["music", 44.86], ["speech", 13.36], ["didgeridoo", 7.53]], [["music", 22.84], ["throbbing", 21.74], ["hum", 17.92]], null, null, [["speech", 27.61], ["heart sounds, heartbeat", 3.92], ["eruption", 2.78]]], "duration": [1.67, -0.2, 0.12, 1.61, 0.76, 1.12, 1.72, 1.2, 7.41, 27.28, 36.81, 5.46, 11.93, 4.78, 1.57, 1.26, 2.07]} \ No newline at end of file diff --git a/annotations_filtered/corlGzKJqAc_filtered.json b/annotations_filtered/corlGzKJqAc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..662a133168a969b982296bc6fd18e58a5fc0c3cb --- /dev/null +++ b/annotations_filtered/corlGzKJqAc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.7], [12.0, 13.41], [15.0, 15.43], [20.0, 20.61], [24.0, 24.66], [27.0, 28.04], [30.0, 30.77], [37.0, 37.77], [40.0, 40.81], [43.0, 43.78], [45.0, 46.38], [48.0, 48.54], [53.0, 53.84], [59.0, 59.37], [67.0, 68.62], [71.0, 71.49], [75.0, 76.38], [87.0, 86.88], [90.0, 90.53], [95.0, 95.82], [97.0, 98.05], [101.0, 101.17], [105.0, 105.63], [109.0, 110.22], [113.0, 112.97], [115.0, 117.53], [119.0, 119.2], [121.0, 121.73], [137.0, 138.0], [150.0, 152.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.51, 0.0, 0.0, 0.0, 38.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.97], ["thunk", 11.39], ["wind instrument, woodwind instrument", 8.2]]], "duration": [0.7, 1.41, 0.43, 0.61, 0.66, 1.04, 0.77, 0.77, 0.81, 0.78, 1.38, 0.54, 0.84, 0.37, 1.62, 0.49, 1.38, -0.12, 0.53, 0.82, 1.05, 0.17, 0.63, 1.22, -0.03, 2.53, 0.2, 0.73, 1.0, 2.95]} \ No newline at end of file diff --git a/annotations_filtered/cpO3ALFscmQ_filtered.json b/annotations_filtered/cpO3ALFscmQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ca12c824309fb38cd9f03375808957eb16bf30c --- /dev/null +++ b/annotations_filtered/cpO3ALFscmQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.9], [12.0, 23.14], [27.0, 26.82], [28.0, 35.9], [37.0, 37.99], [39.0, 38.92], [40.0, 40.68], [43.0, 46.68], [47.0, 62.45], [63.0, 62.95]], "keep_status": [false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 34.68, 0.0, 71.0, 0.0, 0.0, 0.0, 33.44, 32.37, 0.0], "audiomae_on_audioset": [null, [["music", 68.16], ["throbbing", 8.85], ["synthesizer", 4.29]], null, null, null, null, null, [["music", 52.91], ["throbbing", 9.38], ["synthesizer", 7.95]], [["music", 30.38], ["gong", 24.69], ["speech", 10.03]], null], "duration": [0.9, 11.14, -0.18, 7.9, 0.99, -0.08, 0.68, 3.68, 15.45, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/cpQQpn89mEs_filtered.json b/annotations_filtered/cpQQpn89mEs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b91000cb4602be82eeeb62d3e91b5b38afa1dafe --- /dev/null +++ b/annotations_filtered/cpQQpn89mEs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 11.85], [13.0, 13.54], [26.0, 29.05], [30.0, 31.62], [35.0, 40.2], [41.0, 41.91], [46.0, 51.71], [54.0, 57.23], [58.0, 59.39], [61.0, 62.97], [64.0, 64.67], [66.0, 70.41], [71.0, 72.13], [74.0, 74.49], [78.0, 78.36], [81.0, 82.76], [84.0, 104.72], [106.0, 114.1], [115.0, 125.1], [126.0, 129.09]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, true, true, true], "silence_prob": [0.0, 0.0, 80.64, 0.0, 41.26, 0.0, 79.07, 76.53, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0, 0.0, 0.0, 32.04, 32.52, 33.08, 30.42], "audiomae_on_audioset": [null, null, null, null, [["breaking", 41.64], ["music", 14.27], ["speech", 13.1]], null, null, null, null, null, null, null, null, null, null, null, [["whack, thwack", 27.31], ["breaking", 23.76], ["smash, crash", 4.98]], [["animal", 26.64], ["livestock, farm animals, working animals", 19.28], ["wild animals", 18.15]], [["speech", 23.38], ["music", 15.91], ["grunt", 8.52]], [["music", 34.95], ["speech", 17.02], ["sound effect", 3.22]]], "duration": [-0.15, 0.54, 3.05, 1.62, 5.2, 0.91, 5.71, 3.23, 1.39, 1.97, 0.67, 4.41, 1.13, 0.49, 0.36, 1.76, 20.72, 8.1, 10.1, 3.09]} \ No newline at end of file diff --git a/annotations_filtered/cpZIiyp8juU_filtered.json b/annotations_filtered/cpZIiyp8juU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c1bfc646a708f24c5383df5c4001b95513d8dfd --- /dev/null +++ b/annotations_filtered/cpZIiyp8juU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.19], [7.0, 18.89], [21.0, 26.28], [27.0, 27.09], [33.0, 139.19], [145.0, 153.86], [155.0, 162.06], [162.0, 170.58], [172.0, 171.98], [173.0, 174.75], [178.0, 190.24], [192.0, 205.63]], "keep_status": [false, true, true, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 33.28, 30.3, 0.0, 0.0, 30.35, 29.74, 29.94, 0.0, 0.0, 30.0, 30.63], "audiomae_on_audioset": [null, [["hum", 22.29], ["music", 19.68], ["didgeridoo", 19.06]], [["speech", 52.53], ["didgeridoo", 8.49], ["hum", 7.17]], null, null, [["moo", 39.07], ["cattle, bovinae", 24.98], ["livestock, farm animals, working animals", 18.14]], [["music", 46.7], ["didgeridoo", 19.03], ["speech", 11.47]], [["music", 65.47], ["didgeridoo", 12.23], ["speech", 7.81]], null, null, [["mains hum", 28.93], ["hum", 22.97], ["music", 17.3]], [["speech", 21.5], ["cattle, bovinae", 10.83], ["music", 9.82]]], "duration": [0.19, 11.89, 5.28, 0.09, 106.19, 8.86, 7.06, 8.58, -0.02, 1.75, 12.24, 13.63]} \ No newline at end of file diff --git a/annotations_filtered/cqD8XBONBHY_filtered.json b/annotations_filtered/cqD8XBONBHY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aee1971b8c4179744416f487477473b4f0210739 --- /dev/null +++ b/annotations_filtered/cqD8XBONBHY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.02], [10.0, 22.92], [25.0, 37.84], [41.0, 45.08], [45.0, 46.18], [47.0, 47.61], [49.0, 88.32], [103.0, 107.05], [108.0, 114.13], [115.0, 150.84], [152.0, 159.19], [163.0, 164.64], [173.0, 173.69], [175.0, 175.07]], "keep_status": [false, true, false, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 41.38, 34.85, 36.79, 0.0, 0.0, 0.0, 38.98, 48.1, 0.0, 31.89, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 29.41], ["music", 20.23], ["throbbing", 8.01]], [["music", 59.01], ["throbbing", 14.15], ["electronic music", 6.23]], [["music", 71.96], ["musical instrument", 5.73], ["effects unit", 3.97]], null, null, null, [["music", 37.87], ["synthesizer", 7.96], ["musical instrument", 5.76]], [["music", 26.42], ["synthesizer", 17.23], ["theremin", 7.1]], null, [["speech", 50.65], ["music", 14.22], ["sound effect", 5.9]], null, null, null], "duration": [1.02, 12.92, 12.84, 4.08, 1.18, 0.61, 39.32, 4.05, 6.13, 35.84, 7.19, 1.64, 0.69, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/cqHKducp4MY_filtered.json b/annotations_filtered/cqHKducp4MY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f6c8c2ee5ec0b85d3cbbc0d45f7cc11a9c532c9 --- /dev/null +++ b/annotations_filtered/cqHKducp4MY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.01]], "keep_status": [false], "silence_prob": [32.98], "audiomae_on_audioset": [[["throbbing", 46.47], ["hum", 32.59], ["music", 10.29]]], "duration": [3.01]} \ No newline at end of file diff --git a/annotations_filtered/cqOc4yl1bIw_filtered.json b/annotations_filtered/cqOc4yl1bIw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd8cc6dc827e440a13ad61d0657597b403866403 --- /dev/null +++ b/annotations_filtered/cqOc4yl1bIw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.44], [19.0, 21.44], [23.0, 24.76], [27.0, 30.82], [33.0, 33.59], [34.0, 35.18], [36.0, 37.71], [40.0, 65.67], [66.0, 65.94], [75.0, 75.66], [77.0, 77.04], [81.0, 80.94], [90.0, 91.49], [98.0, 98.66], [103.0, 106.07], [110.0, 110.39], [113.0, 113.48], [116.0, 121.93], [123.0, 123.72], [131.0, 131.28], [132.0, 132.87], [134.0, 136.22], [142.0, 147.36]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 80.29, 0.0, 69.88, 0.0, 0.0, 0.0, 31.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.8, 0.0, 0.0, 35.57, 0.0, 0.0, 0.0, 63.85, 50.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["gunshot, gunfire", 39.07], ["artillery fire", 9.51], ["music", 5.98]], null, null, null, null, null, null, [["hum", 50.88], ["mains hum", 11.23], ["throbbing", 11.18]], null, null, [["crushing", 69.46], ["speech", 8.9], ["sidetone", 5.5]], null, null, null, null, null], "duration": [1.44, 2.44, 1.76, 3.82, 0.59, 1.18, 1.71, 25.67, -0.06, 0.66, 0.04, -0.06, 1.49, 0.66, 3.07, 0.39, 0.48, 5.93, 0.72, 0.28, 0.87, 2.22, 5.36]} \ No newline at end of file diff --git a/annotations_filtered/cqiQmO5frrE_filtered.json b/annotations_filtered/cqiQmO5frrE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b3904bc03e8c9b12806e28cc0eaffb54430c20e --- /dev/null +++ b/annotations_filtered/cqiQmO5frrE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.38], [3.0, 3.52], [4.0, 24.9], [29.0, 46.13], [49.0, 49.91], [52.0, 52.49], [53.0, 61.94], [64.0, 106.79], [109.0, 110.51], [115.0, 116.51]], "keep_status": [false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 34.25, 36.41, 0.0, 0.0, 33.97, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 84.08], ["speech", 6.1], ["drum machine", 3.4]], [["music", 60.99], ["sidetone", 10.95], ["speech", 10.45]], null, null, [["music", 47.08], ["boing", 14.52], ["speech", 4.45]], null, null, null], "duration": [0.38, 0.52, 20.9, 17.13, 0.91, 0.49, 8.94, 42.79, 1.51, 1.51]} \ No newline at end of file diff --git a/annotations_filtered/cqpvoIx9wbw_filtered.json b/annotations_filtered/cqpvoIx9wbw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/cqpvoIx9wbw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/cr13B4L-5-M_filtered.json b/annotations_filtered/cr13B4L-5-M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8cd6f9ce82c8d02fa12c1bb2c6f17e8a71082197 --- /dev/null +++ b/annotations_filtered/cr13B4L-5-M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 16.11], [26.0, 27.38]], "keep_status": [true, false], "silence_prob": [33.18, 0.0], "audiomae_on_audioset": [[["music", 55.96], ["throbbing", 4.69], ["fly, housefly", 4.31]], null], "duration": [13.11, 1.38]} \ No newline at end of file diff --git a/annotations_filtered/crB4KD3p8HU_filtered.json b/annotations_filtered/crB4KD3p8HU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ce7cfa96bd3928465da6389aa612c13dabd78d9 --- /dev/null +++ b/annotations_filtered/crB4KD3p8HU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[67.0, 93.77], [94.0, 98.24], [99.0, 101.36], [105.0, 106.42], [108.0, 110.89]], "keep_status": [false, false, false, false, false], "silence_prob": [37.46, 87.37, 73.06, 0.0, 89.19], "audiomae_on_audioset": [[["music", 66.66], ["speech", 5.57], ["ambient music", 5.4]], null, null, null, null], "duration": [26.77, 4.24, 2.36, 1.42, 2.89]} \ No newline at end of file diff --git a/annotations_filtered/crBqPflvzyQ_filtered.json b/annotations_filtered/crBqPflvzyQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0b92154bc53afdda4a74a75fa2a902be016dad4 --- /dev/null +++ b/annotations_filtered/crBqPflvzyQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 20.43], [21.0, 22.49], [24.0, 24.58], [27.0, 27.78], [31.0, 32.04], [38.0, 38.99], [46.0, 46.04], [48.0, 48.95], [56.0, 56.54], [57.0, 58.53], [62.0, 62.72], [64.0, 102.44], [104.0, 105.21], [107.0, 112.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 27.59], ["speech", 19.28], ["explosion", 8.92]]], "duration": [2.43, 1.49, 0.58, 0.78, 1.04, 0.99, 0.04, 0.95, 0.54, 1.53, 0.72, 38.44, 1.21, 5.77]} \ No newline at end of file diff --git a/annotations_filtered/crI67brUX84_filtered.json b/annotations_filtered/crI67brUX84_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f2d975f311da7e68e19a93fff189adb9079b725 --- /dev/null +++ b/annotations_filtered/crI67brUX84_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.02], [17.0, 16.65], [19.0, 19.99], [21.0, 22.62], [23.0, 24.07], [26.0, 30.81], [32.0, 38.37], [39.0, 39.85], [41.0, 42.28], [43.0, 44.39], [49.0, 49.22], [51.0, 54.16], [60.0, 61.65], [63.0, 63.44], [69.0, 72.03], [78.0, 78.88], [83.0, 84.86], [86.0, 86.7], [92.0, 93.24], [94.0, 95.37], [99.0, 99.47], [112.0, 122.52], [124.0, 124.95], [127.0, 127.57], [129.0, 130.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.96, 0.0, 0.0, 0.0, 0.0, 82.25, 99.95, 0.0, 0.0, 0.0, 0.0, 89.36, 0.0, 0.0, 38.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.98, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 47.1], ["speech", 22.9], ["sine wave", 4.84]], null, null, null, null, null, null, null, null, null, null], "duration": [2.02, -0.35, 0.99, 1.62, 1.07, 4.81, 6.37, 0.85, 1.28, 1.39, 0.22, 3.16, 1.65, 0.44, 3.03, 0.88, 1.86, 0.7, 1.24, 1.37, 0.47, 10.52, 0.95, 0.57, 1.74]} \ No newline at end of file diff --git a/annotations_filtered/crIlIvBYMoc_filtered.json b/annotations_filtered/crIlIvBYMoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8df0f910252e8794b410d773e987a9a80ad1d0a --- /dev/null +++ b/annotations_filtered/crIlIvBYMoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 41.15], [42.0, 50.67], [58.0, 60.71], [62.0, 65.23], [68.0, 71.83], [75.0, 77.09], [80.0, 81.65], [82.0, 87.62], [89.0, 102.32], [104.0, 107.82], [110.0, 111.84], [113.0, 114.34], [115.0, 116.51], [118.0, 119.99], [126.0, 128.34]], "keep_status": [false, false, true, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 66.76, 38.16, 32.94, 28.37, 49.5, 0.0, 76.04, 98.93, 98.86, 0.0, 0.0, 0.0, 0.0, 97.33], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 40.89], ["moo", 17.98], ["speech", 11.03]], [["whale vocalization", 58.56], ["cattle, bovinae", 13.55], ["livestock, farm animals, working animals", 13.14]], [["music", 9.23], ["boom", 8.84], ["whack, thwack", 8.07]], [["speech", 21.14], ["animal", 6.05], ["smash, crash", 5.76]], null, null, null, null, null, null, null, null, null], "duration": [31.15, 8.67, 2.71, 3.23, 3.83, 2.09, 1.65, 5.62, 13.32, 3.82, 1.84, 1.34, 1.51, 1.99, 2.34]} \ No newline at end of file diff --git a/annotations_filtered/crKAy2dGX_8_filtered.json b/annotations_filtered/crKAy2dGX_8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..131346fac4cbc596382542a86e2d64c2b02e03ee --- /dev/null +++ b/annotations_filtered/crKAy2dGX_8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 23.82]], "keep_status": [false], "silence_prob": [56.33], "audiomae_on_audioset": [null], "duration": [3.82]} \ No newline at end of file diff --git a/annotations_filtered/crPJvv2Y3hk_filtered.json b/annotations_filtered/crPJvv2Y3hk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e2ccc5e51b4d08d3702d4d75e971856cfdcf322 --- /dev/null +++ b/annotations_filtered/crPJvv2Y3hk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.45], [12.0, 13.78], [18.0, 18.86], [20.0, 57.82], [58.0, 57.94], [58.0, 58.5], [60.0, 60.54], [62.0, 106.41]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.45, 1.78, 0.86, 37.82, -0.06, 0.5, 0.54, 44.41]} \ No newline at end of file diff --git a/annotations_filtered/crZXwRmMq2k_filtered.json b/annotations_filtered/crZXwRmMq2k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2557330a4daabdc38765148814cf05fa8233909a --- /dev/null +++ b/annotations_filtered/crZXwRmMq2k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.76], [5.0, 5.64], [7.0, 7.38], [8.0, 7.97], [10.0, 11.21], [14.0, 18.49], [23.0, 23.62], [26.0, 43.11], [44.0, 66.55], [71.0, 114.54], [116.0, 118.23]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 98.01, 0.0, 30.83, 29.69, 0.0, 93.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["mains hum", 26.08], ["hum", 20.63], ["music", 16.04]], [["hum", 54.97], ["mains hum", 28.23], ["speech", 6.67]], null, null], "duration": [0.76, 0.64, 0.38, -0.03, 1.21, 4.49, 0.62, 17.11, 22.55, 43.54, 2.23]} \ No newline at end of file diff --git a/annotations_filtered/cs7CW6xDbL8_filtered.json b/annotations_filtered/cs7CW6xDbL8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aad0dfff6d72102ea2e2485416b4bf7ba7044670 --- /dev/null +++ b/annotations_filtered/cs7CW6xDbL8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 30.65], [33.0, 33.42], [34.0, 47.73], [53.0, 70.95]], "keep_status": [false, false, true, true], "silence_prob": [29.87, 0.0, 30.43, 30.01], "audiomae_on_audioset": [[["music", 50.08], ["throbbing", 16.96], ["hum", 10.39]], null, [["hum", 28.24], ["mains hum", 21.7], ["music", 16.68]], [["music", 31.67], ["hum", 14.32], ["mains hum", 10.06]]], "duration": [14.65, 0.42, 13.73, 17.95]} \ No newline at end of file diff --git a/annotations_filtered/cslI2draO_E_filtered.json b/annotations_filtered/cslI2draO_E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac34ced775d104c71f794e3351032d4a0862d9f7 --- /dev/null +++ b/annotations_filtered/cslI2draO_E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.79], [18.0, 22.15], [26.0, 26.13], [30.0, 30.81], [38.0, 38.57], [43.0, 44.83], [46.0, 46.8], [48.0, 53.49], [54.0, 55.78], [57.0, 58.16], [61.0, 61.77], [62.0, 63.69], [66.0, 71.04], [73.0, 74.09], [77.0, 79.03], [80.0, 81.14], [82.0, 83.25], [84.0, 85.29], [89.0, 90.24], [91.0, 92.58], [98.0, 103.13], [105.0, 110.22], [118.0, 120.11], [126.0, 141.76]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, true, true, false, true], "silence_prob": [0.0, 31.4, 0.0, 0.0, 0.0, 0.0, 0.0, 43.13, 0.0, 0.0, 0.0, 0.0, 49.59, 0.0, 46.29, 0.0, 0.0, 0.0, 0.0, 0.0, 31.8, 29.58, 35.81, 29.3], "audiomae_on_audioset": [null, [["noise", 27.71], ["music", 24.07], ["whale vocalization", 6.68]], null, null, null, null, null, [["hum", 24.71], ["speech", 21.12], ["music", 9.45]], null, null, null, null, [["music", 56.48], ["hum", 8.21], ["whale vocalization", 4.9]], null, [["hoot", 37.59], ["owl", 36.17], ["music", 8.97]], null, null, null, null, null, [["hum", 25.67], ["music", 15.11], ["throbbing", 7.79]], [["groan", 17.17], ["music", 15.6], ["livestock, farm animals, working animals", 11.41]], [["sidetone", 70.65], ["music", 10.63], ["speech", 3.29]], [["music", 33.1], ["explosion", 7.32], ["speech", 7.28]]], "duration": [1.79, 4.15, 0.13, 0.81, 0.57, 1.83, 0.8, 5.49, 1.78, 1.16, 0.77, 1.69, 5.04, 1.09, 2.03, 1.14, 1.25, 1.29, 1.24, 1.58, 5.13, 5.22, 2.11, 15.76]} \ No newline at end of file diff --git a/annotations_filtered/ct-PElgfWJY_filtered.json b/annotations_filtered/ct-PElgfWJY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d63cfea125825d9d89a2e554463d3c3b933b20a1 --- /dev/null +++ b/annotations_filtered/ct-PElgfWJY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 21.09], [23.0, 47.8], [50.0, 65.85], [72.0, 78.49], [82.0, 88.26], [90.0, 92.13], [94.0, 132.83], [133.0, 146.42], [147.0, 148.39], [150.0, 154.67], [157.0, 158.63], [161.0, 174.5], [175.0, 177.25]], "keep_status": [false, true, false, false, true, true, false, true, false, true, false, true, true], "silence_prob": [94.95, 31.18, 30.0, 30.36, 36.71, 40.24, 0.0, 31.02, 0.0, 31.61, 0.0, 29.23, 29.57], "audiomae_on_audioset": [null, [["music", 42.18], ["speech", 9.75], ["hum", 4.52]], [["speech", 68.19], ["music", 4.45], ["hum", 4.16]], [["music", 54.24], ["cacophony", 14.86], ["hum", 4.42]], [["music", 23.78], ["speech", 17.66], ["cacophony", 9.03]], [["music", 49.34], ["synthesizer", 12.17], ["busy signal", 6.83]], null, [["music", 31.2], ["rumble", 10.57], ["noise", 8.51]], null, [["speech", 16.31], ["music", 16.02], ["explosion", 7.4]], null, [["speech", 41.08], ["music", 9.54], ["buzz", 6.0]], [["vehicle", 31.23], ["car", 18.8], ["race car, auto racing", 11.94]]], "duration": [13.09, 24.8, 15.85, 6.49, 6.26, 2.13, 38.83, 13.42, 1.39, 4.67, 1.63, 13.5, 2.25]} \ No newline at end of file diff --git a/annotations_filtered/ct7Ox_OKe-s_filtered.json b/annotations_filtered/ct7Ox_OKe-s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51d04de79b8fb7213aa31df6fb7b7d8bf3a7ac54 --- /dev/null +++ b/annotations_filtered/ct7Ox_OKe-s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 31.31], [32.0, 52.98], [55.0, 55.51], [59.0, 63.88], [69.0, 69.16], [70.0, 78.51], [80.0, 80.05], [81.0, 81.46], [83.0, 90.42], [91.0, 91.96], [93.0, 93.82], [95.0, 95.15], [97.0, 98.56], [101.0, 101.56], [103.0, 119.89]], "keep_status": [true, true, false, true, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [32.06, 32.69, 0.0, 33.42, 0.0, 33.16, 0.0, 0.0, 31.41, 0.0, 0.0, 0.0, 0.0, 0.0, 31.87], "audiomae_on_audioset": [[["shofar", 34.74], ["theremin", 11.34], ["music", 11.1]], [["music", 30.12], ["brass instrument", 15.65], ["saxophone", 11.12]], null, [["music", 21.07], ["foghorn", 9.37], ["trombone", 7.6]], null, [["music", 36.45], ["insect", 10.86], ["wind instrument, woodwind instrument", 6.27]], null, null, [["music", 45.59], ["wind instrument, woodwind instrument", 11.17], ["musical instrument", 8.17]], null, null, null, null, null, [["music", 33.63], ["theremin", 24.09], ["brass instrument", 15.33]]], "duration": [8.31, 20.98, 0.51, 4.88, 0.16, 8.51, 0.05, 0.46, 7.42, 0.96, 0.82, 0.15, 1.56, 0.56, 16.89]} \ No newline at end of file diff --git a/annotations_filtered/ctTSLWXE58o_filtered.json b/annotations_filtered/ctTSLWXE58o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96c1037ce98dabe932041761ade346d94d1f56cc --- /dev/null +++ b/annotations_filtered/ctTSLWXE58o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.05], [23.0, 23.95], [35.0, 36.37], [37.0, 37.81], [42.0, 42.25], [46.0, 47.07], [51.0, 55.24], [56.0, 56.17], [60.0, 61.4], [62.0, 63.98], [65.0, 66.58], [71.0, 72.62], [74.0, 75.29], [78.0, 78.6], [79.0, 85.35], [86.0, 95.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.95, 32.35], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 62.84], ["rumble", 7.36], ["sidetone", 5.7]]], "duration": [0.05, 0.95, 1.37, 0.81, 0.25, 1.07, 4.24, 0.17, 1.4, 1.98, 1.58, 1.62, 1.29, 0.6, 6.35, 9.08]} \ No newline at end of file diff --git a/annotations_filtered/ctd3NPx1pdM_filtered.json b/annotations_filtered/ctd3NPx1pdM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40c20cede90a8862f71d43c49a3aa7c805311d3c --- /dev/null +++ b/annotations_filtered/ctd3NPx1pdM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.3], [4.0, 4.41], [5.0, 7.26], [9.0, 17.07], [19.0, 18.81], [20.0, 20.44], [21.0, 21.22], [21.0, 29.08], [30.0, 30.4], [32.0, 34.55], [35.0, 36.9], [38.0, 39.33], [40.0, 41.35], [42.0, 45.91], [50.0, 50.77], [53.0, 56.25], [59.0, 59.48], [61.0, 62.5], [65.0, 66.38], [67.0, 69.75], [74.0, 74.56], [77.0, 77.41], [79.0, 78.81], [82.0, 82.58], [84.0, 84.96], [89.0, 89.43], [92.0, 92.15], [93.0, 97.53], [98.0, 99.47], [101.0, 102.37], [113.0, 113.02], [114.0, 117.98], [120.0, 120.41], [123.0, 123.9], [126.0, 126.72], [136.0, 137.64], [139.0, 139.92], [143.0, 144.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 84.98, 58.38, 0.0, 0.0, 0.0, 62.89, 0.0, 91.98, 0.0, 0.0, 0.0, 67.51, 0.0, 99.88, 0.0, 0.0, 0.0, 34.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.44, 0.0, 0.0, 0.0, 91.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 48.72], ["telephone", 17.84], ["busy signal", 6.79]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.3, 0.41, 2.26, 8.07, -0.19, 0.44, 0.22, 8.08, 0.4, 2.55, 1.9, 1.33, 1.35, 3.91, 0.77, 3.25, 0.48, 1.5, 1.38, 2.75, 0.56, 0.41, -0.19, 0.58, 0.96, 0.43, 0.15, 4.53, 1.47, 1.37, 0.02, 3.98, 0.41, 0.9, 0.72, 1.64, 0.92, 1.58]} \ No newline at end of file diff --git a/annotations_filtered/ctjucF9fiFw_filtered.json b/annotations_filtered/ctjucF9fiFw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d69b2e51d9e865911c4470c579c78a98b23f931d --- /dev/null +++ b/annotations_filtered/ctjucF9fiFw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 25.35], [26.0, 26.64], [27.0, 27.94], [36.0, 37.42], [39.0, 41.28], [46.0, 50.53], [59.0, 62.34], [67.0, 72.08], [75.0, 77.79], [80.0, 83.15], [84.0, 84.97], [85.0, 86.61], [94.0, 93.9], [96.0, 100.92]], "keep_status": [true, false, false, false, false, false, true, false, true, false, false, false, false, true], "silence_prob": [36.24, 0.0, 0.0, 0.0, 41.34, 29.62, 36.76, 70.3, 33.7, 41.6, 0.0, 0.0, 0.0, 30.62], "audiomae_on_audioset": [[["music", 40.59], ["hum", 19.49], ["throbbing", 5.56]], null, null, null, [["music", 65.69], ["speech", 16.8], ["electronic music", 2.27]], [["music", 32.2], ["hum", 23.85], ["mains hum", 15.43]], [["throbbing", 39.22], ["hum", 22.28], ["music", 8.47]], null, [["music", 37.96], ["glass", 16.01], ["breaking", 11.16]], [["music", 63.97], ["musical instrument", 6.53], ["didgeridoo", 5.51]], null, null, null, [["music", 53.29], ["boing", 7.55], ["sound effect", 5.08]]], "duration": [10.35, 0.64, 0.94, 1.42, 2.28, 4.53, 3.34, 5.08, 2.79, 3.15, 0.97, 1.61, -0.1, 4.92]} \ No newline at end of file diff --git a/annotations_filtered/ctrJ0-TLUHQ_filtered.json b/annotations_filtered/ctrJ0-TLUHQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0911c472cef8d9d7e0f50c52518f05df5294411f --- /dev/null +++ b/annotations_filtered/ctrJ0-TLUHQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.44], [7.0, 8.07], [12.0, 13.27], [18.0, 18.23], [26.0, 27.5], [29.0, 29.84], [32.0, 33.74], [39.0, 39.29], [43.0, 43.8], [45.0, 47.75], [56.0, 56.46], [57.0, 57.45], [58.0, 58.92], [80.0, 80.92], [86.0, 86.59], [102.0, 103.72], [109.0, 113.14], [114.0, 125.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.23, 43.43], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 26.13], ["insect", 17.69], ["whale vocalization", 6.67]]], "duration": [0.44, 1.07, 1.27, 0.23, 1.5, 0.84, 1.74, 0.29, 0.8, 2.75, 0.46, 0.45, 0.92, 0.92, 0.59, 1.72, 4.14, 11.34]} \ No newline at end of file diff --git a/annotations_filtered/ctyDL-6f90w_filtered.json b/annotations_filtered/ctyDL-6f90w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c0ab9dff1504c4599949883666769c9c3fab328b --- /dev/null +++ b/annotations_filtered/ctyDL-6f90w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 29.47], [40.0, 41.18], [43.0, 46.92], [49.0, 49.71], [55.0, 83.52], [100.0, 100.21], [113.0, 131.18], [132.0, 132.61]], "keep_status": [true, false, true, false, true, false, false, false], "silence_prob": [39.15, 0.0, 33.71, 0.0, 32.5, 0.0, 36.67, 0.0], "audiomae_on_audioset": [[["hum", 19.83], ["mains hum", 6.0], ["livestock, farm animals, working animals", 5.88]], null, [["speech", 33.02], ["explosion", 19.94], ["burst, pop", 5.9]], null, [["buzz", 17.89], ["explosion", 7.87], ["cacophony", 5.89]], null, [["whale vocalization", 53.2], ["hum", 14.78], ["mains hum", 9.19]], null], "duration": [4.47, 1.18, 3.92, 0.71, 28.52, 0.21, 18.18, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/cuK7JbG06ho_filtered.json b/annotations_filtered/cuK7JbG06ho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3274e68f2c76df32baff5920251291181000eeab --- /dev/null +++ b/annotations_filtered/cuK7JbG06ho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.26], [21.0, 22.2], [24.0, 24.11], [26.0, 30.16], [31.0, 32.36], [35.0, 35.95], [44.0, 43.85], [48.0, 53.91], [55.0, 55.48], [57.0, 57.52], [60.0, 60.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [57.48, 0.0, 0.0, 83.16, 0.0, 0.0, 0.0, 88.64, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [2.26, 1.2, 0.11, 4.16, 1.36, 0.95, -0.15, 5.91, 0.48, 0.52, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/cu_A-aG8G7U_filtered.json b/annotations_filtered/cu_A-aG8G7U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae1e9c0042343752a2fd19f5c737ffb92e46c754 --- /dev/null +++ b/annotations_filtered/cu_A-aG8G7U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.63], [13.0, 15.7], [21.0, 22.54], [27.0, 26.96], [28.0, 28.16], [36.0, 43.82], [57.0, 57.81], [59.0, 59.68], [73.0, 73.4], [82.0, 89.14], [91.0, 91.12], [91.0, 94.36], [100.0, 105.8], [110.0, 122.03], [123.0, 123.42], [125.0, 125.58], [129.0, 143.72], [149.0, 149.76], [151.0, 156.24], [157.0, 157.77], [159.0, 170.78], [172.0, 173.16], [174.0, 178.82]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 43.08, 0.0, 0.0, 0.0, 45.02, 0.0, 0.0, 0.0, 30.66, 0.0, 34.5, 31.2, 37.86, 0.0, 0.0, 41.07, 0.0, 38.97, 0.0, 46.4, 0.0, 57.64], "audiomae_on_audioset": [null, [["speech", 62.22], ["radio", 10.59], ["sidetone", 8.63]], null, null, null, [["fly, housefly", 55.02], ["insect", 17.98], ["bee, wasp, etc.", 7.78]], null, null, null, [["speech", 17.02], ["livestock, farm animals, working animals", 15.05], ["cattle, bovinae", 10.0]], null, [["sidetone", 34.92], ["music", 27.44], ["speech", 10.25]], [["music", 41.72], ["didgeridoo", 26.15], ["speech", 10.14]], [["didgeridoo", 26.57], ["fly, housefly", 19.26], ["music", 13.78]], null, null, [["music", 70.61], ["didgeridoo", 5.77], ["musical instrument", 5.29]], null, [["music", 60.09], ["sidetone", 7.9], ["musical instrument", 6.54]], null, [["music", 60.03], ["speech", 8.76], ["sidetone", 3.85]], null, null], "duration": [0.63, 2.7, 1.54, -0.04, 0.16, 7.82, 0.81, 0.68, 0.4, 7.14, 0.12, 3.36, 5.8, 12.03, 0.42, 0.58, 14.72, 0.76, 5.24, 0.77, 11.78, 1.16, 4.82]} \ No newline at end of file diff --git a/annotations_filtered/cudAGo1nSKI_filtered.json b/annotations_filtered/cudAGo1nSKI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af8396df71389487f37867e1ba57a6a0c48c3d73 --- /dev/null +++ b/annotations_filtered/cudAGo1nSKI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.67], [5.0, 7.06], [8.0, 12.88], [14.0, 23.79], [24.0, 25.29], [26.0, 47.53]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 99.87, 100.0, 99.73, 0.0, 99.93], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [1.67, 2.06, 4.88, 9.79, 1.29, 21.53]} \ No newline at end of file diff --git a/annotations_filtered/cv62uysSvQE_filtered.json b/annotations_filtered/cv62uysSvQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d6edf3ac8881b81d92914ff6342c54376962351 --- /dev/null +++ b/annotations_filtered/cv62uysSvQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.16], [26.0, 28.65], [31.0, 31.35], [33.0, 33.34], [39.0, 39.56], [41.0, 42.84], [43.0, 42.87], [43.0, 43.44], [43.0, 43.48], [43.0, 43.66], [44.0, 51.49], [54.0, 55.0], [64.0, 95.1], [96.0, 96.74], [97.0, 102.14]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.34, 30.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.13, 0.0, 0.0, 0.0, 65.55], "audiomae_on_audioset": [[["music", 70.06], ["theremin", 3.73], ["radio", 3.54]], [["eruption", 18.34], ["explosion", 17.5], ["music", 15.51]], null, null, null, null, null, null, null, null, [["music", 71.5], ["musical instrument", 5.73], ["marimba, xylophone", 2.27]], null, null, null, null], "duration": [2.16, 2.65, 0.35, 0.34, 0.56, 1.84, -0.13, 0.44, 0.48, 0.66, 7.49, 1.0, 31.1, 0.74, 5.14]} \ No newline at end of file diff --git a/annotations_filtered/cv7_7dSbaOk_filtered.json b/annotations_filtered/cv7_7dSbaOk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d83f95bc9a64af57c1f2760c0212963569add7d5 --- /dev/null +++ b/annotations_filtered/cv7_7dSbaOk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.01], [16.0, 22.2], [27.0, 34.6], [37.0, 42.74], [43.0, 43.44], [43.0, 50.63], [53.0, 69.18], [71.0, 73.53], [75.0, 78.09], [83.0, 94.86], [100.0, 101.21], [103.0, 120.07], [122.0, 122.86]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [54.1, 69.88, 68.28, 59.33, 0.0, 34.55, 31.99, 38.52, 33.37, 34.93, 0.0, 52.16, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 70.93], ["hum", 8.29], ["electronic music", 2.84]], [["fly, housefly", 40.37], ["mosquito", 40.36], ["insect", 15.44]], [["whale vocalization", 17.27], ["music", 14.81], ["hum", 13.54]], [["music", 42.76], ["hum", 7.41], ["theremin", 4.68]], [["music", 68.57], ["hoot", 4.14], ["theremin", 2.83]], null, null, null], "duration": [2.01, 6.2, 7.6, 5.74, 0.44, 7.63, 16.18, 2.53, 3.09, 11.86, 1.21, 17.07, 0.86]} \ No newline at end of file diff --git a/annotations_filtered/cv8yjJQg4Nc_filtered.json b/annotations_filtered/cv8yjJQg4Nc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3af38033af164bf371d0687a15eccb20c45d3de --- /dev/null +++ b/annotations_filtered/cv8yjJQg4Nc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.04], [4.0, 3.55], [7.0, 8.19], [12.0, 13.05], [14.0, 14.99], [17.0, 17.24], [20.0, 20.88], [23.0, 24.48], [26.0, 28.11], [49.0, 49.1], [53.0, 53.74], [55.0, 55.43], [61.0, 61.45], [76.0, 78.11]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.91, 0.0, 0.0, 0.0, 0.0, 58.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["echo", 49.91], ["effects unit", 9.28], ["reverberation", 7.12]], null, null, null, null, null], "duration": [0.04, -0.45, 1.19, 1.05, 0.99, 0.24, 0.88, 1.48, 2.11, 0.1, 0.74, 0.43, 0.45, 2.11]} \ No newline at end of file diff --git a/annotations_filtered/cvEJy_9hy4o_filtered.json b/annotations_filtered/cvEJy_9hy4o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7e93141788944df303edb354e62db70cc5b50de --- /dev/null +++ b/annotations_filtered/cvEJy_9hy4o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.78], [8.0, 8.61], [10.0, 10.99], [12.0, 12.85], [14.0, 15.28], [17.0, 17.96], [19.0, 20.56], [22.0, 24.97], [27.0, 28.12], [43.0, 43.77], [48.0, 49.35], [53.0, 53.08], [55.0, 56.32], [63.0, 63.64], [68.0, 69.16], [70.0, 70.95], [84.0, 85.19], [92.0, 92.52], [94.0, 95.81], [99.0, 98.98], [101.0, 106.41], [107.0, 109.73], [111.0, 112.08], [113.0, 115.35], [116.0, 119.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.31, 71.29, 0.0, 86.45, 66.27], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.78, 0.61, 0.99, 0.85, 1.28, 0.96, 1.56, 2.97, 1.12, 0.77, 1.35, 0.08, 1.32, 0.64, 1.16, 0.95, 1.19, 0.52, 1.81, -0.02, 5.41, 2.73, 1.08, 2.35, 3.45]} \ No newline at end of file diff --git a/annotations_filtered/cvNjYmDiV0Y_filtered.json b/annotations_filtered/cvNjYmDiV0Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92f0d30165524eb512a523afffa08b213e2a3242 --- /dev/null +++ b/annotations_filtered/cvNjYmDiV0Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.08], [10.0, 12.83], [15.0, 15.58], [17.0, 19.38], [21.0, 23.36], [28.0, 28.41], [32.0, 32.58], [35.0, 36.51], [38.0, 39.5], [40.0, 80.35], [81.0, 84.6], [85.0, 107.05], [107.0, 115.53], [116.0, 115.62], [116.0, 116.01], [121.0, 124.16], [125.0, 139.63], [146.0, 147.19], [148.0, 149.03], [150.0, 150.18], [150.0, 150.85], [160.0, 160.62], [165.0, 166.68], [167.0, 168.15], [170.0, 170.92], [173.0, 175.17], [176.0, 179.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 56.03, 0.0, 67.63, 50.56, 0.0, 0.0, 0.0, 0.0, 0.0, 36.23, 40.12, 31.11, 0.0, 0.0, 32.26, 31.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.56, 75.72], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["thunk", 46.54], ["music", 30.27], ["knock", 5.25]], [["music", 37.25], ["fly, housefly", 10.98], ["effects unit", 7.18]], [["whack, thwack", 21.6], ["gong", 11.37], ["breaking", 10.31]], null, null, [["cattle, bovinae", 33.31], ["moo", 26.76], ["livestock, farm animals, working animals", 16.6]], [["animal", 20.66], ["cattle, bovinae", 17.34], ["moo", 9.14]], null, null, null, null, null, null, null, null, null, null], "duration": [1.08, 2.83, 0.58, 2.38, 2.36, 0.41, 0.58, 1.51, 1.5, 40.35, 3.6, 22.05, 8.53, -0.38, 0.01, 3.16, 14.63, 1.19, 1.03, 0.18, 0.85, 0.62, 1.68, 1.15, 0.92, 2.17, 3.19]} \ No newline at end of file diff --git a/annotations_filtered/cvPIBkkwvD4_filtered.json b/annotations_filtered/cvPIBkkwvD4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eac1c6fd437b5e1139b1345fa1f72959c449831c --- /dev/null +++ b/annotations_filtered/cvPIBkkwvD4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.47], [12.0, 13.07], [18.0, 20.04], [21.0, 21.74], [22.0, 22.71], [23.0, 30.74], [33.0, 33.3], [39.0, 41.55], [43.0, 52.54], [53.0, 54.19], [63.0, 70.85], [74.0, 81.45]], "keep_status": [false, false, true, false, false, true, false, false, true, false, false, false], "silence_prob": [29.83, 0.0, 38.16, 0.0, 0.0, 38.51, 0.0, 63.53, 38.14, 0.0, 35.84, 34.73], "audiomae_on_audioset": [[["explosion", 38.59], ["speech", 26.31], ["music", 10.14]], null, [["music", 22.76], ["speech", 14.56], ["sheep", 7.12]], null, null, [["whale vocalization", 30.33], ["buzz", 11.84], ["hum", 11.35]], null, null, [["music", 21.05], ["whale vocalization", 9.46], ["explosion", 5.63]], null, [["speech", 61.55], ["whale vocalization", 15.92], ["music", 10.94]], [["music", 67.07], ["speech", 19.91], ["musical instrument", 3.62]]], "duration": [3.47, 1.07, 2.04, 0.74, 0.71, 7.74, 0.3, 2.55, 9.54, 1.19, 7.85, 7.45]} \ No newline at end of file diff --git a/annotations_filtered/cvakyq_EaWY_filtered.json b/annotations_filtered/cvakyq_EaWY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..104d27ce75d23b3630b856cb5089cd41c5647649 --- /dev/null +++ b/annotations_filtered/cvakyq_EaWY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.6], [4.0, 5.98], [9.0, 9.53], [12.0, 12.87], [14.0, 14.62], [15.0, 16.09], [33.0, 33.54], [34.0, 35.45], [54.0, 55.05], [64.0, 66.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.6, 1.98, 0.53, 0.87, 0.62, 1.09, 0.54, 1.45, 1.05, 2.01]} \ No newline at end of file diff --git a/annotations_filtered/cvmcGY_VwvU_filtered.json b/annotations_filtered/cvmcGY_VwvU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c6aaaaf5bde74411179738360912444279d9967 --- /dev/null +++ b/annotations_filtered/cvmcGY_VwvU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 36.39], [38.0, 44.81], [54.0, 54.63], [56.0, 57.16], [61.0, 61.72], [62.0, 62.88], [66.0, 67.12], [70.0, 70.02], [71.0, 71.31], [76.0, 79.42], [79.0, 79.46], [81.0, 81.01], [82.0, 82.02], [85.0, 85.65], [88.0, 88.32], [89.0, 89.87], [93.0, 93.73], [104.0, 104.16], [105.0, 106.08], [106.0, 106.88], [111.0, 112.41], [115.0, 116.02], [121.0, 121.61]], "keep_status": [true, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.84, 37.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 28.16], ["speech", 16.41], ["echo", 9.62]], [["speech", 40.84], ["hum", 14.77], ["radio", 12.85]], null, null, null, null, null, null, null, [["music", 52.88], ["musical instrument", 7.9], ["effects unit", 5.53]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [14.39, 6.81, 0.63, 1.16, 0.72, 0.88, 1.12, 0.02, 0.31, 3.42, 0.46, 0.01, 0.02, 0.65, 0.32, 0.87, 0.73, 0.16, 1.08, 0.88, 1.41, 1.02, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/cvy2tRH7HNE_filtered.json b/annotations_filtered/cvy2tRH7HNE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cb5613462af78f993763be4b24186e942efc91b --- /dev/null +++ b/annotations_filtered/cvy2tRH7HNE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 30.45], [31.0, 30.57], [31.0, 31.45], [32.0, 40.86], [42.0, 81.21]], "keep_status": [false, false, false, true, false], "silence_prob": [30.73, 0.0, 0.0, 32.69, 0.0], "audiomae_on_audioset": [[["music", 80.06], ["synthesizer", 1.94], ["scary music", 1.94]], null, null, [["music", 56.61], ["musical instrument", 5.54], ["brass instrument", 3.98]], null], "duration": [10.45, -0.43, 0.45, 8.86, 39.21]} \ No newline at end of file diff --git a/annotations_filtered/cw1dB9PxWzM_filtered.json b/annotations_filtered/cw1dB9PxWzM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a09c19e4a05e308583dee639cd44cecad87a1b80 --- /dev/null +++ b/annotations_filtered/cw1dB9PxWzM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.08], [18.0, 19.55], [21.0, 21.74], [27.0, 29.88], [33.0, 35.16], [42.0, 42.28], [43.0, 43.92], [44.0, 46.23], [47.0, 46.85], [47.0, 50.75], [53.0, 54.3], [57.0, 57.72], [59.0, 59.26], [62.0, 64.15], [66.0, 67.53], [68.0, 69.26], [70.0, 71.0], [72.0, 74.85], [94.0, 94.71], [95.0, 96.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.8, 0.0, 0.0, 92.64, 89.72, 0.0, 0.0, 67.38, 0.0, 72.01, 0.0, 0.0, 0.0, 80.82, 0.0, 0.0, 0.0, 79.07, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.08, 1.55, 0.74, 2.88, 2.16, 0.28, 0.92, 2.23, -0.15, 3.75, 1.3, 0.72, 0.26, 2.15, 1.53, 1.26, 1.0, 2.85, 0.71, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/cwJFMjOz_l0_filtered.json b/annotations_filtered/cwJFMjOz_l0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01fd0de5dc5824731c374ddb9ab41ab368fc1012 --- /dev/null +++ b/annotations_filtered/cwJFMjOz_l0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.36], [8.0, 7.79], [8.0, 17.64], [19.0, 21.3], [22.0, 25.52], [26.0, 26.62], [29.0, 29.74], [34.0, 36.14], [37.0, 37.56], [43.0, 43.66], [45.0, 53.15], [54.0, 56.57], [59.0, 60.74], [62.0, 62.95], [64.0, 63.88], [65.0, 65.85], [69.0, 70.66], [72.0, 72.49], [75.0, 75.34], [77.0, 78.29], [79.0, 79.59], [81.0, 81.62], [83.0, 83.56], [85.0, 90.1], [90.0, 92.25], [95.0, 103.69], [105.0, 105.29], [107.0, 109.19], [111.0, 111.82], [113.0, 126.05]], "keep_status": [false, false, false, true, false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, true], "silence_prob": [0.0, 0.0, 34.7, 35.39, 35.03, 0.0, 0.0, 34.6, 0.0, 0.0, 34.01, 34.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.59, 33.07, 32.58, 0.0, 32.8, 0.0, 33.11], "audiomae_on_audioset": [null, null, [["hum", 36.39], ["speech", 21.4], ["mains hum", 19.04]], [["hum", 26.86], ["speech", 9.12], ["mains hum", 8.95]], [["speech", 69.67], ["music", 6.02], ["whale vocalization", 2.95]], null, null, [["music", 38.78], ["speech", 15.75], ["didgeridoo", 7.57]], null, null, [["music", 29.11], ["speech", 20.82], ["hum", 12.28]], [["speech", 21.19], ["rumble", 13.21], ["music", 10.38]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.88], ["music", 16.16], ["hum", 6.55]], [["speech", 29.82], ["hum", 20.21], ["music", 11.35]], [["speech", 39.2], ["music", 37.69], ["hum", 4.85]], null, [["thunk", 18.59], ["fly, housefly", 17.37], ["music", 14.36]], null, [["hum", 22.56], ["speech", 22.35], ["music", 17.91]]], "duration": [1.36, -0.21, 9.64, 2.3, 3.52, 0.62, 0.74, 2.14, 0.56, 0.66, 8.15, 2.57, 1.74, 0.95, -0.12, 0.85, 1.66, 0.49, 0.34, 1.29, 0.59, 0.62, 0.56, 5.1, 2.25, 8.69, 0.29, 2.19, 0.82, 13.05]} \ No newline at end of file diff --git a/annotations_filtered/cwOh20xN82E_filtered.json b/annotations_filtered/cwOh20xN82E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e3e201d29b0cb2e5803c9d82f1d81acd64b572a --- /dev/null +++ b/annotations_filtered/cwOh20xN82E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.35], [12.0, 12.28], [15.0, 15.31], [17.0, 17.07], [18.0, 18.59], [20.0, 21.41], [23.0, 25.14], [26.0, 28.76], [31.0, 31.11], [35.0, 37.79], [39.0, 39.88], [41.0, 42.33], [45.0, 46.57], [48.0, 51.54], [52.0, 54.13], [55.0, 59.14], [70.0, 71.17], [75.0, 75.41], [77.0, 78.07], [89.0, 89.99], [94.0, 95.94], [98.0, 100.74], [102.0, 105.39], [107.0, 108.01], [112.0, 117.69], [119.0, 122.47], [123.0, 127.13], [129.0, 133.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, true, true], "silence_prob": [99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 99.48, 0.0, 93.91, 0.0, 0.0, 0.0, 95.64, 56.48, 48.06, 0.0, 0.0, 0.0, 0.0, 0.0, 35.14, 33.71, 0.0, 34.17, 36.02, 35.24, 34.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.01], ["guitar", 22.42], ["musical instrument", 10.67]], null, null, null, null, null, [["music", 49.46], ["guitar", 13.03], ["musical instrument", 12.0]], [["music", 44.95], ["zither", 12.19], ["singing", 5.06]], null, [["music", 27.67], ["double bass", 21.7], ["cello", 9.52]], [["music", 32.34], ["double bass", 9.33], ["cello", 8.94]], [["music", 53.14], ["guitar", 5.76], ["double bass", 4.47]], [["music", 43.07], ["guitar", 6.69], ["musical instrument", 5.11]]], "duration": [2.35, 0.28, 0.31, 0.07, 0.59, 1.41, 2.14, 2.76, 0.11, 2.79, 0.88, 1.33, 1.57, 3.54, 2.13, 4.14, 1.17, 0.41, 1.07, 0.99, 1.94, 2.74, 3.39, 1.01, 5.69, 3.47, 4.13, 4.1]} \ No newline at end of file diff --git a/annotations_filtered/cwgaR1xDiyE_filtered.json b/annotations_filtered/cwgaR1xDiyE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02d224142c759d2e6956d58472d8984b46f20511 --- /dev/null +++ b/annotations_filtered/cwgaR1xDiyE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.46], [14.0, 16.85], [18.0, 21.1], [24.0, 38.94], [43.0, 44.98], [47.0, 47.17], [48.0, 90.8], [92.0, 92.77], [93.0, 105.48], [110.0, 111.42], [112.0, 115.13], [119.0, 126.42]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, true], "silence_prob": [62.99, 52.16, 52.1, 41.74, 0.0, 0.0, 0.0, 0.0, 31.25, 0.0, 41.5, 29.55], "audiomae_on_audioset": [null, null, null, [["hum", 47.1], ["mains hum", 17.22], ["throbbing", 10.8]], null, null, null, null, [["music", 59.91], ["hum", 5.0], ["throbbing", 4.14]], null, [["music", 51.01], ["didgeridoo", 6.94], ["livestock, farm animals, working animals", 6.83]], [["speech", 34.02], ["hum", 10.64], ["music", 8.07]]], "duration": [2.46, 2.85, 3.1, 14.94, 1.98, 0.17, 42.8, 0.77, 12.48, 1.42, 3.13, 7.42]} \ No newline at end of file diff --git a/annotations_filtered/cwprGyncs0A_filtered.json b/annotations_filtered/cwprGyncs0A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c93eedf99f8ca7f91155c058c46c5167a72e2ea2 --- /dev/null +++ b/annotations_filtered/cwprGyncs0A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.72], [10.0, 10.94], [15.0, 16.09], [18.0, 19.16], [29.0, 29.4], [32.0, 32.9], [34.0, 35.02], [37.0, 38.37], [39.0, 40.29], [42.0, 45.27], [50.0, 50.33], [55.0, 58.7], [60.0, 62.02], [63.0, 74.43], [76.0, 86.78], [90.0, 101.19], [103.0, 103.05], [103.0, 104.03], [108.0, 107.86], [108.0, 108.57], [110.0, 114.93], [115.0, 115.2], [116.0, 116.43], [119.0, 126.99], [129.0, 129.98]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.23, 0.0, 51.28, 99.48, 35.59, 31.62, 32.58, 0.0, 0.0, 0.0, 0.0, 70.02, 0.0, 0.0, 31.74, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 64.04], ["musical instrument", 3.18], ["thunk", 1.98]], null, null, null, [["music", 63.0], ["synthesizer", 9.04], ["musical instrument", 8.41]], [["music", 32.13], ["sound effect", 7.76], ["throbbing", 7.15]], [["music", 41.26], ["speech", 24.91], ["musical instrument", 2.6]], null, null, null, null, null, null, null, [["music", 24.61], ["hum", 24.56], ["throbbing", 13.0]], null], "duration": [1.72, 0.94, 1.09, 1.16, 0.4, 0.9, 1.02, 1.37, 1.29, 3.27, 0.33, 3.7, 2.02, 11.43, 10.78, 11.19, 0.05, 1.03, -0.14, 0.57, 4.93, 0.2, 0.43, 7.99, 0.98]} \ No newline at end of file diff --git a/annotations_filtered/cxQuvLl2E-I_filtered.json b/annotations_filtered/cxQuvLl2E-I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..939af1c2dfc507db6c87e187d33c7e5374383b25 --- /dev/null +++ b/annotations_filtered/cxQuvLl2E-I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.2], [8.0, 9.1], [11.0, 12.58], [14.0, 15.99], [19.0, 21.98], [22.0, 44.22], [46.0, 53.3], [56.0, 59.27], [62.0, 63.07]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 68.28, 36.26, 34.83, 75.88, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["mains hum", 30.79], ["hum", 21.14], ["speech", 20.27]], [["whale vocalization", 74.27], ["didgeridoo", 3.66], ["animal", 3.53]], null, null], "duration": [1.2, 1.1, 1.58, 1.99, 2.98, 22.22, 7.3, 3.27, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/cxRYIDsZzuE_filtered.json b/annotations_filtered/cxRYIDsZzuE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e2380e8b01749490f1a4dc484bd7cd3ca5b9035 --- /dev/null +++ b/annotations_filtered/cxRYIDsZzuE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 50.14], [51.0, 51.53], [53.0, 60.4], [62.0, 67.69], [69.0, 87.69], [88.0, 105.19], [106.0, 107.43], [108.0, 109.61], [111.0, 111.13]], "keep_status": [true, false, true, true, true, false, false, false, false], "silence_prob": [28.91, 0.0, 28.09, 28.11, 28.16, 28.74, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 42.53], ["music", 19.23], ["whack, thwack", 6.43]], null, [["livestock, farm animals, working animals", 27.97], ["cattle, bovinae", 11.55], ["moo", 9.27]], [["speech", 32.81], ["sound effect", 15.95], ["grunt", 14.39]], [["music", 46.92], ["cacophony", 7.41], ["buzz", 5.94]], [["hum", 48.18], ["mains hum", 20.95], ["throbbing", 16.29]], null, null, null], "duration": [11.14, 0.53, 7.4, 5.69, 18.69, 17.19, 1.43, 1.61, 0.13]} \ No newline at end of file diff --git a/annotations_filtered/cxWRWbdsTjc_filtered.json b/annotations_filtered/cxWRWbdsTjc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e21ffa24749e259e594350f668975b071912307a --- /dev/null +++ b/annotations_filtered/cxWRWbdsTjc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.54], [10.0, 10.81], [11.0, 12.38], [16.0, 16.88], [17.0, 17.52], [19.0, 22.64], [26.0, 27.41], [28.0, 28.41], [32.0, 32.61], [35.0, 35.16], [38.0, 38.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [60.89, 0.0, 0.0, 0.0, 0.0, 73.21, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [3.54, 0.81, 1.38, 0.88, 0.52, 3.64, 1.41, 0.41, 0.61, 0.16, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/cxgg3KTdRcM_filtered.json b/annotations_filtered/cxgg3KTdRcM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67bed895fd45160a689b59b3bbb2e30240a1d890 --- /dev/null +++ b/annotations_filtered/cxgg3KTdRcM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.84], [16.0, 16.7], [18.0, 18.99], [21.0, 22.91], [26.0, 34.67], [35.0, 62.58]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 92.8, 46.09], "audiomae_on_audioset": [null, null, null, null, null, [["music", 64.64], ["throbbing", 3.71], ["electronic music", 2.75]]], "duration": [0.84, 0.7, 0.99, 1.91, 8.67, 27.58]} \ No newline at end of file diff --git a/annotations_filtered/cy-OKLuMikk_filtered.json b/annotations_filtered/cy-OKLuMikk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..551e4040dbc113624db6783dfc47160ecc7ce81b --- /dev/null +++ b/annotations_filtered/cy-OKLuMikk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.96], [3.0, 3.5], [5.0, 6.47], [7.0, 9.86], [10.0, 10.12], [10.0, 10.15], [11.0, 11.03], [12.0, 12.23]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 72.46, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.96, 0.5, 1.47, 2.86, 0.12, 0.15, 0.03, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/cy2Xj8Pz2Tk_filtered.json b/annotations_filtered/cy2Xj8Pz2Tk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a79347cf9f60d01ecc75044f88eb8c65e0570a8 --- /dev/null +++ b/annotations_filtered/cy2Xj8Pz2Tk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.16], [1.0, 6.71], [8.0, 8.99], [10.0, 11.01], [14.0, 14.44], [17.0, 17.95], [19.0, 20.83], [21.0, 20.93], [21.0, 22.05], [23.0, 25.79], [29.0, 29.98], [31.0, 30.92], [32.0, 35.13], [36.0, 36.53], [37.0, 37.74], [40.0, 40.96], [42.0, 43.34], [44.0, 56.47], [57.0, 58.04], [59.0, 61.92], [66.0, 65.74], [66.0, 66.97], [67.0, 67.83], [69.0, 69.5], [70.0, 70.51], [72.0, 71.85], [72.0, 77.8], [81.0, 83.07], [83.0, 84.54], [86.0, 99.77], [100.0, 100.11], [115.0, 115.06], [115.0, 119.96], [124.0, 128.92], [132.0, 132.76], [133.0, 145.42], [146.0, 146.53], [152.0, 153.54], [154.0, 154.23], [156.0, 155.83], [157.0, 157.4], [158.0, 159.85], [160.0, 160.91], [162.0, 161.99], [163.0, 163.49], [165.0, 186.26], [188.0, 188.52], [190.0, 190.14], [191.0, 196.64], [197.0, 196.99], [197.0, 205.04]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 31.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.4, 0.0, 0.0, 33.57, 0.0, 0.0, 0.0, 0.0, 38.35, 0.0, 32.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.86, 58.98, 0.0, 34.84, 0.0, 0.0, 51.82, 30.85, 0.0, 33.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.27, 0.0, 0.0, 38.9, 0.0, 40.16], "audiomae_on_audioset": [null, [["noise", 22.76], ["hum", 14.16], ["whale vocalization", 13.76]], null, null, null, null, null, null, null, [["music", 20.35], ["frog", 16.45], ["speech", 8.46]], null, null, [["speech", 48.71], ["hum", 6.03], ["mains hum", 5.7]], null, null, null, null, [["speech", 44.26], ["mains hum", 7.25], ["hum", 6.88]], null, [["whale vocalization", 73.06], ["roaring cats (lions, tigers)", 6.28], ["wild animals", 5.38]], null, null, null, null, null, null, null, null, null, [["speech", 49.03], ["whimper", 5.99], ["crying, sobbing", 4.85]], null, null, null, [["music", 40.79], ["throbbing", 13.02], ["speech", 9.28]], null, [["music", 83.77], ["animal", 2.55], ["electronic music", 1.53]], null, null, null, null, null, null, null, null, null, [["speech", 28.83], ["music", 19.9], ["whack, thwack", 6.34]], null, null, [["music", 30.19], ["throbbing", 8.53], ["speech", 5.07]], null, [["music", 60.16], ["didgeridoo", 7.1], ["throbbing", 6.89]]], "duration": [0.16, 5.71, 0.99, 1.01, 0.44, 0.95, 1.83, -0.07, 1.05, 2.79, 0.98, -0.08, 3.13, 0.53, 0.74, 0.96, 1.34, 12.47, 1.04, 2.92, -0.26, 0.97, 0.83, 0.5, 0.51, -0.15, 5.8, 2.07, 1.54, 13.77, 0.11, 0.06, 4.96, 4.92, 0.76, 12.42, 0.53, 1.54, 0.23, -0.17, 0.4, 1.85, 0.91, -0.01, 0.49, 21.26, 0.52, 0.14, 5.64, -0.01, 8.04]} \ No newline at end of file diff --git a/annotations_filtered/cyEqzALZmeA_filtered.json b/annotations_filtered/cyEqzALZmeA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1e58ad16c3ea86f00ae1051d914f939df70e9cf --- /dev/null +++ b/annotations_filtered/cyEqzALZmeA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.4], [13.0, 13.37], [16.0, 18.03], [21.0, 21.47], [23.0, 25.93], [27.0, 27.8], [29.0, 30.23], [36.0, 35.65], [37.0, 37.69], [39.0, 40.1], [43.0, 67.32], [79.0, 81.08], [84.0, 86.91], [94.0, 94.46], [96.0, 96.33], [108.0, 110.37], [110.0, 120.65], [122.0, 123.97], [129.0, 130.86], [138.0, 149.15], [150.0, 150.47], [151.0, 152.17], [156.0, 157.79], [158.0, 158.82], [163.0, 163.34]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 49.0, 0.0, 41.36, 0.0, 0.0, 0.0, 0.0, 0.0, 34.68, 32.26, 99.98, 0.0, 0.0, 61.18, 61.87, 0.0, 0.0, 53.91, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 38.93], ["saxophone", 14.26], ["brass instrument", 8.67]], null, [["music", 31.16], ["speech", 24.3], ["didgeridoo", 7.27]], null, null, null, null, null, [["music", 47.21], ["brass instrument", 16.26], ["trombone", 12.98]], [["speech", 31.92], ["music", 28.75], ["didgeridoo", 16.72]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.4, 0.37, 2.03, 0.47, 2.93, 0.8, 1.23, -0.35, 0.69, 1.1, 24.32, 2.08, 2.91, 0.46, 0.33, 2.37, 10.65, 1.97, 1.86, 11.15, 0.47, 1.17, 1.79, 0.82, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/cyUf4tLI53o_filtered.json b/annotations_filtered/cyUf4tLI53o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c60a96a9c0d8ce650bf89a752ddf87a03786a5b --- /dev/null +++ b/annotations_filtered/cyUf4tLI53o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.22], [10.0, 11.37], [12.0, 13.54], [16.0, 15.65], [17.0, 17.15], [21.0, 22.3], [29.0, 29.46], [34.0, 34.35], [35.0, 36.75], [37.0, 38.65], [39.0, 40.04], [42.0, 43.87], [45.0, 45.2], [47.0, 48.52], [49.0, 49.76], [52.0, 53.77], [54.0, 55.27], [58.0, 68.98], [69.0, 71.36], [74.0, 75.17], [76.0, 77.14], [80.0, 81.24], [86.0, 85.75], [87.0, 87.93], [89.0, 89.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.3, 32.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.11], ["theremin", 9.87], ["musical instrument", 5.69]], [["foghorn", 75.53], ["trombone", 8.8], ["music", 7.48]], null, null, null, null, null, null], "duration": [0.22, 1.37, 1.54, -0.35, 0.15, 1.3, 0.46, 0.35, 1.75, 1.65, 1.04, 1.87, 0.2, 1.52, 0.76, 1.77, 1.27, 10.98, 2.36, 1.17, 1.14, 1.24, -0.25, 0.93, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/cycPu9OddzU_filtered.json b/annotations_filtered/cycPu9OddzU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..225d9105f66c4394ba9ed1a17a7b79422c01efbd --- /dev/null +++ b/annotations_filtered/cycPu9OddzU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.45], [5.0, 6.29], [7.0, 7.64], [9.0, 9.56], [10.0, 10.64], [15.0, 20.63], [27.0, 27.04], [28.0, 28.63], [31.0, 31.26], [33.0, 34.5], [36.0, 38.15], [40.0, 40.37], [42.0, 41.96], [44.0, 45.72], [48.0, 48.68], [50.0, 73.23], [74.0, 74.76], [76.0, 77.21], [80.0, 81.89], [83.0, 83.84], [85.0, 85.51], [88.0, 95.49], [96.0, 97.85], [99.0, 106.62], [107.0, 108.65], [109.0, 110.61], [111.0, 112.35], [113.0, 114.2], [115.0, 120.88], [126.0, 126.96], [129.0, 129.15], [130.0, 131.16], [133.0, 133.56], [135.0, 135.48], [136.0, 139.46], [141.0, 142.11], [143.0, 143.6], [146.0, 146.52], [149.0, 150.8], [153.0, 155.46], [157.0, 158.94], [164.0, 165.27], [166.0, 170.14], [171.0, 173.69], [174.0, 177.74], [179.0, 183.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [69.74, 0.0, 0.0, 0.0, 0.0, 66.88, 0.0, 0.0, 0.0, 0.0, 51.39, 0.0, 0.0, 0.0, 0.0, 64.63, 0.0, 0.0, 0.0, 0.0, 0.0, 40.48, 0.0, 41.87, 0.0, 0.0, 0.0, 0.0, 38.32, 0.0, 0.0, 0.0, 0.0, 0.0, 59.51, 0.0, 0.0, 0.0, 0.0, 55.31, 0.0, 0.0, 70.86, 56.4, 47.7, 37.16], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 28.19], ["music", 15.14], ["sonar", 14.1]], null, [["gong", 32.46], ["music", 21.7], ["hum", 12.1]], null, null, null, null, [["music", 32.1], ["rumble", 10.52], ["hum", 10.0]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 42.4], ["speech", 24.08], ["music", 14.72]], [["speech", 68.4], ["hum", 4.27], ["rumble", 4.1]]], "duration": [2.45, 1.29, 0.64, 0.56, 0.64, 5.63, 0.04, 0.63, 0.26, 1.5, 2.15, 0.37, -0.04, 1.72, 0.68, 23.23, 0.76, 1.21, 1.89, 0.84, 0.51, 7.49, 1.85, 7.62, 1.65, 1.61, 1.35, 1.2, 5.88, 0.96, 0.15, 1.16, 0.56, 0.48, 3.46, 1.11, 0.6, 0.52, 1.8, 2.46, 1.94, 1.27, 4.14, 2.69, 3.74, 4.03]} \ No newline at end of file diff --git a/annotations_filtered/cypqB_GKzjA_filtered.json b/annotations_filtered/cypqB_GKzjA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4ab8848a63f793d3132fe8ecc52fc767f607806 --- /dev/null +++ b/annotations_filtered/cypqB_GKzjA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.89], [5.0, 6.03], [14.0, 14.27], [19.0, 18.94], [21.0, 23.58], [27.0, 27.92], [29.0, 29.13], [40.0, 40.98], [44.0, 44.81], [45.0, 45.86], [47.0, 48.49], [59.0, 58.87], [68.0, 70.01], [72.0, 73.74], [74.0, 75.39], [94.0, 94.63], [97.0, 97.04], [101.0, 102.39], [104.0, 104.09], [107.0, 108.53], [110.0, 111.28], [114.0, 119.31], [121.0, 126.87], [128.0, 128.26], [139.0, 140.26], [143.0, 143.56], [144.0, 150.85], [152.0, 152.64], [153.0, 164.27], [165.0, 166.65], [167.0, 169.13], [170.0, 170.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 48.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.42, 52.16, 0.0, 0.0, 0.0, 63.96, 0.0, 57.72, 0.0, 63.85, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 42.07], ["music", 24.03], ["crow", 5.72]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.89, 1.03, 0.27, -0.06, 2.58, 0.92, 0.13, 0.98, 0.81, 0.86, 1.49, -0.13, 2.01, 1.74, 1.39, 0.63, 0.04, 1.39, 0.09, 1.53, 1.28, 5.31, 5.87, 0.26, 1.26, 0.56, 6.85, 0.64, 11.27, 1.65, 2.13, 0.06]} \ No newline at end of file diff --git a/annotations_filtered/cz1TJ4r7bOU_filtered.json b/annotations_filtered/cz1TJ4r7bOU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1fbc6bc31448c9c277e511247467e8d51f3f4ddf --- /dev/null +++ b/annotations_filtered/cz1TJ4r7bOU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.85], [14.0, 14.79], [16.0, 18.89], [20.0, 29.46], [29.0, 29.49], [30.0, 29.52], [30.0, 29.94], [30.0, 30.08], [30.0, 30.11], [30.0, 30.28], [30.0, 30.32], [30.0, 30.35], [30.0, 30.38], [30.0, 30.42], [30.0, 30.45], [31.0, 30.55], [31.0, 30.59], [31.0, 30.62], [31.0, 30.65], [31.0, 30.69], [31.0, 32.51], [34.0, 34.5], [35.0, 40.12], [41.0, 46.99], [48.0, 49.99], [51.0, 54.94], [55.0, 55.05], [55.0, 60.2], [63.0, 65.26], [71.0, 72.2], [73.0, 89.97], [90.0, 92.43], [95.0, 96.9], [97.0, 98.04], [99.0, 101.02], [105.0, 110.73], [112.0, 114.45], [117.0, 120.83], [121.0, 123.18], [123.0, 124.75], [127.0, 128.01], [129.0, 130.57], [132.0, 134.52], [135.0, 137.22], [138.0, 139.65], [141.0, 141.89], [143.0, 146.58], [147.0, 149.15], [150.0, 152.78], [153.0, 156.83], [161.0, 161.2], [164.0, 167.66]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, true, true, true, false, false, false, false, false, true, true, false, false, true, true, true, true, false, false], "silence_prob": [35.32, 0.0, 37.62, 34.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.07, 35.5, 0.0, 35.83, 0.0, 32.51, 34.6, 0.0, 31.08, 34.52, 0.0, 0.0, 37.77, 32.53, 35.87, 35.11, 35.0, 0.0, 0.0, 0.0, 38.46, 37.85, 0.0, 0.0, 37.08, 33.63, 35.28, 35.53, 0.0, 35.8], "audiomae_on_audioset": [[["hum", 29.51], ["mains hum", 21.32], ["music", 15.02]], null, [["mains hum", 65.25], ["hum", 21.8], ["music", 4.47]], [["music", 50.35], ["theremin", 23.36], ["musical instrument", 3.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 28.16], ["music", 20.37], ["hum", 12.44]], [["music", 70.09], ["theremin", 12.23], ["musical instrument", 2.76]], null, [["music", 57.27], ["theremin", 10.31], ["hum", 6.18]], null, [["theremin", 31.66], ["music", 28.95], ["speech", 12.93]], [["music", 40.63], ["flute", 22.67], ["wind instrument, woodwind instrument", 13.98]], null, [["music", 84.95], ["theremin", 2.6], ["electronic music", 2.4]], [["music", 13.99], ["dog", 11.43], ["speech", 10.65]], null, null, [["music", 24.23], ["speech", 8.44], ["musical instrument", 8.29]], [["music", 48.65], ["theremin", 9.42], ["musical instrument", 8.51]], [["music", 46.74], ["didgeridoo", 6.47], ["buzz", 4.53]], [["music", 64.3], ["musical instrument", 7.47], ["mains hum", 4.35]], [["mains hum", 32.09], ["hum", 29.34], ["music", 11.09]], null, null, null, [["music", 21.49], ["toothbrush", 8.62], ["speech", 8.36]], [["speech", 30.04], ["music", 18.77], ["mains hum", 13.65]], null, null, [["music", 48.6], ["speech", 9.06], ["musical instrument", 5.41]], [["music", 29.83], ["mains hum", 12.95], ["didgeridoo", 10.17]], [["music", 31.25], ["mains hum", 6.25], ["hum", 4.6]], [["speech", 29.23], ["music", 18.02], ["theremin", 13.48]], null, [["music", 62.11], ["didgeridoo", 4.94], ["theremin", 4.63]]], "duration": [7.85, 0.79, 2.89, 9.46, 0.49, -0.48, -0.06, 0.08, 0.11, 0.28, 0.32, 0.35, 0.38, 0.42, 0.45, -0.45, -0.41, -0.38, -0.35, -0.31, 1.51, 0.5, 5.12, 5.99, 1.99, 3.94, 0.05, 5.2, 2.26, 1.2, 16.97, 2.43, 1.9, 1.04, 2.02, 5.73, 2.45, 3.83, 2.18, 1.75, 1.01, 1.57, 2.52, 2.22, 1.65, 0.89, 3.58, 2.15, 2.78, 3.83, 0.2, 3.66]} \ No newline at end of file diff --git a/annotations_filtered/czBTbtS1YpE_filtered.json b/annotations_filtered/czBTbtS1YpE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bdbf9bce115850b7aff68c8a5762b533bed767ed --- /dev/null +++ b/annotations_filtered/czBTbtS1YpE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.89], [9.0, 11.53], [13.0, 13.83], [15.0, 16.41], [17.0, 17.9], [18.0, 18.52], [21.0, 21.36], [23.0, 27.55], [28.0, 29.34], [30.0, 32.04], [33.0, 34.57], [35.0, 36.05], [36.0, 39.28], [42.0, 44.1], [48.0, 50.06], [55.0, 55.11], [59.0, 62.21], [63.0, 64.96], [66.0, 86.39], [87.0, 87.88], [89.0, 89.8], [91.0, 99.12]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, true, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 42.6, 0.0, 0.0, 0.0, 0.0, 0.0, 36.7, 0.0, 37.97, 0.0, 0.0, 45.98, 31.22, 32.15, 0.0, 31.35, 0.0, 32.17, 0.0, 0.0, 30.99], "audiomae_on_audioset": [null, [["music", 20.1], ["dog", 11.67], ["hum", 10.6]], null, null, null, null, null, [["mains hum", 36.6], ["music", 21.61], ["hum", 14.65]], null, [["cattle, bovinae", 23.19], ["music", 18.33], ["livestock, farm animals, working animals", 14.34]], null, null, [["speech", 22.17], ["music", 12.3], ["musical instrument", 5.24]], [["speech", 52.34], ["music", 7.29], ["thunk", 3.33]], [["music", 61.01], ["didgeridoo", 5.78], ["musical instrument", 3.93]], null, [["music", 32.59], ["speech", 26.56], ["throbbing", 5.99]], null, [["music", 63.68], ["sidetone", 4.48], ["synthesizer", 4.03]], null, null, [["music", 44.61], ["speech", 44.1], ["breaking", 2.93]]], "duration": [0.89, 2.53, 0.83, 1.41, 0.9, 0.52, 0.36, 4.55, 1.34, 2.04, 1.57, 1.05, 3.28, 2.1, 2.06, 0.11, 3.21, 1.96, 20.39, 0.88, 0.8, 8.12]} \ No newline at end of file diff --git a/annotations_filtered/czJL-TPz-5M_filtered.json b/annotations_filtered/czJL-TPz-5M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f768e6c85dd5f9832b9a9283505d9c8fbf50ae26 --- /dev/null +++ b/annotations_filtered/czJL-TPz-5M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 18.82], [19.0, 25.2], [26.0, 39.51], [40.0, 64.12], [64.0, 64.17], [67.0, 67.66], [72.0, 72.22], [73.0, 75.2], [86.0, 90.1], [92.0, 93.21], [94.0, 94.54], [95.0, 95.23], [95.0, 95.3], [95.0, 95.34], [95.0, 95.49], [96.0, 96.65], [99.0, 115.28], [115.0, 115.32], [115.0, 115.35], [115.0, 115.38], [115.0, 115.42], [115.0, 115.45], [115.0, 121.44], [123.0, 124.34], [126.0, 127.08], [129.0, 129.63], [131.0, 131.53], [134.0, 135.57], [138.0, 138.96], [140.0, 145.34], [146.0, 146.42], [147.0, 152.1], [156.0, 165.97], [166.0, 166.33], [170.0, 170.4], [174.0, 175.17]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [53.53, 62.78, 82.97, 71.43, 0.0, 0.0, 0.0, 38.94, 40.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.15, 0.0, 0.0, 0.0, 0.0, 0.0, 51.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.37, 0.0, 85.54, 83.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 31.09], ["music", 17.19], ["grunt", 5.34]], [["music", 22.82], ["speech", 5.52], ["electric shaver, electric razor", 4.78]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [17.82, 6.2, 13.51, 24.12, 0.17, 0.66, 0.22, 2.2, 4.1, 1.21, 0.54, 0.23, 0.3, 0.34, 0.49, 0.65, 16.28, 0.32, 0.35, 0.38, 0.42, 0.45, 6.44, 1.34, 1.08, 0.63, 0.53, 1.57, 0.96, 5.34, 0.42, 5.1, 9.97, 0.33, 0.4, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/czOgJJqehv0_filtered.json b/annotations_filtered/czOgJJqehv0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..820fcfd2fadba0466fc47bdaa03643800f8be288 --- /dev/null +++ b/annotations_filtered/czOgJJqehv0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.36], [21.0, 21.14], [24.0, 25.0], [33.0, 33.88], [34.0, 34.62], [36.0, 35.99], [44.0, 45.03], [47.0, 48.12]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [1.36, 0.14, 1.0, 0.88, 0.62, -0.01, 1.03, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/czU3M9Ye268_filtered.json b/annotations_filtered/czU3M9Ye268_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63418adb6395be6333c5794965682affb3159513 --- /dev/null +++ b/annotations_filtered/czU3M9Ye268_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.16], [7.0, 11.52], [14.0, 14.71], [15.0, 18.62], [19.0, 20.34], [21.0, 32.64], [39.0, 38.94], [40.0, 43.12], [43.0, 43.23], [44.0, 44.79], [46.0, 47.78], [53.0, 54.38], [57.0, 58.56], [60.0, 59.95], [63.0, 66.09], [69.0, 71.07], [74.0, 74.83], [76.0, 89.83], [92.0, 93.9], [95.0, 96.57], [98.0, 109.58]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 43.53, 0.0, 31.89, 0.0, 34.14, 0.0, 45.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 99.95, 0.0, 96.17, 0.0, 0.0, 61.27], "audiomae_on_audioset": [null, [["music", 64.0], ["hum", 10.41], ["mains hum", 3.59]], null, [["cowbell", 31.81], ["music", 25.85], ["sidetone", 5.95]], null, [["music", 49.69], ["speech", 11.64], ["hum", 3.5]], null, [["cowbell", 72.32], ["cattle, bovinae", 8.6], ["music", 5.62]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.16, 4.52, 0.71, 3.62, 1.34, 11.64, -0.06, 3.12, 0.23, 0.79, 1.78, 1.38, 1.56, -0.05, 3.09, 2.07, 0.83, 13.83, 1.9, 1.57, 11.58]} \ No newline at end of file diff --git a/annotations_filtered/czzH5M2bUYc_filtered.json b/annotations_filtered/czzH5M2bUYc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a9140b39e7d0c9a8d1ed01845f641a9fce537ab --- /dev/null +++ b/annotations_filtered/czzH5M2bUYc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.25], [8.0, 8.68], [11.0, 11.47], [15.0, 17.37], [18.0, 19.21], [20.0, 20.12], [21.0, 22.1], [23.0, 24.65], [25.0, 26.55], [29.0, 50.48], [52.0, 67.26], [75.0, 78.29], [79.0, 94.07], [97.0, 100.7], [101.0, 104.67]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 37.74, 0.0, 0.0, 0.0, 0.0, 0.0, 39.25, 35.35, 34.0, 34.68, 53.72, 33.29], "audiomae_on_audioset": [null, null, null, [["theremin", 65.17], ["music", 14.85], ["didgeridoo", 2.84]], null, null, null, null, null, [["music", 43.03], ["sitar", 9.7], ["musical instrument", 8.88]], [["music", 55.37], ["sitar", 14.77], ["carnatic music", 9.53]], [["music", 70.62], ["musical instrument", 12.08], ["carnatic music", 3.29]], [["music", 57.72], ["carnatic music", 11.37], ["musical instrument", 7.72]], null, [["croak", 11.69], ["speech", 11.26], ["frog", 9.07]]], "duration": [1.25, 0.68, 0.47, 2.37, 1.21, 0.12, 1.1, 1.65, 1.55, 21.48, 15.26, 3.29, 15.07, 3.7, 3.67]} \ No newline at end of file