Spaces:
Build error
Build error
Adding files 1
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- annotations_1/--ABd2SeIGE_filtered.json +1 -0
- annotations_1/--QCZKgJt6o_filtered.json +1 -0
- annotations_1/--hendERqm0_filtered.json +1 -0
- annotations_1/-0SHIbuEO3w_filtered.json +1 -0
- annotations_1/-19d_T472co_filtered.json +1 -0
- annotations_1/-1W4xHNKvAk_filtered.json +1 -0
- annotations_1/-1eKufUP5XQ_filtered.json +1 -0
- annotations_1/-1zLU5N6uBU_filtered.json +1 -0
- annotations_1/-2KG4lLGEl0_filtered.json +1 -0
- annotations_1/-2KGPYEFnsU_filtered.json +1 -0
- annotations_1/-2QFIXEHnOY_filtered.json +1 -0
- annotations_1/-5twCD8tAMc_filtered.json +1 -0
- annotations_1/-7-2-088LnM_filtered.json +1 -0
- annotations_1/-7Sow81yi24_filtered.json +1 -0
- annotations_1/-7cV5cWQmxg_filtered.json +1 -0
- annotations_1/-7mzQx0ebqk_filtered.json +1 -0
- annotations_1/-8ajIeIeJpY_filtered.json +1 -0
- annotations_1/-AZg55qXj7U_filtered.json +1 -0
- annotations_1/-BgZFaMJRxM_filtered.json +1 -0
- annotations_1/-CSIqCS1WIk_filtered.json +1 -0
- annotations_1/-DXQJLwDAwg_filtered.json +1 -0
- annotations_1/-DXU2ZHuiTs_filtered.json +1 -0
- annotations_1/-DqmTaUK-Ow_filtered.json +1 -0
- annotations_1/-FQOaUEE69I_filtered.json +1 -0
- annotations_1/-FU65KX7aJs_filtered.json +1 -0
- annotations_1/-G7OPYUlnT0_filtered.json +1 -0
- annotations_1/-H6l6-_elF0_filtered.json +1 -0
- annotations_1/-IV-ZZwXUkw_filtered.json +1 -0
- annotations_1/-JNyHnAi8zk_filtered.json +1 -0
- annotations_1/-Jf-E7oEguU_filtered.json +1 -0
- annotations_1/-JhNO_E3aEE_filtered.json +1 -0
- annotations_1/-KVNfZo-cfc_filtered.json +1 -0
- annotations_1/-KW0wz1xBfw_filtered.json +1 -0
- annotations_1/-Koj9hvcBMk_filtered.json +1 -0
- annotations_1/-Kztqrjp2yw_filtered.json +1 -0
- annotations_1/-LCqZeb1de0_filtered.json +1 -0
- annotations_1/-Lrndfrc9yU_filtered.json +1 -0
- annotations_1/-MNpOKICOx8_filtered.json +1 -0
- annotations_1/-Nzbwerwks8_filtered.json +1 -0
- annotations_1/-OMiOIbouaA_filtered.json +1 -0
- annotations_1/-ON8ZTCiuYo_filtered.json +1 -0
- annotations_1/-OUuZojE3aM_filtered.json +1 -0
- annotations_1/-QT_Af7RLjU_filtered.json +1 -0
- annotations_1/-QZzReak2Ck_filtered.json +1 -0
- annotations_1/-QfKnft9uWY_filtered.json +1 -0
- annotations_1/-Qq6ZZy0yGg_filtered.json +1 -0
- annotations_1/-SkeK7t74oo_filtered.json +1 -0
- annotations_1/-Svsz19yyPM_filtered.json +1 -0
- annotations_1/-U9v7Nz6hOs_filtered.json +1 -0
- annotations_1/-VnQ_KpOBm4_filtered.json +1 -0
annotations_1/--ABd2SeIGE_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[8.0, 12.75], [15.0, 23.94], [27.0, 37.12], [48.0, 47.83], [51.0, 51.43], [60.0, 60.0], [62.0, 69.42], [86.0, 86.32], [93.0, 96.79], [98.0, 98.36], [99.0, 99.6], [100.0, 102.39], [106.0, 113.46]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [31.94, 30.17, 46.33, 0.0, 0.0, 0.0, 68.15, 0.0, 61.97, 0.0, 0.0, 38.33, 39.55], "audiomae_on_audioset": [[["theremin", 29.79], ["music", 28.67], ["hum", 7.9]], [["speech", 57.27], ["explosion", 14.36], ["burst, pop", 7.06]], [["music", 62.43], ["theremin", 8.26], ["cello", 4.68]], null, null, null, null, null, null, null, null, [["music", 21.78], ["musical instrument", 6.05], ["didgeridoo", 5.51]], [["music", 76.58], ["musical instrument", 3.22], ["theremin", 2.27]]], "duration": [4.75, 8.94, 10.12, -0.17, 0.43, 0.0, 7.42, 0.32, 3.79, 0.36, 0.6, 2.39, 7.46]}
|
annotations_1/--QCZKgJt6o_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[2.0, 3.3], [5.0, 6.37], [7.0, 9.76], [14.0, 16.93], [30.0, 31.36], [33.0, 33.54], [35.0, 35.72], [40.0, 46.94], [51.0, 50.68], [52.0, 61.47], [67.0, 69.9], [77.0, 77.35], [107.0, 108.08], [117.0, 117.19], [117.0, 118.18], [127.0, 128.22], [133.0, 134.74], [136.0, 136.24], [140.0, 142.8], [146.0, 149.35], [151.0, 151.31], [152.0, 153.35], [156.0, 156.61], [157.0, 159.6], [164.0, 165.43], [174.0, 175.02]], "keep_status": [false, false, false, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 60.89, 45.59, 0.0, 0.0, 0.0, 35.85, 0.0, 34.71, 61.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.78, 47.2, 0.0, 0.0, 0.0, 39.47, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 26.24], ["vocal music", 7.63], ["singing", 6.21]], null, null, null, [["speech", 18.36], ["moo", 9.75], ["livestock, farm animals, working animals", 8.42]], null, [["chant", 14.05], ["cattle, bovinae", 12.42], ["grunt", 10.88]], null, null, null, null, null, null, null, null, null, [["speech", 49.28], ["hum", 8.71], ["music", 5.69]], null, null, null, [["speech", 31.98], ["music", 6.36], ["hum", 5.44]], null, null], "duration": [1.3, 1.37, 2.76, 2.93, 1.36, 0.54, 0.72, 6.94, -0.32, 9.47, 2.9, 0.35, 1.08, 0.19, 1.18, 1.22, 1.74, 0.24, 2.8, 3.35, 0.31, 1.35, 0.61, 2.6, 1.43, 1.02]}
|
annotations_1/--hendERqm0_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[12.0, 12.56], [14.0, 14.22], [16.0, 21.17], [28.0, 28.76], [32.0, 32.95], [34.0, 34.42], [36.0, 36.15], [38.0, 38.06], [40.0, 40.63], [41.0, 51.34], [53.0, 56.84], [58.0, 59.12], [61.0, 62.31], [66.0, 67.93], [70.0, 71.29], [74.0, 74.75], [77.0, 78.38], [82.0, 84.72]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 30.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.77, 31.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.95], "audiomae_on_audioset": [null, null, [["music", 67.55], ["electronic music", 5.78], ["house music", 4.08]], null, null, null, null, null, null, [["music", 45.64], ["speech", 12.16], ["techno", 9.56]], [["music", 51.69], ["speech", 33.92], ["drum machine", 1.58]], null, null, null, null, null, null, [["music", 30.48], ["sonar", 30.27], ["electronic music", 9.0]]], "duration": [0.56, 0.22, 5.17, 0.76, 0.95, 0.42, 0.15, 0.06, 0.63, 10.34, 3.84, 1.12, 1.31, 1.93, 1.29, 0.75, 1.38, 2.72]}
|
annotations_1/-0SHIbuEO3w_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[56.0, 60.72], [63.0, 122.66], [127.0, 131.94]], "keep_status": [false, false, true], "silence_prob": [29.36, 0.0, 30.22], "audiomae_on_audioset": [[["music", 65.38], ["speech", 7.81], ["throbbing", 3.28]], null, [["speech", 22.67], ["music", 22.28], ["crowd", 5.83]]], "duration": [4.72, 59.66, 4.94]}
|
annotations_1/-19d_T472co_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[1.0, 47.21], [48.0, 48.57], [53.0, 53.25], [53.0, 166.8], [167.0, 167.7], [168.0, 173.04], [175.0, 177.45], [180.0, 201.29], [205.0, 205.17], [206.0, 212.75]], "keep_status": [false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 70.58, 31.68, 35.71, 0.0, 74.76], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 76.85], ["speech", 5.82], ["boing", 1.78]], [["music", 32.21], ["fly, housefly", 10.63], ["buzz", 6.42]], null, null], "duration": [46.21, 0.57, 0.25, 113.8, 0.7, 5.04, 2.45, 21.29, 0.17, 6.75]}
|
annotations_1/-1W4xHNKvAk_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[7.0, 7.62], [16.0, 17.51], [35.0, 35.06], [36.0, 36.69], [50.0, 51.21], [52.0, 53.15], [73.0, 74.11], [85.0, 86.86], [100.0, 101.07], [102.0, 103.08], [114.0, 115.01], [117.0, 117.29], [120.0, 120.75], [135.0, 134.97], [150.0, 150.13], [208.0, 208.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 1.51, 0.06, 0.69, 1.21, 1.15, 1.11, 1.86, 1.07, 1.08, 1.01, 0.29, 0.75, -0.03, 0.13, 0.63]}
|
annotations_1/-1eKufUP5XQ_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[5.0, 5.29], [11.0, 15.52], [20.0, 20.07], [24.0, 24.58], [40.0, 41.15], [44.0, 49.44], [50.0, 51.68], [53.0, 59.09], [64.0, 64.49], [65.0, 65.69], [66.0, 68.1], [79.0, 79.39], [80.0, 80.59], [83.0, 84.33], [89.0, 89.85], [91.0, 97.97], [99.0, 99.39], [100.0, 99.98], [100.0, 102.0], [104.0, 104.41], [105.0, 105.73], [106.0, 106.74], [107.0, 107.97], [110.0, 111.35], [112.0, 113.56], [114.0, 115.64], [116.0, 118.37], [119.0, 123.13]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.9, 0.0, 0.0, 0.0, 90.25, 0.0, 89.72, 0.0, 0.0, 66.51, 0.0, 0.0, 0.0, 0.0, 77.2, 0.0, 0.0, 81.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.92, 94.66], "audiomae_on_audioset": [null, [["speech", 27.69], ["whack, thwack", 9.37], ["busy signal", 8.67]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 4.52, 0.07, 0.58, 1.15, 5.44, 1.68, 6.09, 0.49, 0.69, 2.1, 0.39, 0.59, 1.33, 0.85, 6.97, 0.39, -0.02, 2.0, 0.41, 0.73, 0.74, 0.97, 1.35, 1.56, 1.64, 2.37, 4.13]}
|
annotations_1/-1zLU5N6uBU_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []}
|
annotations_1/-2KG4lLGEl0_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[13.0, 13.27], [14.0, 15.26], [21.0, 21.66], [27.0, 27.48], [31.0, 32.09], [34.0, 34.03], [34.0, 34.96], [36.0, 36.54], [38.0, 39.01], [41.0, 42.52], [43.0, 43.6], [46.0, 46.41], [47.0, 49.2], [51.0, 51.33], [54.0, 55.85], [57.0, 58.55], [68.0, 68.88], [79.0, 79.73], [80.0, 80.94], [84.0, 84.54], [87.0, 87.52], [89.0, 90.24], [101.0, 101.85], [105.0, 105.51], [109.0, 109.65], [111.0, 112.77], [116.0, 116.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.27, 1.26, 0.66, 0.48, 1.09, 0.03, 0.96, 0.54, 1.01, 1.52, 0.6, 0.41, 2.2, 0.33, 1.85, 1.55, 0.88, 0.73, 0.94, 0.54, 0.52, 1.24, 0.85, 0.51, 0.65, 1.77, 0.92]}
|
annotations_1/-2KGPYEFnsU_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[14.0, 14.39], [15.0, 16.73], [17.0, 17.9], [19.0, 20.11], [24.0, 24.53], [25.0, 25.76], [29.0, 33.12], [38.0, 39.55], [41.0, 43.04], [44.0, 44.71], [46.0, 47.39], [50.0, 50.03], [52.0, 53.38], [55.0, 56.1], [59.0, 60.71], [66.0, 66.9], [73.0, 73.94], [78.0, 78.9], [81.0, 80.79], [110.0, 110.1], [116.0, 117.9], [120.0, 119.8], [125.0, 127.04], [129.0, 129.41], [132.0, 132.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.63, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.39, 1.73, 0.9, 1.11, 0.53, 0.76, 4.12, 1.55, 2.04, 0.71, 1.39, 0.03, 1.38, 1.1, 1.71, 0.9, 0.94, 0.9, -0.21, 0.1, 1.9, -0.2, 2.04, 0.41, 0.97]}
|
annotations_1/-2QFIXEHnOY_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[6.0, 16.11], [19.0, 22.35], [24.0, 31.28], [33.0, 33.39], [34.0, 58.75], [59.0, 68.89]], "keep_status": [true, true, true, false, true, true], "silence_prob": [29.59, 29.9, 28.84, 0.0, 29.2, 29.4], "audiomae_on_audioset": [[["music", 34.03], ["buzz", 18.87], ["hum", 9.34]], [["hum", 17.0], ["mains hum", 12.84], ["throbbing", 7.47]], [["fly, housefly", 16.88], ["buzz", 13.34], ["mosquito", 12.24]], null, [["buzz", 13.81], ["hum", 12.07], ["electric shaver, electric razor", 6.64]], [["hum", 22.83], ["mains hum", 10.69], ["fly, housefly", 8.24]]], "duration": [10.11, 3.35, 7.28, 0.39, 24.75, 9.89]}
|
annotations_1/-5twCD8tAMc_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[8.0, 23.65], [25.0, 25.08], [27.0, 28.24], [29.0, 30.91], [35.0, 35.61], [38.0, 42.33], [44.0, 75.29], [76.0, 76.72], [81.0, 89.38]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [33.09, 0.0, 0.0, 0.0, 0.0, 41.56, 0.0, 0.0, 30.12], "audiomae_on_audioset": [[["music", 83.83], ["theremin", 1.62], ["synthesizer", 1.3]], null, null, null, null, [["boat, water vehicle", 16.83], ["music", 14.4], ["vehicle", 11.07]], null, null, [["music", 72.52], ["musical instrument", 4.87], ["cacophony", 2.86]]], "duration": [15.65, 0.08, 1.24, 1.91, 0.61, 4.33, 31.29, 0.72, 8.38]}
|
annotations_1/-7-2-088LnM_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[22.0, 22.2], [23.0, 22.92], [23.0, 25.52], [28.0, 30.13], [35.0, 36.71], [40.0, 42.08], [44.0, 45.2], [45.0, 46.09], [46.0, 48.91], [49.0, 49.25], [50.0, 50.72], [51.0, 52.47], [53.0, 57.54], [59.0, 67.63], [70.0, 72.08], [72.0, 74.56], [82.0, 82.93], [87.0, 99.28], [99.0, 99.5], [100.0, 100.01], [100.0, 100.45], [101.0, 109.46]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 39.47, 36.04, 0.0, 97.11, 0.0, 0.0, 66.63, 0.0, 0.0, 0.0, 71.14, 67.63, 98.99, 43.85, 0.0, 37.46, 0.0, 0.0, 0.0, 42.74], "audiomae_on_audioset": [null, null, [["whale vocalization", 16.24], ["boing", 16.19], ["moo", 10.98]], [["speech", 72.48], ["applause", 5.84], ["radio", 2.77]], null, null, null, null, null, null, null, null, null, null, null, [["music", 62.7], ["burping, eructation", 2.31], ["percussion", 1.49]], null, [["music", 60.25], ["groan", 6.88], ["grunt", 5.85]], null, null, null, [["gasp", 19.11], ["speech", 13.68], ["breaking", 11.58]]], "duration": [0.2, -0.08, 2.52, 2.13, 1.71, 2.08, 1.2, 1.09, 2.91, 0.25, 0.72, 1.47, 4.54, 8.63, 2.08, 2.56, 0.93, 12.28, 0.5, 0.01, 0.45, 8.46]}
|
annotations_1/-7Sow81yi24_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[32.0, 32.53], [33.0, 38.33], [40.0, 42.58], [44.0, 45.69], [47.0, 63.64], [64.0, 66.07], [67.0, 73.43], [75.0, 76.65], [77.0, 79.95], [81.0, 84.52], [86.0, 89.21], [94.0, 96.35], [100.0, 101.29], [102.0, 103.87], [107.0, 107.33], [109.0, 110.39], [114.0, 124.66]], "keep_status": [false, true, false, false, false, true, false, false, false, true, true, false, false, false, false, false, true], "silence_prob": [0.0, 49.92, 54.9, 0.0, 47.94, 35.61, 38.42, 0.0, 43.15, 38.54, 36.11, 45.14, 0.0, 0.0, 0.0, 0.0, 28.26], "audiomae_on_audioset": [null, [["music", 25.69], ["hum", 11.38], ["speech", 11.19]], null, null, [["hum", 39.29], ["mains hum", 20.44], ["music", 15.13]], [["gong", 43.33], ["hum", 9.03], ["singing bowl", 6.05]], [["hum", 50.46], ["throbbing", 24.51], ["mains hum", 10.71]], null, [["music", 41.92], ["mains hum", 17.04], ["hum", 14.08]], [["music", 40.52], ["mains hum", 12.71], ["hum", 12.62]], [["hum", 25.29], ["music", 24.57], ["mains hum", 18.16]], [["music", 60.94], ["theremin", 7.71], ["musical instrument", 3.84]], null, null, null, null, [["music", 56.16], ["vehicle", 7.08], ["car", 4.84]]], "duration": [0.53, 5.33, 2.58, 1.69, 16.64, 2.07, 6.43, 1.65, 2.95, 3.52, 3.21, 2.35, 1.29, 1.87, 0.33, 1.39, 10.66]}
|
annotations_1/-7cV5cWQmxg_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[6.0, 6.34], [8.0, 8.5], [9.0, 9.83], [17.0, 18.98], [21.0, 21.37], [22.0, 23.33], [27.0, 28.56], [32.0, 33.91], [34.0, 38.38], [39.0, 40.36], [42.0, 61.25], [64.0, 66.39], [68.0, 73.47], [80.0, 79.89], [80.0, 80.2], [88.0, 94.09]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.01, 0.0, 41.98, 94.81, 37.09, 0.0, 0.0, 41.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 28.43], ["music", 28.37], ["synthesizer", 5.19]], null, [["mosquito", 27.65], ["fly, housefly", 20.31], ["insect", 8.7]], null, [["speech", 72.72], ["stomach rumble", 4.04], ["animal", 2.28]], null, null, [["speech", 19.75], ["music", 18.08], ["throbbing", 13.72]]], "duration": [0.34, 0.5, 0.83, 1.98, 0.37, 1.33, 1.56, 1.91, 4.38, 1.36, 19.25, 2.39, 5.47, -0.11, 0.2, 6.09]}
|
annotations_1/-7mzQx0ebqk_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[3.0, 3.64], [10.0, 10.27], [14.0, 14.88], [19.0, 20.17], [23.0, 23.01], [24.0, 28.61], [32.0, 34.43], [43.0, 43.29], [45.0, 45.52], [49.0, 49.55], [54.0, 54.06], [62.0, 63.85], [65.0, 72.45], [75.0, 79.84], [82.0, 82.54], [86.0, 89.4], [96.0, 97.44], [98.0, 100.3], [126.0, 125.73], [128.0, 127.7], [131.0, 132.16], [133.0, 133.22], [135.0, 136.95], [141.0, 141.61], [144.0, 143.95], [145.0, 148.66]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 48.27, 73.97, 0.0, 0.0, 0.0, 0.0, 0.0, 61.67, 60.05, 0.0, 94.22, 0.0, 78.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.7], "audiomae_on_audioset": [null, null, null, null, null, [["singing bowl", 23.82], ["music", 21.45], ["burping, eructation", 15.64]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.64, 0.27, 0.88, 1.17, 0.01, 4.61, 2.43, 0.29, 0.52, 0.55, 0.06, 1.85, 7.45, 4.84, 0.54, 3.4, 1.44, 2.3, -0.27, -0.3, 1.16, 0.22, 1.95, 0.61, -0.05, 3.66]}
|
annotations_1/-8ajIeIeJpY_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[1.0, 0.89], [3.0, 5.76], [6.0, 6.86], [8.0, 8.73], [14.0, 15.4], [19.0, 19.99], [22.0, 23.03], [24.0, 24.53], [26.0, 26.33], [34.0, 33.86], [35.0, 35.43], [36.0, 36.31], [37.0, 37.89], [38.0, 39.29], [42.0, 43.29], [44.0, 44.58], [45.0, 45.4], [46.0, 46.4], [48.0, 48.32], [57.0, 57.15], [58.0, 59.56], [60.0, 61.32], [63.0, 63.66], [68.0, 68.47], [74.0, 76.0], [77.0, 78.85], [81.0, 85.8], [86.0, 86.41], [89.0, 90.75], [91.0, 91.93], [92.0, 92.62], [93.0, 93.85]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 45.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.92, 0.0, 83.16, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 34.69], ["radio", 21.67], ["croak", 11.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.11, 2.76, 0.86, 0.73, 1.4, 0.99, 1.03, 0.53, 0.33, -0.14, 0.43, 0.31, 0.89, 1.29, 1.29, 0.58, 0.4, 0.4, 0.32, 0.15, 1.56, 1.32, 0.66, 0.47, 2.0, 1.85, 4.8, 0.41, 1.75, 0.93, 0.62, 0.85]}
|
annotations_1/-AZg55qXj7U_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[4.0, 4.62], [6.0, 61.82], [62.0, 86.7], [88.0, 106.52], [109.0, 152.19], [153.0, 178.44]], "keep_status": [false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 35.0, 31.48, 0.0, 33.88], "audiomae_on_audioset": [null, null, [["music", 83.76], ["hum", 7.02], ["throbbing", 1.65]], [["music", 65.55], ["synthesizer", 5.15], ["hum", 4.37]], null, [["music", 22.0], ["hum", 20.87], ["speech", 11.7]]], "duration": [0.62, 55.82, 24.7, 18.52, 43.19, 25.44]}
|
annotations_1/-BgZFaMJRxM_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[2.0, 5.34], [7.0, 7.79], [9.0, 10.56], [15.0, 17.19], [17.0, 18.17], [19.0, 19.72], [21.0, 23.97], [25.0, 28.31], [30.0, 32.85], [43.0, 43.6], [45.0, 45.55], [48.0, 52.08], [56.0, 61.15], [64.0, 65.4], [67.0, 68.32], [69.0, 69.89], [70.0, 72.89], [74.0, 77.5], [81.0, 83.39], [84.0, 104.89], [106.0, 106.46], [107.0, 108.24], [110.0, 111.57], [115.0, 116.75], [120.0, 120.61], [123.0, 124.21], [126.0, 127.99], [130.0, 131.03], [132.0, 134.27], [135.0, 135.68], [136.0, 137.03], [139.0, 141.13], [142.0, 142.92], [146.0, 145.71], [146.0, 147.06], [149.0, 149.44], [152.0, 156.36], [162.0, 163.31], [164.0, 165.11], [168.0, 168.91], [174.0, 174.97], [175.0, 176.34], [177.0, 178.58], [180.0, 179.91]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [45.75, 0.0, 0.0, 47.98, 0.0, 0.0, 54.43, 50.51, 56.25, 0.0, 0.0, 57.32, 61.67, 0.0, 0.0, 0.0, 39.86, 58.55, 52.51, 33.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.18, 0.0, 0.0, 68.67, 0.0, 0.0, 0.0, 0.0, 47.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["chirp tone", 24.02], ["whale vocalization", 16.52], ["sine wave", 16.23]], null, null, [["music", 31.28], ["whale vocalization", 20.69], ["singing bowl", 6.34]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.97], ["whale vocalization", 14.45], ["hum", 11.47]], null, null, [["hum", 47.44], ["throbbing", 31.47], ["mains hum", 6.89]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 28.27], ["mains hum", 24.35], ["speech", 22.56]], null, null, null, null, null, null, null], "duration": [3.34, 0.79, 1.56, 2.19, 1.17, 0.72, 2.97, 3.31, 2.85, 0.6, 0.55, 4.08, 5.15, 1.4, 1.32, 0.89, 2.89, 3.5, 2.39, 20.89, 0.46, 1.24, 1.57, 1.75, 0.61, 1.21, 1.99, 1.03, 2.27, 0.68, 1.03, 2.13, 0.92, -0.29, 1.06, 0.44, 4.36, 1.31, 1.11, 0.91, 0.97, 1.34, 1.58, -0.09]}
|
annotations_1/-CSIqCS1WIk_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[1.0, 3.82], [5.0, 7.57], [9.0, 10.52], [11.0, 12.31], [14.0, 15.06], [18.0, 27.65], [30.0, 57.5], [58.0, 60.94], [62.0, 64.1], [67.0, 114.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.64, 100.0, 0.0, 0.0, 0.0, 100.0, 99.8, 98.51, 91.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [2.82, 2.57, 1.52, 1.31, 1.06, 9.65, 27.5, 2.94, 2.1, 47.57]}
|
annotations_1/-DXQJLwDAwg_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[5.0, 5.73], [7.0, 7.91], [10.0, 10.0], [10.0, 10.49], [11.0, 12.66], [14.0, 14.22], [15.0, 19.21], [21.0, 21.81], [22.0, 23.03], [24.0, 25.22], [26.0, 28.39], [30.0, 33.35], [36.0, 37.74], [39.0, 43.75], [47.0, 48.32], [50.0, 50.84], [52.0, 54.65], [55.0, 55.95], [58.0, 58.68], [60.0, 59.86], [61.0, 61.82], [63.0, 66.48], [67.0, 67.81], [69.0, 69.42], [71.0, 74.07], [76.0, 76.44], [78.0, 78.39], [81.0, 81.19], [85.0, 85.46], [89.0, 89.78], [92.0, 92.52], [93.0, 93.53], [95.0, 95.79], [100.0, 100.55], [102.0, 103.28], [104.0, 104.95], [107.0, 107.64], [113.0, 114.08], [115.0, 116.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.97, 0.0, 0.0, 0.0, 82.43, 79.07, 0.0, 63.21, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 86.64, 0.0, 0.0, 74.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, 0.91, 0.0, 0.49, 1.66, 0.22, 4.21, 0.81, 1.03, 1.22, 2.39, 3.35, 1.74, 4.75, 1.32, 0.84, 2.65, 0.95, 0.68, -0.14, 0.82, 3.48, 0.81, 0.42, 3.07, 0.44, 0.39, 0.19, 0.46, 0.78, 0.52, 0.53, 0.79, 0.55, 1.28, 0.95, 0.64, 1.08, 1.16]}
|
annotations_1/-DXU2ZHuiTs_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[0.0, 1.16], [1.0, 1.54], [8.0, 8.21], [12.0, 11.92], [13.0, 13.73], [16.0, 16.39], [17.0, 17.66], [23.0, 23.04], [27.0, 28.22], [29.0, 29.4], [31.0, 31.45], [33.0, 33.84], [34.0, 34.74], [36.0, 36.83], [39.0, 39.12], [40.0, 40.09], [41.0, 41.81], [48.0, 48.63], [52.0, 51.98], [55.0, 54.97], [56.0, 56.4], [60.0, 60.39], [62.0, 61.87], [63.0, 62.92], [65.0, 65.35], [67.0, 67.31], [69.0, 69.33], [73.0, 73.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 0.54, 0.21, -0.08, 0.73, 0.39, 0.66, 0.04, 1.22, 0.4, 0.45, 0.84, 0.74, 0.83, 0.12, 0.09, 0.81, 0.63, -0.02, -0.03, 0.4, 0.39, -0.13, -0.08, 0.35, 0.31, 0.33, 0.08]}
|
annotations_1/-DqmTaUK-Ow_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[22.0, 23.33], [24.0, 25.73], [26.0, 34.1], [35.0, 38.38], [40.0, 49.4], [50.0, 52.25], [58.0, 59.34], [65.0, 65.52], [66.0, 66.92]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 73.51, 99.31, 68.41, 69.34, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.33, 1.73, 8.1, 3.38, 9.4, 2.25, 1.34, 0.52, 0.92]}
|
annotations_1/-FQOaUEE69I_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[2.0, 2.71], [4.0, 5.95], [15.0, 20.61], [22.0, 22.4], [23.0, 23.7], [24.0, 25.81], [26.0, 27.08], [28.0, 28.34], [30.0, 30.72], [31.0, 34.33], [35.0, 35.33], [40.0, 43.02], [44.0, 46.09], [48.0, 48.52], [50.0, 50.82], [52.0, 52.96], [57.0, 58.06], [62.0, 62.46], [64.0, 64.47], [66.0, 66.34], [68.0, 71.2], [73.0, 73.8], [75.0, 75.46], [77.0, 78.14], [79.0, 81.5], [84.0, 85.72], [87.0, 87.69], [91.0, 91.62], [93.0, 96.11], [97.0, 97.6], [99.0, 100.25], [104.0, 104.4], [107.0, 107.91], [110.0, 110.25], [111.0, 118.81], [120.0, 122.07], [123.0, 137.61], [139.0, 140.41], [143.0, 143.26], [148.0, 151.63], [152.0, 153.86], [154.0, 156.12], [156.0, 157.47], [158.0, 158.62], [160.0, 161.38], [162.0, 165.4], [166.0, 166.48], [167.0, 167.64], [175.0, 180.82]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 39.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.45, 0.0, 99.44, 91.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.14, 0.0, 0.0, 0.0, 34.43, 0.0, 0.0, 0.0, 84.43, 0.0, 0.0, 0.0, 0.0, 0.0, 79.07, 56.1, 35.47, 0.0, 0.0, 52.39, 0.0, 47.12, 0.0, 0.0, 0.0, 30.41, 0.0, 0.0, 46.02], "audiomae_on_audioset": [null, null, [["speech", 44.89], ["sidetone", 13.71], ["chirp tone", 11.39]], null, null, null, null, null, null, [["speech", 42.88], ["crackle", 7.42], ["crushing", 4.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 56.83], ["sine wave", 15.21], ["sidetone", 8.1]], null, null, null, null, null, null, null, null, null, null, null, [["hum", 32.18], ["music", 29.24], ["mains hum", 12.57]], null, null, null, null, [["speech", 36.44], ["sidetone", 31.39], ["music", 8.37]], null, null, null, [["speech", 27.73], ["livestock, farm animals, working animals", 11.15], ["cattle, bovinae", 5.06]], null, null, [["music", 18.98], ["chirp tone", 13.64], ["crushing", 12.95]]], "duration": [0.71, 1.95, 5.61, 0.4, 0.7, 1.81, 1.08, 0.34, 0.72, 3.33, 0.33, 3.02, 2.09, 0.52, 0.82, 0.96, 1.06, 0.46, 0.47, 0.34, 3.2, 0.8, 0.46, 1.14, 2.5, 1.72, 0.69, 0.62, 3.11, 0.6, 1.25, 0.4, 0.91, 0.25, 7.81, 2.07, 14.61, 1.41, 0.26, 3.63, 1.86, 2.12, 1.47, 0.62, 1.38, 3.4, 0.48, 0.64, 5.82]}
|
annotations_1/-FU65KX7aJs_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[9.0, 13.58], [14.0, 15.28], [17.0, 16.95], [19.0, 39.48], [41.0, 52.96], [54.0, 69.43], [70.0, 74.93], [76.0, 77.58], [78.0, 97.44], [98.0, 98.88], [99.0, 100.03], [102.0, 103.03], [104.0, 105.33], [111.0, 111.0], [116.0, 117.07], [121.0, 122.52], [125.0, 125.81], [126.0, 126.32], [126.0, 130.45], [132.0, 132.93], [134.0, 137.42], [138.0, 138.32], [139.0, 139.85], [141.0, 141.89], [145.0, 148.1], [149.0, 149.18], [171.0, 171.22], [171.0, 171.36], [175.0, 174.77]], "keep_status": [false, false, false, true, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, true, false, false, false, false], "silence_prob": [59.24, 0.0, 0.0, 30.61, 32.83, 30.67, 39.7, 0.0, 36.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.69, 0.0, 49.54, 0.0, 0.0, 0.0, 41.34, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 39.55], ["didgeridoo", 17.69], ["fly, housefly", 10.38]], [["music", 58.18], ["synthesizer", 12.1], ["hum", 7.36]], [["music", 54.02], ["didgeridoo", 24.44], ["synthesizer", 4.28]], [["wheeze", 12.09], ["speech", 7.39], ["frog", 6.24]], null, [["speech", 38.1], ["animal", 17.99], ["livestock, farm animals, working animals", 12.74]], null, null, null, null, null, null, null, null, null, [["speech", 55.95], ["animal", 9.45], ["whale vocalization", 4.16]], null, [["hum", 29.43], ["mains hum", 18.48], ["music", 9.87]], null, null, null, [["mains hum", 28.61], ["hum", 27.62], ["radio", 8.48]], null, null, null, null], "duration": [4.58, 1.28, -0.05, 20.48, 11.96, 15.43, 4.93, 1.58, 19.44, 0.88, 1.03, 1.03, 1.33, 0.0, 1.07, 1.52, 0.81, 0.32, 4.45, 0.93, 3.42, 0.32, 0.85, 0.89, 3.1, 0.18, 0.22, 0.36, -0.23]}
|
annotations_1/-G7OPYUlnT0_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[8.0, 7.89], [23.0, 23.26], [25.0, 25.29], [31.0, 30.89], [93.0, 93.24]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [-0.11, 0.26, 0.29, -0.11, 0.24]}
|
annotations_1/-H6l6-_elF0_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[6.0, 8.13], [13.0, 14.25], [17.0, 17.69], [20.0, 21.29], [26.0, 37.62], [39.0, 48.19], [52.0, 52.44], [57.0, 57.79], [62.0, 62.53], [66.0, 67.32], [76.0, 76.86], [81.0, 81.7], [85.0, 86.36], [95.0, 96.08], [103.0, 105.76], [114.0, 115.53], [120.0, 120.78], [125.0, 125.81], [133.0, 133.24], [133.0, 138.7], [141.0, 142.01], [144.0, 145.56], [146.0, 148.44], [150.0, 150.35], [154.0, 154.97], [158.0, 157.72], [159.0, 159.95], [163.0, 163.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [96.17, 0.0, 0.0, 0.0, 78.55, 90.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 0.0, 0.0, 0.0, 48.02, 0.0, 0.0, 56.78, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 10.24], ["thunk", 7.46], ["speech", 7.36]], null, null, null, null, null, null, null, null], "duration": [2.13, 1.25, 0.69, 1.29, 11.62, 9.19, 0.44, 0.79, 0.53, 1.32, 0.86, 0.7, 1.36, 1.08, 2.76, 1.53, 0.78, 0.81, 0.24, 5.7, 1.01, 1.56, 2.44, 0.35, 0.97, -0.28, 0.95, 0.65]}
|
annotations_1/-IV-ZZwXUkw_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[9.0, 26.13], [29.0, 30.69], [35.0, 40.22], [41.0, 43.88], [47.0, 52.44], [52.0, 116.23], [118.0, 124.95], [125.0, 163.73]], "keep_status": [false, false, true, true, true, false, true, false], "silence_prob": [30.6, 0.0, 28.97, 29.44, 28.46, 0.0, 28.72, 0.0], "audiomae_on_audioset": [[["throbbing", 56.58], ["hum", 10.19], ["music", 9.05]], null, [["music", 33.25], ["grunt", 15.2], ["fart", 12.17]], [["breaking", 28.12], ["whack, thwack", 15.12], ["music", 8.46]], [["zipper (clothing)", 30.8], ["whack, thwack", 11.18], ["smash, crash", 7.28]], null, [["groan", 18.26], ["music", 13.46], ["whack, thwack", 11.18]], null], "duration": [17.13, 1.69, 5.22, 2.88, 5.44, 64.23, 6.95, 38.73]}
|
annotations_1/-JNyHnAi8zk_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[8.0, 20.11], [20.0, 20.73], [22.0, 23.35], [24.0, 25.44], [26.0, 35.33], [39.0, 40.05], [42.0, 53.35], [54.0, 55.71], [57.0, 57.11], [59.0, 65.6], [68.0, 85.14], [91.0, 100.55], [103.0, 119.28], [121.0, 123.5], [126.0, 148.81], [149.0, 150.21], [151.0, 151.56], [153.0, 170.6]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [28.69, 0.0, 0.0, 0.0, 28.99, 0.0, 29.89, 0.0, 0.0, 28.67, 28.77, 28.61, 28.68, 29.78, 28.67, 0.0, 0.0, 29.53], "audiomae_on_audioset": [[["music", 45.86], ["speech", 33.8], ["crowd", 1.63]], null, null, null, [["music", 48.28], ["speech", 5.84], ["buzz", 2.5]], null, [["music", 56.42], ["musical instrument", 3.38], ["middle eastern music", 3.11]], null, null, [["music", 55.47], ["speech", 22.82], ["electronic music", 4.18]], [["music", 61.66], ["speech", 7.65], ["vehicle", 5.05]], [["music", 91.63], ["ice cream truck, ice cream van", 1.27], ["speech", 1.13]], [["music", 83.45], ["speech", 12.02], ["electronic music", 0.56]], [["music", 44.67], ["middle eastern music", 9.38], ["musical instrument", 6.41]], [["music", 85.64], ["electronic music", 5.03], ["speech", 1.37]], null, null, [["music", 60.08], ["speech", 15.87], ["vehicle", 1.54]]], "duration": [12.11, 0.73, 1.35, 1.44, 9.33, 1.05, 11.35, 1.71, 0.11, 6.6, 17.14, 9.55, 16.28, 2.5, 22.81, 1.21, 0.56, 17.6]}
|
annotations_1/-Jf-E7oEguU_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[6.0, 94.05]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [88.05]}
|
annotations_1/-JhNO_E3aEE_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[6.0, 6.03], [7.0, 7.7], [8.0, 8.18], [10.0, 10.69], [12.0, 12.23], [14.0, 14.5], [24.0, 24.92], [26.0, 29.08], [30.0, 29.83], [31.0, 31.11], [32.0, 31.85], [33.0, 33.91], [38.0, 44.12], [45.0, 45.59], [46.0, 47.22], [48.0, 49.91], [51.0, 52.44], [54.0, 67.9], [69.0, 73.95], [76.0, 76.25], [77.0, 82.76], [84.0, 83.98], [85.0, 88.94], [91.0, 93.24], [94.0, 94.91], [96.0, 96.23], [97.0, 100.84], [102.0, 102.86], [104.0, 104.73], [106.0, 107.47], [112.0, 113.88], [115.0, 116.78], [118.0, 118.57], [119.0, 121.81], [123.0, 132.49], [134.0, 134.79], [135.0, 180.39], [181.0, 185.43], [187.0, 191.66], [193.0, 196.94], [200.0, 204.26], [209.0, 211.94], [214.0, 218.13], [218.0, 220.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.56, 0.0, 0.0, 0.0, 0.0, 45.65, 0.0, 0.0, 0.0, 0.0, 64.52, 45.75, 0.0, 96.77, 0.0, 58.89, 82.61, 0.0, 0.0, 99.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.0, 97.83, 0.0, 0.0, 99.31, 94.37, 81.71, 79.94, 81.17, 72.75, 65.32], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 73.25], ["thunk", 3.4], ["inside, small room", 1.41]], null, null, null, null, [["speech", 48.32], ["heart sounds, heartbeat", 12.75], ["stomach rumble", 11.88]], null, null, null, null, null, [["hum", 46.92], ["mains hum", 17.11], ["speech", 7.97]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.03, 0.7, 0.18, 0.69, 0.23, 0.5, 0.92, 3.08, -0.17, 0.11, -0.15, 0.91, 6.12, 0.59, 1.22, 1.91, 1.44, 13.9, 4.95, 0.25, 5.76, -0.02, 3.94, 2.24, 0.91, 0.23, 3.84, 0.86, 0.73, 1.47, 1.88, 1.78, 0.57, 2.81, 9.49, 0.79, 45.39, 4.43, 4.66, 3.94, 4.26, 2.94, 4.13, 2.75]}
|
annotations_1/-KVNfZo-cfc_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[2.0, 2.86], [4.0, 5.04], [6.0, 6.08], [10.0, 10.3], [11.0, 11.26], [12.0, 12.56], [15.0, 15.16], [18.0, 18.81], [21.0, 22.84], [23.0, 25.29], [26.0, 29.89], [33.0, 34.5], [36.0, 36.78], [37.0, 37.98], [39.0, 39.39], [40.0, 43.23], [46.0, 46.89], [48.0, 48.2], [49.0, 49.25], [50.0, 50.18], [50.0, 52.25], [55.0, 55.22], [56.0, 58.29], [60.0, 60.27], [63.0, 63.54], [66.0, 66.61], [71.0, 71.76], [91.0, 91.54], [93.0, 94.46], [95.0, 96.9], [98.0, 99.03], [100.0, 101.51], [102.0, 104.38], [106.0, 107.45], [109.0, 111.77], [113.0, 116.13], [118.0, 118.77], [120.0, 120.95], [122.0, 123.48], [126.0, 127.28], [128.0, 129.29], [131.0, 133.98], [136.0, 137.96], [139.0, 147.39], [151.0, 152.29], [155.0, 155.92], [158.0, 161.6], [168.0, 169.25], [171.0, 171.21], [173.0, 173.45], [175.0, 176.98], [180.0, 184.87], [186.0, 188.87], [190.0, 191.42], [193.0, 194.78], [196.0, 196.45], [198.0, 199.35], [201.0, 201.55], [203.0, 204.31], [205.0, 206.95], [209.0, 209.39], [210.0, 224.24], [228.0, 229.17], [231.0, 235.28], [236.0, 239.79], [241.0, 242.06], [244.0, 248.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.05, 94.37, 0.0, 0.0, 0.0, 0.0, 56.93, 0.0, 0.0, 0.0, 0.0, 96.29, 0.0, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.33, 0.0, 99.59, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 0.0, 96.42, 0.0, 0.0, 97.73, 0.0, 0.0, 0.0, 0.0, 99.95, 65.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.2, 0.0, 85.17, 92.15, 0.0, 84.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["whale vocalization", 60.93], ["speech", 6.52], ["sidetone", 5.62]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 38.5], ["mains hum", 24.84], ["throbbing", 16.21]], null, null, null, null, null], "duration": [0.86, 1.04, 0.08, 0.3, 0.26, 0.56, 0.16, 0.81, 1.84, 2.29, 3.89, 1.5, 0.78, 0.98, 0.39, 3.23, 0.89, 0.2, 0.25, 0.18, 2.25, 0.22, 2.29, 0.27, 0.54, 0.61, 0.76, 0.54, 1.46, 1.9, 1.03, 1.51, 2.38, 1.45, 2.77, 3.13, 0.77, 0.95, 1.48, 1.28, 1.29, 2.98, 1.96, 8.39, 1.29, 0.92, 3.6, 1.25, 0.21, 0.45, 1.98, 4.87, 2.87, 1.42, 1.78, 0.45, 1.35, 0.55, 1.31, 1.95, 0.39, 14.24, 1.17, 4.28, 3.79, 1.06, 4.41]}
|
annotations_1/-KW0wz1xBfw_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[13.0, 13.09], [17.0, 19.9], [20.0, 26.03], [26.0, 26.5], [27.0, 27.62], [28.0, 27.89], [29.0, 29.64], [32.0, 96.55], [100.0, 121.73], [122.0, 127.13], [128.0, 130.57], [132.0, 134.91], [136.0, 138.37]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 63.53, 39.72, 0.0, 0.0, 0.0, 0.0, 0.0, 36.15, 99.99, 90.95, 99.26, 60.6], "audiomae_on_audioset": [null, null, [["music", 51.35], ["theremin", 7.7], ["singing bowl", 5.05]], null, null, null, null, null, [["rumble", 19.05], ["explosion", 14.27], ["hum", 9.71]], null, null, null, null], "duration": [0.09, 2.9, 6.03, 0.5, 0.62, -0.11, 0.64, 64.55, 21.73, 5.13, 2.57, 2.91, 2.37]}
|
annotations_1/-Koj9hvcBMk_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[23.0, 24.63], [25.0, 26.52], [27.0, 28.17], [37.0, 38.55], [43.0, 46.13], [47.0, 47.44], [48.0, 48.81], [51.0, 51.66], [53.0, 53.89], [56.0, 56.54], [58.0, 58.01], [59.0, 59.56], [61.0, 61.11], [77.0, 82.56], [85.0, 86.1], [86.0, 86.97], [89.0, 90.24], [98.0, 98.22], [99.0, 99.0], [104.0, 104.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.63, 1.52, 1.17, 1.55, 3.13, 0.44, 0.81, 0.66, 0.89, 0.54, 0.01, 0.56, 0.11, 5.56, 1.1, 0.97, 1.24, 0.22, 0.0, 0.63]}
|
annotations_1/-Kztqrjp2yw_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[2.0, 1.75], [3.0, 3.5], [5.0, 5.48], [6.0, 6.67], [8.0, 90.78], [92.0, 92.53], [94.0, 97.19], [99.0, 102.49], [106.0, 107.77], [111.0, 114.93], [116.0, 117.59], [119.0, 122.47], [127.0, 129.19], [133.0, 133.78], [136.0, 140.86], [144.0, 144.32], [147.0, 160.79], [162.0, 175.36], [177.0, 184.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.55, 99.84, 0.0, 100.0, 0.0, 99.76, 81.0, 0.0, 59.15, 0.0, 30.67, 32.25, 55.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 38.68], ["cattle, bovinae", 31.7], ["moo", 22.6]], [["music", 14.27], ["fly, housefly", 11.78], ["sidetone", 7.68]], null], "duration": [-0.25, 0.5, 0.48, 0.67, 82.78, 0.53, 3.19, 3.49, 1.77, 3.93, 1.59, 3.47, 2.19, 0.78, 4.86, 0.32, 13.79, 13.36, 7.47]}
|
annotations_1/-LCqZeb1de0_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[6.0, 7.48], [9.0, 10.02], [14.0, 15.04], [16.0, 20.28], [23.0, 23.09], [26.0, 26.22], [28.0, 28.29], [33.0, 35.14], [36.0, 38.13], [46.0, 47.95], [54.0, 62.11], [69.0, 69.99], [75.0, 88.37], [90.0, 90.59], [92.0, 92.67], [95.0, 103.05], [106.0, 108.55], [112.0, 113.0], [116.0, 123.25], [126.0, 127.82], [134.0, 135.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 88.83, 0.0, 0.0, 0.0, 89.9, 60.89, 0.0, 92.97, 0.0, 99.98, 0.0, 0.0, 99.88, 99.95, 0.0, 83.7, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.48, 1.02, 1.04, 4.28, 0.09, 0.22, 0.29, 2.14, 2.13, 1.95, 8.11, 0.99, 13.37, 0.59, 0.67, 8.05, 2.55, 1.0, 7.25, 1.82, 1.94]}
|
annotations_1/-Lrndfrc9yU_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []}
|
annotations_1/-MNpOKICOx8_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[2.0, 3.3], [5.0, 7.89], [10.0, 9.78], [11.0, 11.89], [18.0, 19.74], [22.0, 25.59], [26.0, 26.35], [34.0, 35.4], [38.0, 37.99], [48.0, 49.69], [50.0, 50.25], [51.0, 52.41], [54.0, 57.33], [59.0, 60.99], [63.0, 63.59], [64.0, 64.35], [66.0, 77.57], [80.0, 81.77], [86.0, 93.02], [93.0, 94.74], [96.0, 96.84], [97.0, 100.74], [103.0, 103.17], [106.0, 106.57], [112.0, 113.22], [114.0, 117.83], [118.0, 119.85], [121.0, 121.36], [122.0, 123.42], [124.0, 132.61], [133.0, 134.64], [138.0, 138.86], [140.0, 140.0]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 44.26, 0.0, 0.0, 0.0, 36.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.71, 0.0, 0.0, 0.0, 45.49, 0.0, 67.13, 0.0, 0.0, 95.78, 0.0, 0.0, 0.0, 74.29, 0.0, 0.0, 0.0, 65.32, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["sidetone", 27.19], ["speech", 12.83], ["fly, housefly", 12.71]], null, null, null, [["music", 22.44], ["speech", 13.4], ["frog", 11.1]], null, null, null, null, null, null, null, null, null, null, [["thunk", 77.32], ["music", 10.1], ["mosquito", 3.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.3, 2.89, -0.22, 0.89, 1.74, 3.59, 0.35, 1.4, -0.01, 1.69, 0.25, 1.41, 3.33, 1.99, 0.59, 0.35, 11.57, 1.77, 7.02, 1.74, 0.84, 3.74, 0.17, 0.57, 1.22, 3.83, 1.85, 0.36, 1.42, 8.61, 1.64, 0.86, 0.0]}
|
annotations_1/-Nzbwerwks8_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[1.0, 1.93], [5.0, 5.86], [6.0, 12.97], [18.0, 19.21], [20.0, 23.06], [26.0, 28.95], [34.0, 39.63], [42.0, 42.09], [43.0, 44.83], [50.0, 54.41], [55.0, 73.7], [79.0, 82.31], [84.0, 84.86], [86.0, 92.77], [98.0, 101.33], [105.0, 108.51], [115.0, 119.62]], "keep_status": [false, false, false, false, true, true, true, false, false, false, false, false, false, true, true, true, false], "silence_prob": [0.0, 0.0, 39.11, 0.0, 34.11, 33.41, 31.43, 0.0, 0.0, 31.21, 30.91, 30.75, 0.0, 31.68, 47.54, 36.56, 32.04], "audiomae_on_audioset": [null, null, [["speech", 47.52], ["music", 15.35], ["hum", 12.1]], null, [["speech", 52.2], ["music", 8.99], ["sidetone", 8.27]], [["speech", 57.53], ["fly, housefly", 6.35], ["music", 3.85]], [["speech", 22.43], ["fart", 12.6], ["cattle, bovinae", 9.65]], null, null, [["speech", 71.3], ["music", 6.04], ["explosion", 2.52]], [["speech", 70.13], ["breaking", 8.66], ["music", 4.96]], [["speech", 63.9], ["music", 4.9], ["explosion", 3.03]], null, [["whack, thwack", 26.01], ["music", 22.96], ["groan", 9.42]], [["throbbing", 19.86], ["fly, housefly", 16.49], ["music", 11.74]], [["music", 42.78], ["hum", 13.51], ["didgeridoo", 6.94]], [["music", 41.78], ["speech", 22.02], ["drum machine", 6.29]]], "duration": [0.93, 0.86, 6.97, 1.21, 3.06, 2.95, 5.63, 0.09, 1.83, 4.41, 18.7, 3.31, 0.86, 6.77, 3.33, 3.51, 4.62]}
|
annotations_1/-OMiOIbouaA_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[8.0, 11.3], [12.0, 13.78], [15.0, 16.83], [17.0, 26.6], [29.0, 41.88], [43.0, 44.95], [46.0, 48.12], [57.0, 61.13], [62.0, 63.8], [76.0, 76.89], [80.0, 80.7], [83.0, 85.8], [89.0, 89.38], [90.0, 90.83], [92.0, 92.16], [97.0, 98.05], [98.0, 102.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [96.17, 0.0, 0.0, 96.29, 91.64, 0.0, 93.76, 81.53, 0.0, 0.0, 0.0, 87.55, 0.0, 0.0, 0.0, 0.0, 46.02], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.53], ["speech", 9.03], ["telephone", 2.99]]], "duration": [3.3, 1.78, 1.83, 9.6, 12.88, 1.95, 2.12, 4.13, 1.8, 0.89, 0.7, 2.8, 0.38, 0.83, 0.16, 1.05, 4.69]}
|
annotations_1/-ON8ZTCiuYo_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[18.0, 19.47], [22.0, 22.92], [25.0, 30.74], [32.0, 38.31], [39.0, 39.31], [41.0, 52.03], [55.0, 57.35], [60.0, 65.16], [65.0, 66.8], [69.0, 72.5], [73.0, 75.17], [76.0, 81.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 80.82, 85.17, 0.0, 86.82, 38.59, 56.33, 0.0, 66.15, 57.09, 68.15], "audiomae_on_audioset": [null, null, null, null, null, null, [["sine wave", 32.95], ["chirp tone", 25.13], ["tuning fork", 17.12]], null, null, null, null, null], "duration": [1.47, 0.92, 5.74, 6.31, 0.31, 11.03, 2.35, 5.16, 1.8, 3.5, 2.17, 5.53]}
|
annotations_1/-OUuZojE3aM_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[32.0, 33.02], [33.0, 35.07], [36.0, 100.26], [101.0, 101.66], [102.0, 104.99], [106.0, 132.7], [133.0, 144.86], [146.0, 161.6], [162.0, 161.64], [162.0, 161.72], [162.0, 161.77], [162.0, 162.01], [162.0, 162.06], [162.0, 162.13], [162.0, 162.16], [162.0, 162.3], [162.0, 162.45], [162.0, 162.48], [164.0, 168.07]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 70.16, 0.0, 0.0, 38.05, 44.2, 63.74, 43.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.26], "audiomae_on_audioset": [null, null, null, null, [["speech", 65.43], ["music", 11.35], ["inside, small room", 3.15]], [["music", 33.49], ["synthesizer", 10.78], ["sine wave", 7.62]], null, [["music", 49.94], ["theremin", 12.22], ["singing bowl", 7.74]], null, null, null, null, null, null, null, null, null, null, [["whimper", 30.1], ["speech", 8.43], ["groan", 7.73]]], "duration": [1.02, 2.07, 64.26, 0.66, 2.99, 26.7, 11.86, 15.6, -0.36, -0.28, -0.23, 0.01, 0.06, 0.13, 0.16, 0.3, 0.45, 0.48, 4.07]}
|
annotations_1/-QT_Af7RLjU_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[8.0, 16.73], [17.0, 18.45], [23.0, 24.22], [34.0, 34.18], [38.0, 38.35], [42.0, 41.71], [42.0, 42.01], [48.0, 52.41], [57.0, 57.13], [58.0, 59.0], [66.0, 66.19], [69.0, 68.91], [74.0, 76.0], [79.0, 80.03], [82.0, 83.15], [84.0, 94.04], [102.0, 101.65], [102.0, 101.76], [113.0, 113.32], [122.0, 130.72], [133.0, 133.84]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [52.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.95, 0.0, 0.0, 0.0, 0.0, 61.77, 0.0, 0.0, 51.28, 0.0, 0.0, 0.0, 37.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 27.06], ["animal", 11.71], ["whale vocalization", 10.93]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 79.45], ["whack, thwack", 3.97], ["breaking", 2.23]], null], "duration": [8.73, 1.45, 1.22, 0.18, 0.35, -0.29, 0.01, 4.41, 0.13, 1.0, 0.19, -0.09, 2.0, 1.03, 1.15, 10.04, -0.35, -0.24, 0.32, 8.72, 0.84]}
|
annotations_1/-QZzReak2Ck_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[73.0, 93.02], [96.0, 97.28], [98.0, 101.12], [101.0, 103.42], [104.0, 104.9], [106.0, 107.84], [109.0, 113.1], [114.0, 114.67], [118.0, 120.85], [122.0, 121.85], [123.0, 151.38], [151.0, 151.41], [151.0, 151.44], [151.0, 151.48], [153.0, 156.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.12, 0.0, 66.03, 54.17, 0.0, 0.0, 72.31, 0.0, 35.37, 0.0, 32.58, 0.0, 0.0, 0.0, 81.71], "audiomae_on_audioset": [[["music", 43.13], ["throbbing", 20.27], ["hum", 15.46]], null, null, null, null, null, null, null, [["music", 73.1], ["speech", 5.41], ["didgeridoo", 4.54]], null, [["music", 50.95], ["speech", 24.54], ["whack, thwack", 2.62]], null, null, null, null], "duration": [20.02, 1.28, 3.12, 2.42, 0.9, 1.84, 4.1, 0.67, 2.85, -0.15, 28.38, 0.41, 0.44, 0.48, 3.09]}
|
annotations_1/-QfKnft9uWY_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[76.0, 76.37], [76.0, 76.4], [83.0, 87.86], [90.0, 95.49], [100.0, 141.94], [144.0, 149.89]], "keep_status": [false, false, true, true, false, true], "silence_prob": [0.0, 0.0, 35.27, 39.77, 0.0, 31.75], "audiomae_on_audioset": [null, null, [["speech", 42.89], ["radio", 15.68], ["sidetone", 7.55]], [["fart", 25.2], ["speech", 23.95], ["fly, housefly", 8.6]], null, [["fart", 49.09], ["music", 8.72], ["sound effect", 4.1]]], "duration": [0.37, 0.4, 4.86, 5.49, 41.94, 5.89]}
|
annotations_1/-Qq6ZZy0yGg_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[1.0, 1.61], [3.0, 2.98], [7.0, 7.15], [13.0, 16.6], [17.0, 18.42], [22.0, 23.35], [26.0, 30.0], [36.0, 37.71], [45.0, 50.68], [61.0, 85.45], [85.0, 85.51], [88.0, 121.51], [127.0, 166.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.34, 0.0, 0.0, 29.25, 0.0, 29.51, 29.13, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 54.78], ["speech", 24.0], ["sidetone", 3.84]], null, null, [["music", 76.68], ["musical instrument", 4.58], ["speech", 2.85]], null, [["music", 74.26], ["boing", 4.46], ["musical instrument", 4.37]], [["music", 81.65], ["didgeridoo", 3.24], ["musical instrument", 1.66]], null, null, null], "duration": [0.61, -0.02, 0.15, 3.6, 1.42, 1.35, 4.0, 1.71, 5.68, 24.45, 0.51, 33.51, 39.8]}
|
annotations_1/-SkeK7t74oo_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[8.0, 9.29], [14.0, 15.6], [16.0, 16.36], [17.0, 23.04], [33.0, 33.61], [40.0, 41.99], [45.0, 44.93], [47.0, 51.95], [60.0, 72.52], [82.0, 83.03], [88.0, 94.61], [99.0, 104.11], [105.0, 114.79], [118.0, 119.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.73, 0.0, 0.0, 0.0, 31.13, 32.7, 0.0, 33.21, 33.52, 34.03, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 53.63], ["speech", 13.05], ["saxophone", 3.62]], null, null, null, [["sidetone", 62.27], ["music", 15.8], ["throbbing", 3.05]], [["music", 47.52], ["speech", 27.62], ["sidetone", 5.08]], null, [["music", 61.33], ["sidetone", 11.47], ["speech", 6.25]], [["music", 60.48], ["house music", 4.09], ["sampler", 2.07]], [["music", 57.62], ["hum", 9.52], ["saxophone", 3.15]], null], "duration": [1.29, 1.6, 0.36, 6.04, 0.61, 1.99, -0.07, 4.95, 12.52, 1.03, 6.61, 5.11, 9.79, 1.1]}
|
annotations_1/-Svsz19yyPM_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[2.0, 4.4], [9.0, 9.22], [11.0, 18.03], [19.0, 19.53], [21.0, 28.49], [31.0, 76.1], [78.0, 81.51], [84.0, 92.16], [94.0, 99.94], [102.0, 102.32], [103.0, 103.5], [106.0, 105.85], [106.0, 106.84], [109.0, 109.0], [111.0, 111.48], [112.0, 114.94], [120.0, 121.19], [123.0, 124.21], [126.0, 140.12], [141.0, 149.39], [153.0, 155.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.51, 0.0, 96.04, 0.0, 51.39, 0.0, 89.54, 68.67, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 0.0, 0.0, 45.46, 42.88, 45.14], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 76.66], ["sampler", 4.29], ["drum machine", 4.04]], [["music", 46.72], ["hum", 17.85], ["throbbing", 13.36]], [["beatboxing", 56.92], ["music", 17.26], ["speech", 6.22]]], "duration": [2.4, 0.22, 7.03, 0.53, 7.49, 45.1, 3.51, 8.16, 5.94, 0.32, 0.5, -0.15, 0.84, 0.0, 0.48, 2.94, 1.19, 1.21, 14.12, 8.39, 2.07]}
|
annotations_1/-U9v7Nz6hOs_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[0.0, 1.0], [9.0, 10.74], [12.0, 12.11], [13.0, 14.52], [17.0, 23.11], [34.0, 55.49], [56.0, 64.27], [65.0, 67.34], [69.0, 68.91], [70.0, 70.88], [72.0, 85.77], [90.0, 89.95], [91.0, 91.0], [93.0, 98.34], [105.0, 120.36], [125.0, 126.33], [128.0, 134.54], [140.0, 140.73], [155.0, 155.34]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.42, 28.95, 29.06, 29.26, 0.0, 0.0, 29.05, 0.0, 0.0, 30.22, 30.86, 0.0, 31.8, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 63.5], ["quack", 6.9], ["livestock, farm animals, working animals", 2.75]], [["music", 53.48], ["speech", 18.34], ["electronic music", 10.32]], [["music", 12.99], ["vehicle", 11.55], ["whale vocalization", 8.26]], [["boing", 37.71], ["moo", 26.01], ["cattle, bovinae", 22.73]], null, null, [["music", 24.18], ["speech", 15.5], ["whip", 11.98]], null, null, [["speech", 60.38], ["hum", 12.69], ["music", 5.85]], [["music", 22.26], ["hum", 18.96], ["throbbing", 14.4]], null, [["music", 69.37], ["theremin", 10.04], ["musical instrument", 4.35]], null, null], "duration": [1.0, 1.74, 0.11, 1.52, 6.11, 21.49, 8.27, 2.34, -0.09, 0.88, 13.77, -0.05, 0.0, 5.34, 15.36, 1.33, 6.54, 0.73, 0.34]}
|
annotations_1/-VnQ_KpOBm4_filtered.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"non_speech_segments": [[3.0, 3.13], [4.0, 6.37], [13.0, 13.83], [17.0, 18.18], [19.0, 19.92], [27.0, 27.75], [29.0, 30.13], [34.0, 34.05], [35.0, 35.58], [41.0, 42.55], [46.0, 46.6], [49.0, 50.14], [51.0, 51.14], [52.0, 52.86], [54.0, 55.53], [57.0, 57.16], [62.0, 62.06], [63.0, 64.45], [66.0, 66.7], [69.0, 69.74], [72.0, 72.62], [76.0, 76.57], [79.0, 80.2], [82.0, 84.45], [88.0, 88.94], [91.0, 91.25], [92.0, 92.21], [94.0, 94.34], [96.0, 96.82], [100.0, 100.18], [103.0, 103.4], [106.0, 106.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 47.03], ["musical instrument", 13.94], ["guitar", 13.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 38.35], ["speech", 8.29], ["musical instrument", 4.71]], null, null, null, null, null, null, null, null], "duration": [0.13, 2.37, 0.83, 1.18, 0.92, 0.75, 1.13, 0.05, 0.58, 1.55, 0.6, 1.14, 0.14, 0.86, 1.53, 0.16, 0.06, 1.45, 0.7, 0.74, 0.62, 0.57, 1.2, 2.45, 0.94, 0.25, 0.21, 0.34, 0.82, 0.18, 0.4, 0.76]}
|