diff --git a/annotations_filtered/--ABd2SeIGE_filtered.json b/annotations_filtered/--ABd2SeIGE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cfd6a9a878edcc2ca6d7b9beeb40ae13edd76ae3 --- /dev/null +++ b/annotations_filtered/--ABd2SeIGE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.75], [15.0, 23.94], [27.0, 37.12], [48.0, 47.83], [51.0, 51.43], [60.0, 60.0], [62.0, 69.42], [86.0, 86.32], [93.0, 96.79], [98.0, 98.36], [99.0, 99.6], [100.0, 102.39], [106.0, 113.46]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [31.94, 30.17, 46.33, 0.0, 0.0, 0.0, 68.15, 0.0, 61.97, 0.0, 0.0, 38.33, 39.55], "audiomae_on_audioset": [[["theremin", 29.79], ["music", 28.67], ["hum", 7.9]], [["speech", 57.27], ["explosion", 14.36], ["burst, pop", 7.06]], [["music", 62.43], ["theremin", 8.26], ["cello", 4.68]], null, null, null, null, null, null, null, null, [["music", 21.78], ["musical instrument", 6.05], ["didgeridoo", 5.51]], [["music", 76.58], ["musical instrument", 3.22], ["theremin", 2.27]]], "duration": [4.75, 8.94, 10.12, -0.17, 0.43, 0.0, 7.42, 0.32, 3.79, 0.36, 0.6, 2.39, 7.46]} \ No newline at end of file diff --git a/annotations_filtered/--Jiv5iYqT8_filtered.json b/annotations_filtered/--Jiv5iYqT8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb566ba2d8bf593054ae5517d8135aff584a2401 --- /dev/null +++ b/annotations_filtered/--Jiv5iYqT8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.14], [7.0, 8.21], [9.0, 12.63], [13.0, 15.26], [17.0, 19.16], [20.0, 23.95], [25.0, 30.32], [31.0, 41.57], [43.0, 54.11], [55.0, 58.31], [59.0, 61.94], [64.0, 99.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.52, 0.0, 100.0, 100.0, 100.0, 100.0, 99.93, 99.95, 99.98, 77.53, 81.17, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.14, 1.21, 3.63, 2.26, 2.16, 3.95, 5.32, 10.57, 11.11, 3.31, 2.94, 35.55]} \ No newline at end of file diff --git a/annotations_filtered/--QCZKgJt6o_filtered.json b/annotations_filtered/--QCZKgJt6o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eda0024e4d05408c81e5065bd4807b883aae16d6 --- /dev/null +++ b/annotations_filtered/--QCZKgJt6o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.3], [5.0, 6.37], [7.0, 9.76], [14.0, 16.93], [30.0, 31.36], [33.0, 33.54], [35.0, 35.72], [40.0, 46.94], [51.0, 50.68], [52.0, 61.47], [67.0, 69.9], [77.0, 77.35], [107.0, 108.08], [117.0, 117.19], [117.0, 118.18], [127.0, 128.22], [133.0, 134.74], [136.0, 136.24], [140.0, 142.8], [146.0, 149.35], [151.0, 151.31], [152.0, 153.35], [156.0, 156.61], [157.0, 159.6], [164.0, 165.43], [174.0, 175.02]], "keep_status": [false, false, false, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 60.89, 45.59, 0.0, 0.0, 0.0, 35.85, 0.0, 34.71, 61.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.78, 47.2, 0.0, 0.0, 0.0, 39.47, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 26.24], ["vocal music", 7.63], ["singing", 6.21]], null, null, null, [["speech", 18.36], ["moo", 9.75], ["livestock, farm animals, working animals", 8.42]], null, [["chant", 14.05], ["cattle, bovinae", 12.42], ["grunt", 10.88]], null, null, null, null, null, null, null, null, null, [["speech", 49.28], ["hum", 8.71], ["music", 5.69]], null, null, null, [["speech", 31.98], ["music", 6.36], ["hum", 5.44]], null, null], "duration": [1.3, 1.37, 2.76, 2.93, 1.36, 0.54, 0.72, 6.94, -0.32, 9.47, 2.9, 0.35, 1.08, 0.19, 1.18, 1.22, 1.74, 0.24, 2.8, 3.35, 0.31, 1.35, 0.61, 2.6, 1.43, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/--aqjaJyZLk_filtered.json b/annotations_filtered/--aqjaJyZLk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fef66f9888c21a51b1ab6ac7b8aeae14a9984fe --- /dev/null +++ b/annotations_filtered/--aqjaJyZLk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 15.62], [19.0, 22.18], [24.0, 25.74], [26.0, 26.6], [29.0, 33.02], [41.0, 42.13], [46.0, 46.55], [47.0, 48.63], [50.0, 51.17], [54.0, 55.27], [56.0, 57.32], [58.0, 59.81], [63.0, 63.49], [69.0, 69.21], [70.0, 72.59], [75.0, 75.64], [77.0, 78.58], [81.0, 81.77], [83.0, 83.69], [85.0, 85.83], [87.0, 88.38], [89.0, 90.8], [91.0, 91.88], [92.0, 92.64], [95.0, 97.17], [98.0, 106.57], [108.0, 109.51], [110.0, 111.52], [112.0, 115.32], [118.0, 120.87]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [52.27, 54.97, 0.0, 0.0, 49.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.55, 37.26, 0.0, 0.0, 31.3, 58.72], "audiomae_on_audioset": [null, null, null, null, [["noise", 17.53], ["hum", 14.74], ["music", 12.08]], null, null, null, null, null, null, null, null, null, [["music", 42.85], ["speech", 9.51], ["hum", 6.87]], null, null, null, null, null, null, null, null, null, [["tuning fork", 85.18], ["coin (dropping)", 2.94], ["gong", 2.22]], [["music", 39.36], ["mechanisms", 7.52], ["hum", 6.54]], null, null, [["music", 14.77], ["clang", 10.79], ["fly, housefly", 8.68]], null], "duration": [7.62, 3.18, 1.74, 0.6, 4.02, 1.13, 0.55, 1.63, 1.17, 1.27, 1.32, 1.81, 0.49, 0.21, 2.59, 0.64, 1.58, 0.77, 0.69, 0.83, 1.38, 1.8, 0.88, 0.64, 2.17, 8.57, 1.51, 1.52, 3.32, 2.87]} \ No newline at end of file diff --git a/annotations_filtered/--hendERqm0_filtered.json b/annotations_filtered/--hendERqm0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0669cccee3e71d295a6ed82416912baafbbf25a --- /dev/null +++ b/annotations_filtered/--hendERqm0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.56], [14.0, 14.22], [16.0, 21.17], [28.0, 28.76], [32.0, 32.95], [34.0, 34.42], [36.0, 36.15], [38.0, 38.06], [40.0, 40.63], [41.0, 51.34], [53.0, 56.84], [58.0, 59.12], [61.0, 62.31], [66.0, 67.93], [70.0, 71.29], [74.0, 74.75], [77.0, 78.38], [82.0, 84.72]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 30.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.77, 31.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.95], "audiomae_on_audioset": [null, null, [["music", 67.55], ["electronic music", 5.78], ["house music", 4.08]], null, null, null, null, null, null, [["music", 45.64], ["speech", 12.16], ["techno", 9.56]], [["music", 51.69], ["speech", 33.92], ["drum machine", 1.58]], null, null, null, null, null, null, [["music", 30.48], ["sonar", 30.27], ["electronic music", 9.0]]], "duration": [0.56, 0.22, 5.17, 0.76, 0.95, 0.42, 0.15, 0.06, 0.63, 10.34, 3.84, 1.12, 1.31, 1.93, 1.29, 0.75, 1.38, 2.72]} \ No newline at end of file diff --git a/annotations_filtered/--oCWVOBuvA_filtered.json b/annotations_filtered/--oCWVOBuvA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70582ee9764aba4fc5659eedfce78ae528b5019d --- /dev/null +++ b/annotations_filtered/--oCWVOBuvA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.42], [4.0, 5.46], [7.0, 7.35], [9.0, 12.02], [13.0, 14.1], [16.0, 17.66], [20.0, 21.22], [24.0, 26.03], [27.0, 28.41], [32.0, 32.81], [36.0, 36.37], [38.0, 38.4], [41.0, 47.61], [49.0, 51.41], [55.0, 56.3], [58.0, 58.21], [60.0, 64.56], [66.0, 66.36], [67.0, 68.35], [70.0, 72.81], [74.0, 75.02], [77.0, 78.65], [80.0, 81.68], [83.0, 83.17], [84.0, 87.4], [88.0, 92.03], [94.0, 95.12], [98.0, 99.33], [102.0, 101.78], [103.0, 105.87], [106.0, 106.83], [109.0, 109.81], [112.0, 113.04], [118.0, 119.72], [121.0, 121.34], [126.0, 126.22], [129.0, 129.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.99, 100.0, 0.0, 0.0, 94.95, 0.0, 0.0, 67.13, 0.0, 0.0, 0.0, 0.0, 100.0, 99.98, 0.0, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 1.46, 0.35, 3.02, 1.1, 1.66, 1.22, 2.03, 1.41, 0.81, 0.37, 0.4, 6.61, 2.41, 1.3, 0.21, 4.56, 0.36, 1.35, 2.81, 1.02, 1.65, 1.68, 0.17, 3.4, 4.03, 1.12, 1.33, -0.22, 2.87, 0.83, 0.81, 1.04, 1.72, 0.34, 0.22, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/--uyzf7X_0c_filtered.json b/annotations_filtered/--uyzf7X_0c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7c361ce4257ec00aa89d4a7bfbf7afecc381366 --- /dev/null +++ b/annotations_filtered/--uyzf7X_0c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.45], [5.0, 5.07], [8.0, 8.16], [13.0, 12.78], [20.0, 20.21], [24.0, 24.07], [26.0, 26.52], [35.0, 35.53], [40.0, 40.29], [48.0, 48.36], [51.0, 51.54], [54.0, 54.72], [70.0, 69.72], [71.0, 71.68], [74.0, 74.43], [77.0, 76.92], [78.0, 78.51], [82.0, 82.24], [83.0, 83.03], [85.0, 85.31], [88.0, 88.8], [90.0, 90.86], [95.0, 95.47], [100.0, 100.31], [105.0, 105.33], [107.0, 107.01], [111.0, 111.92], [115.0, 115.06], [115.0, 115.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 0.07, 0.16, -0.22, 0.21, 0.07, 0.52, 0.53, 0.29, 0.36, 0.54, 0.72, -0.28, 0.68, 0.43, -0.08, 0.51, 0.24, 0.03, 0.31, 0.8, 0.86, 0.47, 0.31, 0.33, 0.01, 0.92, 0.06, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/--vFXH3mH3A_filtered.json b/annotations_filtered/--vFXH3mH3A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f22b8d376e581b4092ecc95955e2e2a9b86be8d --- /dev/null +++ b/annotations_filtered/--vFXH3mH3A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 16.01], [18.0, 36.73], [38.0, 41.69], [49.0, 51.97], [58.0, 59.56], [61.0, 65.1], [74.0, 82.44], [83.0, 89.94], [90.0, 90.98], [96.0, 98.64], [103.0, 103.92], [108.0, 107.97], [108.0, 109.88], [112.0, 114.1], [118.0, 130.54], [132.0, 133.14], [134.0, 144.76], [147.0, 160.37], [161.0, 166.53], [168.0, 167.9], [170.0, 170.83], [173.0, 172.84]], "keep_status": [true, true, true, false, false, false, true, false, false, true, false, false, false, true, true, false, false, false, true, false, false, false], "silence_prob": [28.92, 29.82, 29.42, 29.02, 0.0, 30.59, 29.01, 29.08, 0.0, 29.77, 0.0, 0.0, 0.0, 28.94, 29.1, 0.0, 29.24, 28.93, 30.87, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["whack, thwack", 11.06], ["mosquito", 7.33], ["speech", 6.95]], [["rumble", 29.07], ["hum", 13.01], ["mains hum", 12.77]], [["speech", 17.98], ["whale vocalization", 16.64], ["groan", 16.12]], [["music", 63.1], ["speech", 7.17], ["electronic music", 1.88]], null, [["didgeridoo", 33.1], ["speech", 24.81], ["music", 22.07]], [["music", 52.24], ["vehicle", 9.53], ["motorcycle", 2.87]], [["music", 50.65], ["cattle, bovinae", 18.06], ["moo", 9.87]], null, [["music", 25.05], ["cattle, bovinae", 23.46], ["moo", 18.88]], null, null, null, [["groan", 43.37], ["music", 6.03], ["grunt", 5.74]], [["music", 39.13], ["speech", 20.56], ["electronic music", 6.22]], null, [["music", 83.89], ["electronic music", 3.05], ["techno", 1.93]], [["music", 79.27], ["hum", 3.27], ["throbbing", 2.72]], [["fly, housefly", 28.0], ["explosion", 24.83], ["boom", 9.83]], null, null, null], "duration": [7.01, 18.73, 3.69, 2.97, 1.56, 4.1, 8.44, 6.94, 0.98, 2.64, 0.92, -0.03, 1.88, 2.1, 12.54, 1.14, 10.76, 13.37, 5.53, -0.1, 0.83, -0.16]} \ No newline at end of file diff --git a/annotations_filtered/-0SHIbuEO3w_filtered.json b/annotations_filtered/-0SHIbuEO3w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ca78185f0eca138fe939cf67a75296c5456a9f6 --- /dev/null +++ b/annotations_filtered/-0SHIbuEO3w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[56.0, 60.72], [63.0, 122.66], [127.0, 131.94]], "keep_status": [false, false, true], "silence_prob": [29.36, 0.0, 30.22], "audiomae_on_audioset": [[["music", 65.38], ["speech", 7.81], ["throbbing", 3.28]], null, [["speech", 22.67], ["music", 22.28], ["crowd", 5.83]]], "duration": [4.72, 59.66, 4.94]} \ No newline at end of file diff --git a/annotations_filtered/-0f67QE-HP8_filtered.json b/annotations_filtered/-0f67QE-HP8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a4e03c8e60fcd573957293843984d9b0fcc48d3 --- /dev/null +++ b/annotations_filtered/-0f67QE-HP8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.85], [2.0, 3.06], [4.0, 7.08], [9.0, 35.92], [38.0, 41.82], [44.0, 45.98], [48.0, 57.75], [58.0, 57.86], [58.0, 93.53], [98.0, 105.11], [110.0, 113.12], [114.0, 115.65], [118.0, 121.74], [132.0, 139.5], [143.0, 142.79], [143.0, 143.9], [148.0, 148.56], [152.0, 157.91], [160.0, 159.92], [161.0, 164.03], [169.0, 169.53], [171.0, 172.02], [181.0, 182.46]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.97, 30.71, 34.35, 0.0, 32.99, 0.0, 0.0, 29.01, 30.45, 0.0, 29.66, 30.04, 0.0, 0.0, 0.0, 31.53, 0.0, 30.6, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 72.72], ["music", 8.61], ["sidetone", 2.77]], [["music", 57.26], ["throbbing", 8.84], ["hum", 6.68]], null, [["whale vocalization", 88.55], ["music", 6.54], ["musical instrument", 0.81]], null, null, [["speech", 24.98], ["music", 16.76], ["whack, thwack", 8.37]], [["whale vocalization", 77.84], ["mosquito", 3.38], ["moo", 2.41]], null, [["explosion", 30.95], ["burst, pop", 13.91], ["speech", 9.44]], [["speech", 27.71], ["music", 15.41], ["cattle, bovinae", 6.74]], null, null, null, [["music", 32.22], ["electronic music", 12.21], ["dubstep", 7.19]], null, [["speech", 74.27], ["sound effect", 3.57], ["fart", 2.7]], null, null, null], "duration": [0.85, 1.06, 3.08, 26.92, 3.82, 1.98, 9.75, -0.14, 35.53, 7.11, 3.12, 1.65, 3.74, 7.5, -0.21, 0.9, 0.56, 5.91, -0.08, 3.03, 0.53, 1.02, 1.46]} \ No newline at end of file diff --git a/annotations_filtered/-19d_T472co_filtered.json b/annotations_filtered/-19d_T472co_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0437989b42eed3a8bcff6d44e94bbfb2b34a546f --- /dev/null +++ b/annotations_filtered/-19d_T472co_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 47.21], [48.0, 48.57], [53.0, 53.25], [53.0, 166.8], [167.0, 167.7], [168.0, 173.04], [175.0, 177.45], [180.0, 201.29], [205.0, 205.17], [206.0, 212.75]], "keep_status": [false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 70.58, 31.68, 35.71, 0.0, 74.76], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 76.85], ["speech", 5.82], ["boing", 1.78]], [["music", 32.21], ["fly, housefly", 10.63], ["buzz", 6.42]], null, null], "duration": [46.21, 0.57, 0.25, 113.8, 0.7, 5.04, 2.45, 21.29, 0.17, 6.75]} \ No newline at end of file diff --git a/annotations_filtered/-1U0LH6dPfw_filtered.json b/annotations_filtered/-1U0LH6dPfw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16d589653c6457b53773ae82ea14a418f64ce4ab --- /dev/null +++ b/annotations_filtered/-1U0LH6dPfw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.61], [3.0, 3.11], [3.0, 4.31], [13.0, 14.22], [22.0, 24.88], [26.0, 31.73], [35.0, 38.31], [39.0, 42.03], [46.0, 56.1], [61.0, 85.5], [98.0, 98.49], [100.0, 107.32], [108.0, 108.38], [120.0, 120.63]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.28, 30.67, 30.45, 30.48, 30.16, 30.01, 0.0, 33.86, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 61.12], ["didgeridoo", 4.8], ["sidetone", 4.55]], [["music", 62.74], ["hum", 9.5], ["throbbing", 5.24]], [["music", 45.36], ["speech", 19.03], ["boing", 5.23]], [["music", 53.7], ["boing", 15.98], ["fly, housefly", 3.21]], [["music", 60.24], ["speech", 11.81], ["boing", 9.62]], [["music", 68.45], ["boing", 10.58], ["speech", 6.01]], null, [["music", 42.75], ["speech", 18.11], ["mains hum", 12.3]], null, null], "duration": [0.61, 0.11, 1.31, 1.22, 2.88, 5.73, 3.31, 3.03, 10.1, 24.5, 0.49, 7.32, 0.38, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/-1W4xHNKvAk_filtered.json b/annotations_filtered/-1W4xHNKvAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9467dc1ee84c624e60243480b10c88ba9a32fa2 --- /dev/null +++ b/annotations_filtered/-1W4xHNKvAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.62], [16.0, 17.51], [35.0, 35.06], [36.0, 36.69], [50.0, 51.21], [52.0, 53.15], [73.0, 74.11], [85.0, 86.86], [100.0, 101.07], [102.0, 103.08], [114.0, 115.01], [117.0, 117.29], [120.0, 120.75], [135.0, 134.97], [150.0, 150.13], [208.0, 208.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 1.51, 0.06, 0.69, 1.21, 1.15, 1.11, 1.86, 1.07, 1.08, 1.01, 0.29, 0.75, -0.03, 0.13, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/-1eKufUP5XQ_filtered.json b/annotations_filtered/-1eKufUP5XQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..603231b058b6f3ec8a1bba77d02a1e2ab295603a --- /dev/null +++ b/annotations_filtered/-1eKufUP5XQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.29], [11.0, 15.52], [20.0, 20.07], [24.0, 24.58], [40.0, 41.15], [44.0, 49.44], [50.0, 51.68], [53.0, 59.09], [64.0, 64.49], [65.0, 65.69], [66.0, 68.1], [79.0, 79.39], [80.0, 80.59], [83.0, 84.33], [89.0, 89.85], [91.0, 97.97], [99.0, 99.39], [100.0, 99.98], [100.0, 102.0], [104.0, 104.41], [105.0, 105.73], [106.0, 106.74], [107.0, 107.97], [110.0, 111.35], [112.0, 113.56], [114.0, 115.64], [116.0, 118.37], [119.0, 123.13]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.9, 0.0, 0.0, 0.0, 90.25, 0.0, 89.72, 0.0, 0.0, 66.51, 0.0, 0.0, 0.0, 0.0, 77.2, 0.0, 0.0, 81.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.92, 94.66], "audiomae_on_audioset": [null, [["speech", 27.69], ["whack, thwack", 9.37], ["busy signal", 8.67]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 4.52, 0.07, 0.58, 1.15, 5.44, 1.68, 6.09, 0.49, 0.69, 2.1, 0.39, 0.59, 1.33, 0.85, 6.97, 0.39, -0.02, 2.0, 0.41, 0.73, 0.74, 0.97, 1.35, 1.56, 1.64, 2.37, 4.13]} \ No newline at end of file diff --git a/annotations_filtered/-1gCG8m1SHU_filtered.json b/annotations_filtered/-1gCG8m1SHU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e0dd7621ae07b9d35d61f864c14f726df30cbaa --- /dev/null +++ b/annotations_filtered/-1gCG8m1SHU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 21.51], [23.0, 29.44], [31.0, 32.14], [38.0, 40.2], [43.0, 44.31], [47.0, 46.79], [48.0, 50.19], [54.0, 53.77], [59.0, 59.85], [61.0, 61.05], [62.0, 63.46], [64.0, 64.57], [66.0, 66.75], [70.0, 70.95], [72.0, 73.08], [74.0, 74.8], [77.0, 77.3], [78.0, 79.47], [83.0, 84.65], [85.0, 96.15], [99.0, 113.75], [115.0, 123.8], [125.0, 126.12]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [40.95, 98.73, 0.0, 99.73, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.99, 31.55, 54.63, 0.0], "audiomae_on_audioset": [[["music", 35.95], ["hum", 13.7], ["noise", 5.28]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.38], ["theremin", 8.86], ["hum", 4.46]], [["music", 47.45], ["hum", 18.65], ["throbbing", 9.19]], null, null], "duration": [17.51, 6.44, 1.14, 2.2, 1.31, -0.21, 2.19, -0.23, 0.85, 0.05, 1.46, 0.57, 0.75, 0.95, 1.08, 0.8, 0.3, 1.47, 1.65, 11.15, 14.75, 8.8, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/-1zLU5N6uBU_filtered.json b/annotations_filtered/-1zLU5N6uBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/-1zLU5N6uBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/-2KG4lLGEl0_filtered.json b/annotations_filtered/-2KG4lLGEl0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a192524a4650c9672d503b8d0142c2a17d6edce2 --- /dev/null +++ b/annotations_filtered/-2KG4lLGEl0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.27], [14.0, 15.26], [21.0, 21.66], [27.0, 27.48], [31.0, 32.09], [34.0, 34.03], [34.0, 34.96], [36.0, 36.54], [38.0, 39.01], [41.0, 42.52], [43.0, 43.6], [46.0, 46.41], [47.0, 49.2], [51.0, 51.33], [54.0, 55.85], [57.0, 58.55], [68.0, 68.88], [79.0, 79.73], [80.0, 80.94], [84.0, 84.54], [87.0, 87.52], [89.0, 90.24], [101.0, 101.85], [105.0, 105.51], [109.0, 109.65], [111.0, 112.77], [116.0, 116.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.27, 1.26, 0.66, 0.48, 1.09, 0.03, 0.96, 0.54, 1.01, 1.52, 0.6, 0.41, 2.2, 0.33, 1.85, 1.55, 0.88, 0.73, 0.94, 0.54, 0.52, 1.24, 0.85, 0.51, 0.65, 1.77, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/-2KGPYEFnsU_filtered.json b/annotations_filtered/-2KGPYEFnsU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bc5f9d2288921cfa708683de7b5429a18c6efc1 --- /dev/null +++ b/annotations_filtered/-2KGPYEFnsU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.39], [15.0, 16.73], [17.0, 17.9], [19.0, 20.11], [24.0, 24.53], [25.0, 25.76], [29.0, 33.12], [38.0, 39.55], [41.0, 43.04], [44.0, 44.71], [46.0, 47.39], [50.0, 50.03], [52.0, 53.38], [55.0, 56.1], [59.0, 60.71], [66.0, 66.9], [73.0, 73.94], [78.0, 78.9], [81.0, 80.79], [110.0, 110.1], [116.0, 117.9], [120.0, 119.8], [125.0, 127.04], [129.0, 129.41], [132.0, 132.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.63, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.39, 1.73, 0.9, 1.11, 0.53, 0.76, 4.12, 1.55, 2.04, 0.71, 1.39, 0.03, 1.38, 1.1, 1.71, 0.9, 0.94, 0.9, -0.21, 0.1, 1.9, -0.2, 2.04, 0.41, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/-2QFIXEHnOY_filtered.json b/annotations_filtered/-2QFIXEHnOY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea4b135d467c6ccda9f2a044d3826870c6124d67 --- /dev/null +++ b/annotations_filtered/-2QFIXEHnOY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 16.11], [19.0, 22.35], [24.0, 31.28], [33.0, 33.39], [34.0, 58.75], [59.0, 68.89]], "keep_status": [true, true, true, false, true, true], "silence_prob": [29.59, 29.9, 28.84, 0.0, 29.2, 29.4], "audiomae_on_audioset": [[["music", 34.03], ["buzz", 18.87], ["hum", 9.34]], [["hum", 17.0], ["mains hum", 12.84], ["throbbing", 7.47]], [["fly, housefly", 16.88], ["buzz", 13.34], ["mosquito", 12.24]], null, [["buzz", 13.81], ["hum", 12.07], ["electric shaver, electric razor", 6.64]], [["hum", 22.83], ["mains hum", 10.69], ["fly, housefly", 8.24]]], "duration": [10.11, 3.35, 7.28, 0.39, 24.75, 9.89]} \ No newline at end of file diff --git a/annotations_filtered/-37Mhsak-XI_filtered.json b/annotations_filtered/-37Mhsak-XI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..825f02856c3bd93fc5abae58789e7652f523355a --- /dev/null +++ b/annotations_filtered/-37Mhsak-XI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 44.73], [48.0, 65.79], [68.0, 86.9], [88.0, 96.03], [97.0, 119.35], [120.0, 123.89], [125.0, 127.58]], "keep_status": [false, false, false, false, true, false, true], "silence_prob": [0.0, 31.97, 35.22, 58.05, 45.75, 58.98, 46.79], "audiomae_on_audioset": [null, [["music", 75.5], ["theremin", 5.06], ["scary music", 3.28]], [["music", 40.89], ["speech", 25.7], ["boing", 12.51]], null, [["music", 36.75], ["guitar", 18.42], ["plucked string instrument", 8.13]], null, [["music", 51.17], ["boing", 10.19], ["didgeridoo", 3.32]]], "duration": [0.73, 17.79, 18.9, 8.03, 22.35, 3.89, 2.58]} \ No newline at end of file diff --git a/annotations_filtered/-3KCgSpt3hU_filtered.json b/annotations_filtered/-3KCgSpt3hU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b7b6a230d1c70b0fcfa7b0a432562f47b648446 --- /dev/null +++ b/annotations_filtered/-3KCgSpt3hU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.26], [2.0, 3.81], [7.0, 6.88], [11.0, 10.98], [14.0, 16.56], [21.0, 21.47], [28.0, 28.24], [31.0, 32.36], [36.0, 37.34], [39.0, 40.07], [44.0, 46.47], [48.0, 48.44], [53.0, 54.99], [56.0, 56.88], [57.0, 58.53], [66.0, 68.28], [71.0, 72.1], [73.0, 73.55], [74.0, 78.63], [81.0, 81.43], [83.0, 84.79], [86.0, 86.05], [90.0, 91.77], [95.0, 95.66], [99.0, 100.94], [102.0, 103.57], [105.0, 105.85], [107.0, 108.28], [111.0, 112.83], [114.0, 119.4], [120.0, 121.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 95.91, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.26, 1.81, -0.12, -0.02, 2.56, 0.47, 0.24, 1.36, 1.34, 1.07, 2.47, 0.44, 1.99, 0.88, 1.53, 2.28, 1.1, 0.55, 4.63, 0.43, 1.79, 0.05, 1.77, 0.66, 1.94, 1.57, 0.85, 1.28, 1.83, 5.4, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/-3RMOO6mHr4_filtered.json b/annotations_filtered/-3RMOO6mHr4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8aae4e9a3a3ae01a1da02e740085ed00b6a2ee --- /dev/null +++ b/annotations_filtered/-3RMOO6mHr4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 32.24], [33.0, 32.98], [38.0, 37.61], [39.0, 39.99], [47.0, 49.03], [49.0, 49.08], [78.0, 81.3], [89.0, 90.56], [99.0, 113.17]], "keep_status": [false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 42.33, 0.0, 30.81, 0.0, 30.68], "audiomae_on_audioset": [null, null, null, null, [["livestock, farm animals, working animals", 36.74], ["moo", 21.51], ["cattle, bovinae", 13.9]], null, [["music", 20.01], ["moo", 13.1], ["speech", 11.05]], null, [["music", 72.64], ["electronic music", 5.15], ["techno", 3.8]]], "duration": [0.24, -0.02, -0.39, 0.99, 2.03, 0.08, 3.3, 1.56, 14.17]} \ No newline at end of file diff --git a/annotations_filtered/-3mo5CqjvWs_filtered.json b/annotations_filtered/-3mo5CqjvWs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2f9f2ae638168dbea15d520823e89a73073ecb9 --- /dev/null +++ b/annotations_filtered/-3mo5CqjvWs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.22], [7.0, 6.89], [9.0, 8.85], [25.0, 25.24], [28.0, 27.68], [31.0, 31.48]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.22, -0.11, -0.15, 0.24, -0.32, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/-3ywc_7_IE8_filtered.json b/annotations_filtered/-3ywc_7_IE8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba7751024ef89f0bcf6f5e6f04edc8cc90c2a43d --- /dev/null +++ b/annotations_filtered/-3ywc_7_IE8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.68], [19.0, 37.59], [41.0, 41.98], [49.0, 63.66], [67.0, 114.02], [115.0, 123.55], [126.0, 126.84], [134.0, 134.45], [136.0, 137.25], [139.0, 138.96], [144.0, 144.83], [145.0, 145.47], [156.0, 156.44], [157.0, 157.18], [158.0, 158.57], [160.0, 161.0], [168.0, 168.49], [171.0, 173.43], [174.0, 176.01]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.31, 31.05, 0.0, 31.15, 0.0, 32.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.04, 99.9], "audiomae_on_audioset": [[["cacophony", 9.36], ["fly, housefly", 5.02], ["cheering", 4.37]], [["fly, housefly", 54.14], ["insect", 15.95], ["bee, wasp, etc.", 11.82]], null, [["bee, wasp, etc.", 42.33], ["fly, housefly", 26.81], ["insect", 13.73]], null, [["speech", 21.02], ["whack, thwack", 12.44], ["livestock, farm animals, working animals", 5.97]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.68, 18.59, 0.98, 14.66, 47.02, 8.55, 0.84, 0.45, 1.25, -0.04, 0.83, 0.47, 0.44, 0.18, 0.57, 1.0, 0.49, 2.43, 2.01]} \ No newline at end of file diff --git a/annotations_filtered/-4GsCEopbd4_filtered.json b/annotations_filtered/-4GsCEopbd4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a774e8bd703c485f4fe3eed127d9a614c58a7f0f --- /dev/null +++ b/annotations_filtered/-4GsCEopbd4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 52.84], [53.0, 63.14], [64.0, 81.58], [83.0, 94.9], [97.0, 100.3], [102.0, 103.0], [104.0, 106.0], [107.0, 108.97], [110.0, 120.66], [123.0, 130.13], [132.0, 133.24], [137.0, 137.56], [139.0, 139.11], [139.0, 143.53], [144.0, 171.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [69.47, 98.51, 99.96, 100.0, 99.16, 0.0, 99.87, 0.0, 37.81, 35.33, 0.0, 0.0, 0.0, 32.88, 30.79], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 57.7], ["music", 12.4], ["theremin", 8.34]], [["speech", 61.66], ["explosion", 7.3], ["firecracker", 6.96]], null, null, null, [["speech", 42.44], ["fart", 13.31], ["explosion", 10.21]], [["speech", 52.19], ["fly, housefly", 9.28], ["music", 8.03]]], "duration": [20.84, 10.14, 17.58, 11.9, 3.3, 1.0, 2.0, 1.97, 10.66, 7.13, 1.24, 0.56, 0.11, 4.53, 27.59]} \ No newline at end of file diff --git a/annotations_filtered/-4Q-MS_oFkw_filtered.json b/annotations_filtered/-4Q-MS_oFkw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..174beb556966243d497df8d54c4afff64406d762 --- /dev/null +++ b/annotations_filtered/-4Q-MS_oFkw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.03], [13.0, 13.14], [16.0, 19.82], [24.0, 24.0], [24.0, 25.22], [28.0, 31.28], [33.0, 45.86], [48.0, 50.08], [53.0, 54.19], [57.0, 67.07], [72.0, 72.99], [73.0, 86.34], [99.0, 113.97], [118.0, 125.14]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 93.6, 0.0, 0.0, 51.88, 43.56, 93.76, 0.0, 81.0, 0.0, 48.31, 42.06, 33.06], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 38.94], ["synthesizer", 14.42], ["theremin", 3.43]], null, null, null, null, [["music", 47.22], ["speech", 21.31], ["theremin", 7.97]], [["music", 46.21], ["theremin", 24.05], ["synthesizer", 4.34]], [["music", 29.76], ["foghorn", 27.27], ["brass instrument", 3.53]]], "duration": [0.03, 0.14, 3.82, 0.0, 1.22, 3.28, 12.86, 2.08, 1.19, 10.07, 0.99, 13.34, 14.97, 7.14]} \ No newline at end of file diff --git a/annotations_filtered/-4QqksHXUCc_filtered.json b/annotations_filtered/-4QqksHXUCc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8593888cac01b1ba902c37d433c4154cf580def --- /dev/null +++ b/annotations_filtered/-4QqksHXUCc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.91], [8.0, 13.36], [19.0, 20.43], [22.0, 24.17], [27.0, 27.38], [43.0, 46.65], [52.0, 57.62], [58.0, 61.52], [66.0, 68.44], [72.0, 72.52], [76.0, 77.55], [90.0, 89.78], [99.0, 100.2], [107.0, 107.87], [119.0, 119.97], [121.0, 122.76], [123.0, 125.02]], "keep_status": [false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 34.59, 0.0, 36.53, 0.0, 32.91, 37.86, 36.06, 34.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.59], "audiomae_on_audioset": [null, [["music", 55.86], ["throbbing", 11.97], ["electronic music", 4.41]], null, [["hum", 30.96], ["throbbing", 30.29], ["music", 20.06]], null, [["music", 59.22], ["hum", 9.81], ["throbbing", 5.74]], [["music", 60.68], ["didgeridoo", 4.99], ["moo", 3.55]], [["music", 35.65], ["speech", 24.35], ["hum", 4.25]], [["fly, housefly", 22.19], ["music", 18.42], ["insect", 14.12]], null, null, null, null, null, null, null, [["music", 23.99], ["boing", 15.45], ["didgeridoo", 13.58]]], "duration": [0.91, 5.36, 1.43, 2.17, 0.38, 3.65, 5.62, 3.52, 2.44, 0.52, 1.55, -0.22, 1.2, 0.87, 0.97, 1.76, 2.02]} \ No newline at end of file diff --git a/annotations_filtered/-4_rMqeyOJY_filtered.json b/annotations_filtered/-4_rMqeyOJY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e99eee6900b51dda247f6c7a9e5bcb29e17e7405 --- /dev/null +++ b/annotations_filtered/-4_rMqeyOJY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.99], [7.0, 13.02], [14.0, 14.57], [15.0, 16.07], [17.0, 18.4], [19.0, 20.65], [24.0, 28.92], [31.0, 32.14], [33.0, 35.72], [36.0, 37.72], [45.0, 46.35], [51.0, 51.63], [55.0, 55.59], [60.0, 60.86], [63.0, 63.73], [64.0, 64.4], [68.0, 69.03], [78.0, 79.19], [80.0, 85.9], [88.0, 89.72], [92.0, 93.21], [95.0, 107.42], [109.0, 113.54], [114.0, 121.71], [123.0, 124.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 99.84, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0, 68.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 45.72, 37.88, 43.71, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 67.89], ["frog", 5.36], ["insect", 3.47]], [["speech", 27.14], ["dial tone", 23.51], ["busy signal", 6.93]], [["speech", 51.05], ["throat clearing", 5.81], ["noise", 4.84]], null], "duration": [0.99, 6.02, 0.57, 1.07, 1.4, 1.65, 4.92, 1.14, 2.72, 1.72, 1.35, 0.63, 0.59, 0.86, 0.73, 0.4, 1.03, 1.19, 5.9, 1.72, 1.21, 12.42, 4.54, 7.71, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/-5798-VRVYA_filtered.json b/annotations_filtered/-5798-VRVYA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56f85f8de904f5593b49aacf2bf0b6db133a1312 --- /dev/null +++ b/annotations_filtered/-5798-VRVYA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.92], [5.0, 5.26], [6.0, 6.29], [9.0, 11.03], [11.0, 11.84], [14.0, 14.05], [17.0, 18.25], [19.0, 20.36], [21.0, 21.34], [23.0, 24.06], [27.0, 27.14], [28.0, 28.86], [30.0, 30.65], [32.0, 33.98], [37.0, 37.86], [39.0, 39.02], [40.0, 40.34], [44.0, 44.91], [46.0, 47.51], [48.0, 48.02], [49.0, 50.72], [52.0, 52.76], [54.0, 54.77], [56.0, 57.01], [58.0, 59.48], [60.0, 60.54], [62.0, 66.66], [68.0, 72.22], [73.0, 74.19], [75.0, 76.18], [77.0, 79.98], [83.0, 84.57], [87.0, 90.64], [92.0, 97.43], [98.0, 101.38], [102.0, 106.74], [107.0, 110.03], [112.0, 146.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 84.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.41, 36.03, 0.0, 0.0, 73.97, 0.0, 83.52, 48.23, 85.54, 51.5, 43.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["burping, eructation", 16.08], ["domestic animals, pets", 10.18], ["hum", 10.12]], null, null, null, null, null, [["hum", 47.0], ["mains hum", 28.83], ["speech", 6.35]], null, null, [["speech", 62.57], ["hum", 6.04], ["mains hum", 3.86]], null], "duration": [0.92, 0.26, 0.29, 2.03, 0.84, 0.05, 1.25, 1.36, 0.34, 1.06, 0.14, 0.86, 0.65, 1.98, 0.86, 0.02, 0.34, 0.91, 1.51, 0.02, 1.72, 0.76, 0.77, 1.01, 1.48, 0.54, 4.66, 4.22, 1.19, 1.18, 2.98, 1.57, 3.64, 5.43, 3.38, 4.74, 3.03, 34.74]} \ No newline at end of file diff --git a/annotations_filtered/-5Pku48YPFo_filtered.json b/annotations_filtered/-5Pku48YPFo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37250ff25e1e76f7f3766b85d8ef2e2d74f88cc0 --- /dev/null +++ b/annotations_filtered/-5Pku48YPFo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.4], [13.0, 17.25], [28.0, 31.53], [35.0, 40.85], [43.0, 93.6], [97.0, 102.05], [102.0, 102.78], [103.0, 104.14], [106.0, 109.41], [110.0, 118.64]], "keep_status": [false, true, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 34.91, 38.11, 30.81, 0.0, 32.26, 0.0, 0.0, 35.07, 75.72], "audiomae_on_audioset": [null, [["speech", 22.11], ["screaming", 17.24], ["thunk", 10.79]], [["whale vocalization", 19.7], ["dog", 10.82], ["music", 9.72]], [["music", 69.01], ["musical instrument", 4.65], ["domestic animals, pets", 2.95]], null, [["speech", 37.14], ["vehicle", 17.56], ["radio", 8.43]], null, null, [["speech", 51.87], ["vehicle", 15.02], ["hum", 3.86]], null], "duration": [0.4, 4.25, 3.53, 5.85, 50.6, 5.05, 0.78, 1.14, 3.41, 8.64]} \ No newline at end of file diff --git a/annotations_filtered/-5Rohhkg-7k_filtered.json b/annotations_filtered/-5Rohhkg-7k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5672a5ee2e27a067bff85540da244505872ed47f --- /dev/null +++ b/annotations_filtered/-5Rohhkg-7k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.94], [8.0, 9.31], [10.0, 11.06], [12.0, 12.31], [14.0, 14.39], [15.0, 15.69], [16.0, 16.92], [19.0, 19.33], [20.0, 20.76], [24.0, 25.17], [27.0, 29.67], [33.0, 33.0], [37.0, 37.84], [39.0, 39.34], [40.0, 41.3], [42.0, 44.2], [46.0, 46.41], [49.0, 48.78], [51.0, 52.12], [53.0, 53.59], [56.0, 57.35], [59.0, 60.12], [61.0, 61.94], [62.0, 62.77], [64.0, 65.53], [67.0, 68.99], [72.0, 72.82], [75.0, 75.69], [77.0, 77.3], [79.0, 80.42], [84.0, 84.3], [85.0, 85.9], [87.0, 87.59], [89.0, 93.24], [95.0, 96.13], [97.0, 97.95], [100.0, 103.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.7, 0.0, 0.0, 0.0, 0.0, 69.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.25, 0.0, 0.0, 98.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.94, 1.31, 1.06, 0.31, 0.39, 0.69, 0.92, 0.33, 0.76, 1.17, 2.67, 0.0, 0.84, 0.34, 1.3, 2.2, 0.41, -0.22, 1.12, 0.59, 1.35, 1.12, 0.94, 0.77, 1.53, 1.99, 0.82, 0.69, 0.3, 1.42, 0.3, 0.9, 0.59, 4.24, 1.13, 0.95, 3.76]} \ No newline at end of file diff --git a/annotations_filtered/-5be_UPkLRw_filtered.json b/annotations_filtered/-5be_UPkLRw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ded56415ea66a13ffdf809921497191a392141e --- /dev/null +++ b/annotations_filtered/-5be_UPkLRw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.06], [6.0, 6.29], [9.0, 12.5], [14.0, 16.61], [19.0, 20.55], [24.0, 30.74], [31.0, 32.48], [34.0, 33.76], [35.0, 35.63], [36.0, 40.47], [42.0, 44.19], [45.0, 46.9], [49.0, 49.62], [51.0, 52.59], [53.0, 55.44], [58.0, 58.31], [60.0, 60.81], [63.0, 63.42], [65.0, 65.94], [68.0, 68.39], [70.0, 70.63], [72.0, 72.94], [74.0, 75.36], [77.0, 77.63], [79.0, 79.93], [80.0, 83.71], [84.0, 87.1], [89.0, 89.45], [92.0, 91.83], [93.0, 102.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.96, 0.0, 67.38, 99.99, 0.0, 99.62, 0.0, 0.0, 0.0, 100.0, 99.8, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.1, 100.0, 0.0, 0.0, 99.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.06, 0.29, 3.5, 2.61, 1.55, 6.74, 1.48, -0.24, 0.63, 4.47, 2.19, 1.9, 0.62, 1.59, 2.44, 0.31, 0.81, 0.42, 0.94, 0.39, 0.63, 0.94, 1.36, 0.63, 0.93, 3.71, 3.1, 0.45, -0.17, 9.32]} \ No newline at end of file diff --git a/annotations_filtered/-5twCD8tAMc_filtered.json b/annotations_filtered/-5twCD8tAMc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..191e5ec7d61aece63be80228ed9569155f898788 --- /dev/null +++ b/annotations_filtered/-5twCD8tAMc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 23.65], [25.0, 25.08], [27.0, 28.24], [29.0, 30.91], [35.0, 35.61], [38.0, 42.33], [44.0, 75.29], [76.0, 76.72], [81.0, 89.38]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [33.09, 0.0, 0.0, 0.0, 0.0, 41.56, 0.0, 0.0, 30.12], "audiomae_on_audioset": [[["music", 83.83], ["theremin", 1.62], ["synthesizer", 1.3]], null, null, null, null, [["boat, water vehicle", 16.83], ["music", 14.4], ["vehicle", 11.07]], null, null, [["music", 72.52], ["musical instrument", 4.87], ["cacophony", 2.86]]], "duration": [15.65, 0.08, 1.24, 1.91, 0.61, 4.33, 31.29, 0.72, 8.38]} \ No newline at end of file diff --git a/annotations_filtered/-64q4HpZyaY_filtered.json b/annotations_filtered/-64q4HpZyaY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ffa66f9963d973564c636f5b996bf6a05c275485 --- /dev/null +++ b/annotations_filtered/-64q4HpZyaY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.61], [12.0, 12.16], [13.0, 79.49], [80.0, 109.46], [111.0, 112.77], [116.0, 117.36], [119.0, 124.24]], "keep_status": [true, false, false, false, false, false, false], "silence_prob": [31.4, 0.0, 0.0, 69.07, 0.0, 0.0, 63.96], "audiomae_on_audioset": [[["fly, housefly", 24.9], ["mains hum", 24.38], ["hum", 14.07]], null, null, null, null, null, null], "duration": [7.61, 0.16, 66.49, 29.46, 1.77, 1.36, 5.24]} \ No newline at end of file diff --git a/annotations_filtered/-6fuDrAmhNc_filtered.json b/annotations_filtered/-6fuDrAmhNc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c45d75c044bc791d280bf5cef48105d8a8a4353 --- /dev/null +++ b/annotations_filtered/-6fuDrAmhNc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 26.13], [27.0, 28.88], [32.0, 32.17], [33.0, 38.03], [38.0, 40.19], [41.0, 44.02], [45.0, 46.45], [47.0, 47.63], [49.0, 49.91], [54.0, 54.67], [55.0, 56.32], [58.0, 58.46], [61.0, 61.74], [62.0, 63.98], [65.0, 65.4], [69.0, 69.99], [73.0, 73.89], [75.0, 76.54], [78.0, 84.0], [88.0, 97.07], [98.0, 98.78], [103.0, 155.43], [159.0, 179.0]], "keep_status": [false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [37.01, 0.0, 0.0, 43.45, 32.83, 35.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.32, 31.62, 0.0, 0.0, 34.35], "audiomae_on_audioset": [[["hum", 40.54], ["mains hum", 26.25], ["speech", 5.13]], null, null, [["hum", 22.65], ["mains hum", 17.99], ["music", 17.63]], [["music", 31.89], ["speech", 15.71], ["cattle, bovinae", 7.73]], [["music", 29.62], ["foghorn", 13.93], ["speech", 6.49]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 60.31], ["theremin", 11.38], ["hum", 2.41]], [["music", 53.67], ["brass instrument", 12.72], ["musical instrument", 8.37]], null, null, [["music", 40.6], ["didgeridoo", 12.31], ["gong", 10.97]]], "duration": [2.13, 1.88, 0.17, 5.03, 2.19, 3.02, 1.45, 0.63, 0.91, 0.67, 1.32, 0.46, 0.74, 1.98, 0.4, 0.99, 0.89, 1.54, 6.0, 9.07, 0.78, 52.43, 20.0]} \ No newline at end of file diff --git a/annotations_filtered/-7-2-088LnM_filtered.json b/annotations_filtered/-7-2-088LnM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3037e77d9123ada38a370e4acab1bf677751cae0 --- /dev/null +++ b/annotations_filtered/-7-2-088LnM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.2], [23.0, 22.92], [23.0, 25.52], [28.0, 30.13], [35.0, 36.71], [40.0, 42.08], [44.0, 45.2], [45.0, 46.09], [46.0, 48.91], [49.0, 49.25], [50.0, 50.72], [51.0, 52.47], [53.0, 57.54], [59.0, 67.63], [70.0, 72.08], [72.0, 74.56], [82.0, 82.93], [87.0, 99.28], [99.0, 99.5], [100.0, 100.01], [100.0, 100.45], [101.0, 109.46]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 39.47, 36.04, 0.0, 97.11, 0.0, 0.0, 66.63, 0.0, 0.0, 0.0, 71.14, 67.63, 98.99, 43.85, 0.0, 37.46, 0.0, 0.0, 0.0, 42.74], "audiomae_on_audioset": [null, null, [["whale vocalization", 16.24], ["boing", 16.19], ["moo", 10.98]], [["speech", 72.48], ["applause", 5.84], ["radio", 2.77]], null, null, null, null, null, null, null, null, null, null, null, [["music", 62.7], ["burping, eructation", 2.31], ["percussion", 1.49]], null, [["music", 60.25], ["groan", 6.88], ["grunt", 5.85]], null, null, null, [["gasp", 19.11], ["speech", 13.68], ["breaking", 11.58]]], "duration": [0.2, -0.08, 2.52, 2.13, 1.71, 2.08, 1.2, 1.09, 2.91, 0.25, 0.72, 1.47, 4.54, 8.63, 2.08, 2.56, 0.93, 12.28, 0.5, 0.01, 0.45, 8.46]} \ No newline at end of file diff --git a/annotations_filtered/-7-C6lSAfOs_filtered.json b/annotations_filtered/-7-C6lSAfOs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7891fb6135ecad07780535974d6536de67ae216 --- /dev/null +++ b/annotations_filtered/-7-C6lSAfOs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 76.38], [77.0, 76.99], [79.0, 79.69], [80.0, 81.9], [83.0, 83.78], [85.0, 103.96], [107.0, 107.38], [112.0, 113.68]], "keep_status": [false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 34.04, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 58.1], ["synthesizer", 6.42], ["musical instrument", 3.74]], null, null], "duration": [46.38, -0.01, 0.69, 1.9, 0.78, 18.96, 0.38, 1.68]} \ No newline at end of file diff --git a/annotations_filtered/-78FgmNwyD4_filtered.json b/annotations_filtered/-78FgmNwyD4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf9b08023180659798b5ad494b530bc0a1387acc --- /dev/null +++ b/annotations_filtered/-78FgmNwyD4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.0], [1.0, 1.16], [16.0, 16.8], [36.0, 36.1], [36.0, 37.08], [39.0, 41.34], [48.0, 48.9], [50.0, 50.38], [56.0, 56.52], [58.0, 58.78], [64.0, 64.3], [66.0, 66.85], [67.0, 76.86], [82.0, 82.63], [83.0, 83.62], [84.0, 84.59], [100.0, 101.29], [102.0, 102.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 84.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.14, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.84], ["groan", 22.6], ["screaming", 2.61]], null, null, null, null, null], "duration": [0.0, 0.16, 0.8, 0.1, 1.08, 2.34, 0.9, 0.38, 0.52, 0.78, 0.3, 0.85, 9.86, 0.63, 0.62, 0.59, 1.29, 0.12]} \ No newline at end of file diff --git a/annotations_filtered/-7Sow81yi24_filtered.json b/annotations_filtered/-7Sow81yi24_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac4b1a642f3eddad96ac0ab22d9e6bea1f00ecdd --- /dev/null +++ b/annotations_filtered/-7Sow81yi24_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 32.53], [33.0, 38.33], [40.0, 42.58], [44.0, 45.69], [47.0, 63.64], [64.0, 66.07], [67.0, 73.43], [75.0, 76.65], [77.0, 79.95], [81.0, 84.52], [86.0, 89.21], [94.0, 96.35], [100.0, 101.29], [102.0, 103.87], [107.0, 107.33], [109.0, 110.39], [114.0, 124.66]], "keep_status": [false, true, false, false, false, true, false, false, false, true, true, false, false, false, false, false, true], "silence_prob": [0.0, 49.92, 54.9, 0.0, 47.94, 35.61, 38.42, 0.0, 43.15, 38.54, 36.11, 45.14, 0.0, 0.0, 0.0, 0.0, 28.26], "audiomae_on_audioset": [null, [["music", 25.69], ["hum", 11.38], ["speech", 11.19]], null, null, [["hum", 39.29], ["mains hum", 20.44], ["music", 15.13]], [["gong", 43.33], ["hum", 9.03], ["singing bowl", 6.05]], [["hum", 50.46], ["throbbing", 24.51], ["mains hum", 10.71]], null, [["music", 41.92], ["mains hum", 17.04], ["hum", 14.08]], [["music", 40.52], ["mains hum", 12.71], ["hum", 12.62]], [["hum", 25.29], ["music", 24.57], ["mains hum", 18.16]], [["music", 60.94], ["theremin", 7.71], ["musical instrument", 3.84]], null, null, null, null, [["music", 56.16], ["vehicle", 7.08], ["car", 4.84]]], "duration": [0.53, 5.33, 2.58, 1.69, 16.64, 2.07, 6.43, 1.65, 2.95, 3.52, 3.21, 2.35, 1.29, 1.87, 0.33, 1.39, 10.66]} \ No newline at end of file diff --git a/annotations_filtered/-7cV5cWQmxg_filtered.json b/annotations_filtered/-7cV5cWQmxg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0503a47a9789adfbca6f2006310e7ee8a9edd172 --- /dev/null +++ b/annotations_filtered/-7cV5cWQmxg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.34], [8.0, 8.5], [9.0, 9.83], [17.0, 18.98], [21.0, 21.37], [22.0, 23.33], [27.0, 28.56], [32.0, 33.91], [34.0, 38.38], [39.0, 40.36], [42.0, 61.25], [64.0, 66.39], [68.0, 73.47], [80.0, 79.89], [80.0, 80.2], [88.0, 94.09]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.01, 0.0, 41.98, 94.81, 37.09, 0.0, 0.0, 41.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 28.43], ["music", 28.37], ["synthesizer", 5.19]], null, [["mosquito", 27.65], ["fly, housefly", 20.31], ["insect", 8.7]], null, [["speech", 72.72], ["stomach rumble", 4.04], ["animal", 2.28]], null, null, [["speech", 19.75], ["music", 18.08], ["throbbing", 13.72]]], "duration": [0.34, 0.5, 0.83, 1.98, 0.37, 1.33, 1.56, 1.91, 4.38, 1.36, 19.25, 2.39, 5.47, -0.11, 0.2, 6.09]} \ No newline at end of file diff --git a/annotations_filtered/-7krYJUfFv4_filtered.json b/annotations_filtered/-7krYJUfFv4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f51302be483ed5fc9fc139adeae2180bbc87126 --- /dev/null +++ b/annotations_filtered/-7krYJUfFv4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.58], [9.0, 10.77], [11.0, 11.94], [13.0, 14.71], [15.0, 16.53], [18.0, 19.45], [20.0, 20.78], [31.0, 31.26], [34.0, 34.37], [41.0, 41.52], [42.0, 42.4], [43.0, 43.65], [45.0, 45.25], [47.0, 47.73], [49.0, 49.59], [50.0, 50.63], [53.0, 54.16], [56.0, 56.03], [62.0, 63.31], [65.0, 65.69], [68.0, 68.22], [81.0, 81.48], [92.0, 92.75], [106.0, 107.37], [109.0, 109.34], [110.0, 111.01], [112.0, 112.08], [113.0, 113.48], [114.0, 114.15], [119.0, 119.03], [124.0, 126.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.58, 1.77, 0.94, 1.71, 1.53, 1.45, 0.78, 0.26, 0.37, 0.52, 0.4, 0.65, 0.25, 0.73, 0.59, 0.63, 1.16, 0.03, 1.31, 0.69, 0.22, 0.48, 0.75, 1.37, 0.34, 1.01, 0.08, 0.48, 0.15, 0.03, 2.66]} \ No newline at end of file diff --git a/annotations_filtered/-7mzQx0ebqk_filtered.json b/annotations_filtered/-7mzQx0ebqk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c98ba98248ec2213a7d6e0a8ce39f81ef77b5f7 --- /dev/null +++ b/annotations_filtered/-7mzQx0ebqk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.64], [10.0, 10.27], [14.0, 14.88], [19.0, 20.17], [23.0, 23.01], [24.0, 28.61], [32.0, 34.43], [43.0, 43.29], [45.0, 45.52], [49.0, 49.55], [54.0, 54.06], [62.0, 63.85], [65.0, 72.45], [75.0, 79.84], [82.0, 82.54], [86.0, 89.4], [96.0, 97.44], [98.0, 100.3], [126.0, 125.73], [128.0, 127.7], [131.0, 132.16], [133.0, 133.22], [135.0, 136.95], [141.0, 141.61], [144.0, 143.95], [145.0, 148.66]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 48.27, 73.97, 0.0, 0.0, 0.0, 0.0, 0.0, 61.67, 60.05, 0.0, 94.22, 0.0, 78.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.7], "audiomae_on_audioset": [null, null, null, null, null, [["singing bowl", 23.82], ["music", 21.45], ["burping, eructation", 15.64]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.64, 0.27, 0.88, 1.17, 0.01, 4.61, 2.43, 0.29, 0.52, 0.55, 0.06, 1.85, 7.45, 4.84, 0.54, 3.4, 1.44, 2.3, -0.27, -0.3, 1.16, 0.22, 1.95, 0.61, -0.05, 3.66]} \ No newline at end of file diff --git a/annotations_filtered/-85ubSkzSWg_filtered.json b/annotations_filtered/-85ubSkzSWg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba433da5b7ae7acaea652954bd25d925d1e4605b --- /dev/null +++ b/annotations_filtered/-85ubSkzSWg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.99], [15.0, 14.64], [16.0, 20.71], [22.0, 22.96], [23.0, 23.62], [24.0, 24.85], [25.0, 27.18], [28.0, 30.72], [32.0, 33.2], [33.0, 34.4], [36.0, 36.54], [38.0, 40.76], [42.0, 42.84], [44.0, 45.91], [48.0, 50.75], [56.0, 66.06]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, true, false, false, true, true], "silence_prob": [0.0, 0.0, 38.46, 0.0, 0.0, 0.0, 35.38, 34.84, 0.0, 0.0, 0.0, 33.42, 0.0, 0.0, 42.11, 33.01], "audiomae_on_audioset": [null, null, [["music", 56.86], ["musical instrument", 5.27], ["synthesizer", 3.65]], null, null, null, [["speech", 53.41], ["music", 20.83], ["radio", 4.67]], [["music", 21.99], ["mains hum", 19.4], ["hum", 13.14]], null, null, null, [["music", 32.01], ["speech", 25.74], ["radio", 9.71]], null, null, [["hum", 30.98], ["speech", 20.05], ["music", 8.82]], [["hum", 22.59], ["sidetone", 20.95], ["mains hum", 18.14]]], "duration": [1.99, -0.36, 4.71, 0.96, 0.62, 0.85, 2.18, 2.72, 1.2, 1.4, 0.54, 2.76, 0.84, 1.91, 2.75, 10.06]} \ No newline at end of file diff --git a/annotations_filtered/-8ajIeIeJpY_filtered.json b/annotations_filtered/-8ajIeIeJpY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97a7b5ed9d7fc58d336376fc01c0fbb6be058bac --- /dev/null +++ b/annotations_filtered/-8ajIeIeJpY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.89], [3.0, 5.76], [6.0, 6.86], [8.0, 8.73], [14.0, 15.4], [19.0, 19.99], [22.0, 23.03], [24.0, 24.53], [26.0, 26.33], [34.0, 33.86], [35.0, 35.43], [36.0, 36.31], [37.0, 37.89], [38.0, 39.29], [42.0, 43.29], [44.0, 44.58], [45.0, 45.4], [46.0, 46.4], [48.0, 48.32], [57.0, 57.15], [58.0, 59.56], [60.0, 61.32], [63.0, 63.66], [68.0, 68.47], [74.0, 76.0], [77.0, 78.85], [81.0, 85.8], [86.0, 86.41], [89.0, 90.75], [91.0, 91.93], [92.0, 92.62], [93.0, 93.85]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 45.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.92, 0.0, 83.16, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 34.69], ["radio", 21.67], ["croak", 11.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.11, 2.76, 0.86, 0.73, 1.4, 0.99, 1.03, 0.53, 0.33, -0.14, 0.43, 0.31, 0.89, 1.29, 1.29, 0.58, 0.4, 0.4, 0.32, 0.15, 1.56, 1.32, 0.66, 0.47, 2.0, 1.85, 4.8, 0.41, 1.75, 0.93, 0.62, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/-98BSUhcZtY_filtered.json b/annotations_filtered/-98BSUhcZtY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a82418a39a099355e6fa97b2fa85c83df6601f9 --- /dev/null +++ b/annotations_filtered/-98BSUhcZtY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 16.95], [23.0, 24.24], [33.0, 34.2], [39.0, 41.27], [43.0, 44.42], [47.0, 47.7]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 42.26, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 47.69], ["mains hum", 18.88], ["throbbing", 10.53]], null, null], "duration": [-0.05, 1.24, 1.2, 2.27, 1.42, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/-9DrPi3ki0g_filtered.json b/annotations_filtered/-9DrPi3ki0g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c0ecb066df77a66a8b85fa917e71f1a64ecf188b --- /dev/null +++ b/annotations_filtered/-9DrPi3ki0g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 20.28], [22.0, 45.76]], "keep_status": [false, true], "silence_prob": [34.74, 33.61], "audiomae_on_audioset": [[["music", 49.81], ["theremin", 33.23], ["vehicle", 1.7]], [["music", 44.88], ["brass instrument", 11.34], ["trombone", 7.67]]], "duration": [8.28, 23.76]} \ No newline at end of file diff --git a/annotations_filtered/-9IgLueodZA_filtered.json b/annotations_filtered/-9IgLueodZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c66856930217ffa3dc689ef22d47219dc0ee943d --- /dev/null +++ b/annotations_filtered/-9IgLueodZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.73], [7.0, 9.44], [10.0, 11.7], [15.0, 15.26], [24.0, 24.09], [25.0, 27.26], [28.0, 33.27], [37.0, 37.32], [38.0, 39.36], [41.0, 47.78], [50.0, 53.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 68.28, 0.0, 0.0, 0.0, 65.44, 69.74, 0.0, 0.0, 100.0, 92.15], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, 2.44, 1.7, 0.26, 0.09, 2.26, 5.27, 0.32, 1.36, 6.78, 3.38]} \ No newline at end of file diff --git a/annotations_filtered/-9P7Ge1KmTY_filtered.json b/annotations_filtered/-9P7Ge1KmTY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0466cb21a99f7fafe429ff28d37bddf60faec5be --- /dev/null +++ b/annotations_filtered/-9P7Ge1KmTY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.02], [5.0, 4.7], [5.0, 5.78], [7.0, 8.72], [32.0, 33.22], [38.0, 39.5], [41.0, 42.06], [47.0, 48.24], [51.0, 50.75], [51.0, 52.86], [54.0, 54.65], [65.0, 65.82], [69.0, 68.99], [76.0, 76.65], [79.0, 78.98], [81.0, 80.94], [84.0, 85.06], [87.0, 89.92], [91.0, 91.72], [92.0, 93.43], [95.0, 97.58], [106.0, 107.76], [111.0, 111.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.32, 0.0, 0.0, 96.29, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 65.48], ["telephone", 13.06], ["hum", 5.47]], null, null, null, null, null], "duration": [0.02, -0.3, 0.78, 1.72, 1.22, 1.5, 1.06, 1.24, -0.25, 1.86, 0.65, 0.82, -0.01, 0.65, -0.02, -0.06, 1.06, 2.92, 0.72, 1.43, 2.58, 1.76, 0.35]} \ No newline at end of file diff --git a/annotations_filtered/-A-fBbIXbPo_filtered.json b/annotations_filtered/-A-fBbIXbPo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a48765d3077b8696daa75aa776068712d46f8ee6 --- /dev/null +++ b/annotations_filtered/-A-fBbIXbPo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.78], [13.0, 14.96], [16.0, 20.09], [22.0, 24.02], [25.0, 26.28], [28.0, 33.52], [36.0, 40.32], [41.0, 52.84], [54.0, 59.63], [61.0, 71.81], [73.0, 72.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.48, 0.0, 97.73, 100.0, 0.0, 99.99, 99.93, 96.42, 94.07, 74.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [5.78, 1.96, 4.09, 2.02, 1.28, 5.52, 4.32, 11.84, 5.63, 10.81, -0.21]} \ No newline at end of file diff --git a/annotations_filtered/-A9rFt7ITy4_filtered.json b/annotations_filtered/-A9rFt7ITy4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce4ae8a9b8e60bfb4c38c86d4b74cba98127033f --- /dev/null +++ b/annotations_filtered/-A9rFt7ITy4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 33.86], [36.0, 36.41], [38.0, 39.02], [42.0, 43.14], [45.0, 45.82], [46.0, 47.26], [48.0, 48.44], [50.0, 50.4], [51.0, 51.24], [53.0, 52.89], [58.0, 58.35], [62.0, 62.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.14, 0.41, 1.02, 1.14, 0.82, 1.26, 0.44, 0.4, 0.24, -0.11, 0.35, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/-ASYRiRflDM_filtered.json b/annotations_filtered/-ASYRiRflDM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..122eedafc1eb606182c2bb2dfe5f517ecca30508 --- /dev/null +++ b/annotations_filtered/-ASYRiRflDM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.96], [5.0, 5.0], [6.0, 6.96], [8.0, 8.68], [10.0, 10.96], [14.0, 14.4], [15.0, 16.77], [19.0, 20.97], [22.0, 22.99], [27.0, 27.23], [28.0, 29.74], [31.0, 33.59], [36.0, 36.83], [37.0, 38.97], [45.0, 45.28], [47.0, 47.46], [49.0, 49.84], [51.0, 51.22], [56.0, 57.87], [58.0, 58.75], [60.0, 60.98], [61.0, 61.99], [64.0, 64.1], [65.0, 65.79], [66.0, 66.6], [68.0, 68.91], [70.0, 71.22], [73.0, 73.03], [82.0, 85.29], [87.0, 87.62], [89.0, 89.21], [104.0, 103.64], [105.0, 106.96], [115.0, 114.78], [116.0, 116.51], [120.0, 120.61], [122.0, 122.93], [124.0, 124.95], [126.0, 127.38], [128.0, 129.19], [130.0, 130.11], [131.0, 131.57], [133.0, 134.27], [136.0, 136.38], [144.0, 144.63], [145.0, 147.6], [150.0, 150.21], [153.0, 153.49], [155.0, 155.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.96, 0.0, 0.96, 0.68, 0.96, 0.4, 1.77, 1.97, 0.99, 0.23, 1.74, 2.59, 0.83, 1.97, 0.28, 0.46, 0.84, 0.22, 1.87, 0.75, 0.98, 0.99, 0.1, 0.79, 0.6, 0.91, 1.22, 0.03, 3.29, 0.62, 0.21, -0.36, 1.96, -0.22, 0.51, 0.61, 0.93, 0.95, 1.38, 1.19, 0.11, 0.57, 1.27, 0.38, 0.63, 2.6, 0.21, 0.49, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/-AZg55qXj7U_filtered.json b/annotations_filtered/-AZg55qXj7U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56f67b60fb7943a1bb1cd2b8011d60fd6e08a86a --- /dev/null +++ b/annotations_filtered/-AZg55qXj7U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.62], [6.0, 61.82], [62.0, 86.7], [88.0, 106.52], [109.0, 152.19], [153.0, 178.44]], "keep_status": [false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 35.0, 31.48, 0.0, 33.88], "audiomae_on_audioset": [null, null, [["music", 83.76], ["hum", 7.02], ["throbbing", 1.65]], [["music", 65.55], ["synthesizer", 5.15], ["hum", 4.37]], null, [["music", 22.0], ["hum", 20.87], ["speech", 11.7]]], "duration": [0.62, 55.82, 24.7, 18.52, 43.19, 25.44]} \ No newline at end of file diff --git a/annotations_filtered/-AlTccRsRsk_filtered.json b/annotations_filtered/-AlTccRsRsk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..903e5dfb77dcf3692d88be6f0254c73f162641a9 --- /dev/null +++ b/annotations_filtered/-AlTccRsRsk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.83], [8.0, 8.26], [10.0, 10.29], [12.0, 13.53], [14.0, 16.06], [19.0, 28.41], [30.0, 32.31], [40.0, 46.38], [51.0, 52.98], [56.0, 57.01], [60.0, 59.75], [67.0, 67.98], [74.0, 74.83], [76.0, 77.72], [81.0, 81.9], [84.0, 86.1], [89.0, 89.18], [90.0, 90.98], [91.0, 91.2]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.32, 30.62, 46.02, 55.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.27, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 57.87], ["didgeridoo", 10.98], ["speech", 8.96]], [["music", 65.97], ["synthesizer", 13.99], ["musical instrument", 5.17]], [["music", 18.28], ["didgeridoo", 6.8], ["hum", 6.12]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.83, 0.26, 0.29, 1.53, 2.06, 9.41, 2.31, 6.38, 1.98, 1.01, -0.25, 0.98, 0.83, 1.72, 0.9, 2.1, 0.18, 0.98, 0.2]} \ No newline at end of file diff --git a/annotations_filtered/-ArVBL8EgKU_filtered.json b/annotations_filtered/-ArVBL8EgKU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dbcbe0f1412dbac1e8e96752ef0b4c736c110cef --- /dev/null +++ b/annotations_filtered/-ArVBL8EgKU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 53.81], [59.0, 81.4], [85.0, 107.87], [111.0, 110.78], [112.0, 114.15], [116.0, 116.73]], "keep_status": [false, true, true, false, true, false], "silence_prob": [31.32, 30.02, 30.8, 0.0, 31.94, 0.0], "audiomae_on_audioset": [[["music", 67.23], ["throbbing", 9.77], ["hum", 3.68]], [["music", 37.68], ["buzz", 4.27], ["speech", 3.73]], [["music", 56.65], ["theremin", 5.83], ["didgeridoo", 3.89]], null, [["music", 20.95], ["mains hum", 11.66], ["hum", 11.38]], null], "duration": [25.81, 22.4, 22.87, -0.22, 2.15, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/-BOt25-zf8Q_filtered.json b/annotations_filtered/-BOt25-zf8Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71891db33efe37ab092c2420a33ecd481c345b52 --- /dev/null +++ b/annotations_filtered/-BOt25-zf8Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.49], [11.0, 11.99], [13.0, 13.36], [15.0, 15.7], [23.0, 24.43], [29.0, 29.12], [38.0, 40.31], [43.0, 42.8], [44.0, 49.74], [51.0, 50.95], [52.0, 57.08], [59.0, 61.2], [64.0, 68.2], [69.0, 69.45], [72.0, 77.48], [87.0, 87.56], [89.0, 96.18], [98.0, 99.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.2, 0.0, 40.7, 0.0, 45.21, 49.18, 40.36, 0.0, 47.39, 0.0, 39.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 53.99], ["speech", 15.3], ["guitar", 5.89]], null, [["music", 51.1], ["didgeridoo", 10.0], ["theremin", 6.33]], [["music", 51.86], ["guitar", 6.97], ["bass guitar", 5.58]], [["cattle, bovinae", 24.9], ["livestock, farm animals, working animals", 24.55], ["moo", 18.7]], null, [["music", 27.41], ["speech", 10.79], ["hum", 5.84]], null, [["mains hum", 55.58], ["hum", 19.35], ["speech", 6.47]], null], "duration": [0.49, 0.99, 0.36, 0.7, 1.43, 0.12, 2.31, -0.2, 5.74, -0.05, 5.08, 2.2, 4.2, 0.45, 5.48, 0.56, 7.18, 1.72]} \ No newline at end of file diff --git a/annotations_filtered/-BUI1BdZz94_filtered.json b/annotations_filtered/-BUI1BdZz94_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b4677783f399ad9015fdb85485d71f3a9e07de3 --- /dev/null +++ b/annotations_filtered/-BUI1BdZz94_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.51], [5.0, 4.78], [7.0, 9.26], [11.0, 14.44], [16.0, 18.77], [19.0, 22.42], [23.0, 27.73], [29.0, 31.16], [32.0, 43.9], [45.0, 46.33], [47.0, 49.96], [50.0, 50.03], [50.0, 50.23], [51.0, 52.25], [61.0, 61.86], [66.0, 67.61], [70.0, 72.55], [74.0, 74.48], [77.0, 78.19], [78.0, 78.22], [78.0, 80.06], [95.0, 96.23], [98.0, 98.0], [106.0, 109.49], [110.0, 113.54], [116.0, 123.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 52.74, 50.31, 42.62, 57.01, 68.15, 79.76, 61.08, 0.0, 53.34, 0.0, 0.0, 0.0, 0.0, 0.0, 46.33, 0.0, 0.0, 0.0, 33.8, 0.0, 0.0, 39.88, 43.82, 42.02], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 77.86], ["speech", 10.47], ["hum", 2.52]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 30.93], ["music", 21.64], ["didgeridoo", 9.88]], null, null, null, [["speech", 81.71], ["inside, small room", 2.28], ["hum", 1.83]], null, null, [["music", 43.33], ["didgeridoo", 5.27], ["mains hum", 5.1]], [["music", 35.91], ["didgeridoo", 14.97], ["whale vocalization", 6.16]], [["music", 34.09], ["hum", 13.27], ["gong", 12.95]]], "duration": [0.51, -0.22, 2.26, 3.44, 2.77, 3.42, 4.73, 2.16, 11.9, 1.33, 2.96, 0.03, 0.23, 1.25, 0.86, 1.61, 2.55, 0.48, 1.19, 0.22, 2.06, 1.23, 0.0, 3.49, 3.54, 7.89]} \ No newline at end of file diff --git a/annotations_filtered/-BgZFaMJRxM_filtered.json b/annotations_filtered/-BgZFaMJRxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b97362e90eb6f798daefc7d304a08330545147c9 --- /dev/null +++ b/annotations_filtered/-BgZFaMJRxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.34], [7.0, 7.79], [9.0, 10.56], [15.0, 17.19], [17.0, 18.17], [19.0, 19.72], [21.0, 23.97], [25.0, 28.31], [30.0, 32.85], [43.0, 43.6], [45.0, 45.55], [48.0, 52.08], [56.0, 61.15], [64.0, 65.4], [67.0, 68.32], [69.0, 69.89], [70.0, 72.89], [74.0, 77.5], [81.0, 83.39], [84.0, 104.89], [106.0, 106.46], [107.0, 108.24], [110.0, 111.57], [115.0, 116.75], [120.0, 120.61], [123.0, 124.21], [126.0, 127.99], [130.0, 131.03], [132.0, 134.27], [135.0, 135.68], [136.0, 137.03], [139.0, 141.13], [142.0, 142.92], [146.0, 145.71], [146.0, 147.06], [149.0, 149.44], [152.0, 156.36], [162.0, 163.31], [164.0, 165.11], [168.0, 168.91], [174.0, 174.97], [175.0, 176.34], [177.0, 178.58], [180.0, 179.91]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [45.75, 0.0, 0.0, 47.98, 0.0, 0.0, 54.43, 50.51, 56.25, 0.0, 0.0, 57.32, 61.67, 0.0, 0.0, 0.0, 39.86, 58.55, 52.51, 33.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.18, 0.0, 0.0, 68.67, 0.0, 0.0, 0.0, 0.0, 47.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["chirp tone", 24.02], ["whale vocalization", 16.52], ["sine wave", 16.23]], null, null, [["music", 31.28], ["whale vocalization", 20.69], ["singing bowl", 6.34]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.97], ["whale vocalization", 14.45], ["hum", 11.47]], null, null, [["hum", 47.44], ["throbbing", 31.47], ["mains hum", 6.89]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 28.27], ["mains hum", 24.35], ["speech", 22.56]], null, null, null, null, null, null, null], "duration": [3.34, 0.79, 1.56, 2.19, 1.17, 0.72, 2.97, 3.31, 2.85, 0.6, 0.55, 4.08, 5.15, 1.4, 1.32, 0.89, 2.89, 3.5, 2.39, 20.89, 0.46, 1.24, 1.57, 1.75, 0.61, 1.21, 1.99, 1.03, 2.27, 0.68, 1.03, 2.13, 0.92, -0.29, 1.06, 0.44, 4.36, 1.31, 1.11, 0.91, 0.97, 1.34, 1.58, -0.09]} \ No newline at end of file diff --git a/annotations_filtered/-BiLCJxpqi4_filtered.json b/annotations_filtered/-BiLCJxpqi4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4e84ce4527a128fd88069ab3e7573b1ebbbc340 --- /dev/null +++ b/annotations_filtered/-BiLCJxpqi4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[54.0, 60.37], [62.0, 67.19], [68.0, 69.58], [70.0, 71.46], [73.0, 73.52], [74.0, 75.63]], "keep_status": [true, false, false, false, false, false], "silence_prob": [38.54, 43.9, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 25.44], ["hum", 22.22], ["throbbing", 14.46]], [["hum", 36.73], ["music", 22.02], ["throbbing", 14.96]], null, null, null, null], "duration": [6.37, 5.19, 1.58, 1.46, 0.52, 1.63]} \ No newline at end of file diff --git a/annotations_filtered/-C7Fcg58rZU_filtered.json b/annotations_filtered/-C7Fcg58rZU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..719dad02ea935851f70f39c975120de708ad5af6 --- /dev/null +++ b/annotations_filtered/-C7Fcg58rZU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.86], [5.0, 19.09], [33.0, 35.87], [46.0, 46.79], [48.0, 48.3], [55.0, 58.13]], "keep_status": [false, false, true, false, false, false], "silence_prob": [0.0, 30.24, 40.01, 0.0, 0.0, 34.16], "audiomae_on_audioset": [null, [["music", 48.55], ["throbbing", 17.16], ["hum", 16.5]], [["music", 42.11], ["musical instrument", 6.9], ["synthesizer", 5.57]], null, null, [["speech", 59.17], ["explosion", 8.36], ["busy signal", 4.23]]], "duration": [1.86, 14.09, 2.87, 0.79, 0.3, 3.13]} \ No newline at end of file diff --git a/annotations_filtered/-CKzCdneg04_filtered.json b/annotations_filtered/-CKzCdneg04_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba80e7eb86f5199d1fe8a4c6ccf627a216f28b20 --- /dev/null +++ b/annotations_filtered/-CKzCdneg04_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.98], [4.0, 5.48], [28.0, 27.94], [29.0, 29.15], [31.0, 31.14], [32.0, 33.51], [36.0, 35.72], [36.0, 36.93], [39.0, 39.55], [46.0, 45.79], [50.0, 50.03], [54.0, 53.92], [56.0, 60.59], [61.0, 63.04], [69.0, 73.55], [78.0, 87.08], [99.0, 99.37], [103.0, 109.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 44.87, 42.3, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 71.34], ["door", 2.71], ["telephone", 2.64]], [["speech", 61.25], ["ding", 11.35], ["thunk", 10.3]], null, null], "duration": [-0.02, 1.48, -0.06, 0.15, 0.14, 1.51, -0.28, 0.93, 0.55, -0.21, 0.03, -0.08, 4.59, 2.04, 4.55, 9.08, 0.37, 6.98]} \ No newline at end of file diff --git a/annotations_filtered/-CSIqCS1WIk_filtered.json b/annotations_filtered/-CSIqCS1WIk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43434f97cb91519933a57ebe7f1827c4ea60dc4e --- /dev/null +++ b/annotations_filtered/-CSIqCS1WIk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.82], [5.0, 7.57], [9.0, 10.52], [11.0, 12.31], [14.0, 15.06], [18.0, 27.65], [30.0, 57.5], [58.0, 60.94], [62.0, 64.1], [67.0, 114.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.64, 100.0, 0.0, 0.0, 0.0, 100.0, 99.8, 98.51, 91.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [2.82, 2.57, 1.52, 1.31, 1.06, 9.65, 27.5, 2.94, 2.1, 47.57]} \ No newline at end of file diff --git a/annotations_filtered/-CXBIAH4Kgo_filtered.json b/annotations_filtered/-CXBIAH4Kgo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6835cf44bf826ae6a7a5a88065cefb836f636e11 --- /dev/null +++ b/annotations_filtered/-CXBIAH4Kgo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.01], [5.0, 6.44], [9.0, 13.1], [18.0, 19.62], [20.0, 23.01], [25.0, 25.27], [26.0, 39.75], [41.0, 44.64], [46.0, 47.28], [49.0, 51.11], [53.0, 56.0], [57.0, 58.95], [60.0, 61.42], [64.0, 66.14], [67.0, 71.24], [72.0, 74.34], [75.0, 76.65], [78.0, 79.68], [80.0, 87.93], [91.0, 92.94], [96.0, 97.12], [99.0, 102.25], [104.0, 105.17], [106.0, 108.11], [109.0, 129.44], [133.0, 134.79], [136.0, 137.66], [139.0, 140.95], [144.0, 145.96], [148.0, 150.25], [152.0, 154.95], [156.0, 156.44], [158.0, 158.4], [159.0, 161.86]], "keep_status": [false, false, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 29.1, 0.0, 37.35, 0.0, 47.66, 54.83, 0.0, 73.36, 58.81, 0.0, 0.0, 62.58, 60.7, 74.92, 0.0, 0.0, 42.17, 0.0, 0.0, 68.15, 0.0, 67.89, 66.76, 0.0, 0.0, 0.0, 0.0, 65.79, 37.73, 0.0, 0.0, 40.9], "audiomae_on_audioset": [null, null, [["speech", 31.48], ["explosion", 20.57], ["music", 11.66]], null, [["fly, housefly", 30.96], ["fowl", 9.91], ["creak", 7.03]], null, [["hum", 15.79], ["rumble", 14.23], ["music", 11.52]], null, null, null, null, null, null, null, null, null, null, null, [["hum", 39.88], ["speech", 22.85], ["mains hum", 17.54]], null, null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 24.8], ["music", 24.74], ["hum", 4.13]], null, null, [["music", 45.36], ["speech", 39.28], ["whale vocalization", 2.24]]], "duration": [1.01, 1.44, 4.1, 1.62, 3.01, 0.27, 13.75, 3.64, 1.28, 2.11, 3.0, 1.95, 1.42, 2.14, 4.24, 2.34, 1.65, 1.68, 7.93, 1.94, 1.12, 3.25, 1.17, 2.11, 20.44, 1.79, 1.66, 1.95, 1.96, 2.25, 2.95, 0.44, 0.4, 2.86]} \ No newline at end of file diff --git a/annotations_filtered/-CgUGjRFukQ_filtered.json b/annotations_filtered/-CgUGjRFukQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44554d57208a2cc7fa70d93cca7dbcd0ea44b160 --- /dev/null +++ b/annotations_filtered/-CgUGjRFukQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.46], [17.0, 17.29], [23.0, 24.27], [26.0, 27.35], [29.0, 29.3], [31.0, 31.95], [33.0, 34.57], [35.0, 35.95], [38.0, 38.8], [41.0, 41.1], [47.0, 47.19], [49.0, 51.26], [52.0, 55.46], [60.0, 62.02], [65.0, 66.07], [71.0, 71.86], [77.0, 77.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.18, 48.06, 37.19, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 87.34], ["speech", 6.73], ["whale vocalization", 1.9]], [["didgeridoo", 50.89], ["music", 26.01], ["musical instrument", 2.61]], [["music", 12.37], ["hum", 8.58], ["vehicle", 5.67]], null, null, null], "duration": [1.46, 0.29, 1.27, 1.35, 0.3, 0.95, 1.57, 0.95, 0.8, 0.1, 0.19, 2.26, 3.46, 2.02, 1.07, 0.86, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/-CzO7z1dZ1A_filtered.json b/annotations_filtered/-CzO7z1dZ1A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f1ddba8f0ecafa41bfe7e8bac9f79980bd58e03 --- /dev/null +++ b/annotations_filtered/-CzO7z1dZ1A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 45.0], [53.0, 53.6], [58.0, 60.51], [63.0, 63.98], [69.0, 87.47]], "keep_status": [false, false, false, false, false], "silence_prob": [88.46, 0.0, 92.48, 0.0, 99.82], "audiomae_on_audioset": [null, null, null, null, null], "duration": [7.0, 0.6, 2.51, 0.98, 18.47]} \ No newline at end of file diff --git a/annotations_filtered/-DF-MgSuhQ0_filtered.json b/annotations_filtered/-DF-MgSuhQ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..441c93656fdef2601b72918650f116fbb59ceee0 --- /dev/null +++ b/annotations_filtered/-DF-MgSuhQ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.73], [13.0, 14.4], [16.0, 17.31], [18.0, 18.71], [19.0, 20.83], [24.0, 24.31], [27.0, 29.34], [31.0, 34.8], [35.0, 36.75], [38.0, 39.31], [41.0, 50.11], [51.0, 52.05], [54.0, 54.68], [56.0, 57.4], [58.0, 59.59], [63.0, 64.81], [66.0, 70.04], [71.0, 127.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [58.55, 0.0, 0.0, 0.0, 0.0, 0.0, 77.53, 73.06, 0.0, 0.0, 34.61, 0.0, 0.0, 0.0, 0.0, 0.0, 29.53, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["hum", 28.83], ["music", 26.22], ["throbbing", 24.55]], null, null, null, null, null, [["hum", 17.16], ["rumble", 15.7], ["mains hum", 12.19]], null], "duration": [2.73, 1.4, 1.31, 0.71, 1.83, 0.31, 2.34, 3.8, 1.75, 1.31, 9.11, 1.05, 0.68, 1.4, 1.59, 1.81, 4.04, 56.06]} \ No newline at end of file diff --git a/annotations_filtered/-DXQJLwDAwg_filtered.json b/annotations_filtered/-DXQJLwDAwg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c24741c221a08374bf5c5775183ea311bc2bfc22 --- /dev/null +++ b/annotations_filtered/-DXQJLwDAwg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.73], [7.0, 7.91], [10.0, 10.0], [10.0, 10.49], [11.0, 12.66], [14.0, 14.22], [15.0, 19.21], [21.0, 21.81], [22.0, 23.03], [24.0, 25.22], [26.0, 28.39], [30.0, 33.35], [36.0, 37.74], [39.0, 43.75], [47.0, 48.32], [50.0, 50.84], [52.0, 54.65], [55.0, 55.95], [58.0, 58.68], [60.0, 59.86], [61.0, 61.82], [63.0, 66.48], [67.0, 67.81], [69.0, 69.42], [71.0, 74.07], [76.0, 76.44], [78.0, 78.39], [81.0, 81.19], [85.0, 85.46], [89.0, 89.78], [92.0, 92.52], [93.0, 93.53], [95.0, 95.79], [100.0, 100.55], [102.0, 103.28], [104.0, 104.95], [107.0, 107.64], [113.0, 114.08], [115.0, 116.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.97, 0.0, 0.0, 0.0, 82.43, 79.07, 0.0, 63.21, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 86.64, 0.0, 0.0, 74.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, 0.91, 0.0, 0.49, 1.66, 0.22, 4.21, 0.81, 1.03, 1.22, 2.39, 3.35, 1.74, 4.75, 1.32, 0.84, 2.65, 0.95, 0.68, -0.14, 0.82, 3.48, 0.81, 0.42, 3.07, 0.44, 0.39, 0.19, 0.46, 0.78, 0.52, 0.53, 0.79, 0.55, 1.28, 0.95, 0.64, 1.08, 1.16]} \ No newline at end of file diff --git a/annotations_filtered/-DXU2ZHuiTs_filtered.json b/annotations_filtered/-DXU2ZHuiTs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3055202e3bd3de197e0c3ecf9b936f20c790d519 --- /dev/null +++ b/annotations_filtered/-DXU2ZHuiTs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.16], [1.0, 1.54], [8.0, 8.21], [12.0, 11.92], [13.0, 13.73], [16.0, 16.39], [17.0, 17.66], [23.0, 23.04], [27.0, 28.22], [29.0, 29.4], [31.0, 31.45], [33.0, 33.84], [34.0, 34.74], [36.0, 36.83], [39.0, 39.12], [40.0, 40.09], [41.0, 41.81], [48.0, 48.63], [52.0, 51.98], [55.0, 54.97], [56.0, 56.4], [60.0, 60.39], [62.0, 61.87], [63.0, 62.92], [65.0, 65.35], [67.0, 67.31], [69.0, 69.33], [73.0, 73.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 0.54, 0.21, -0.08, 0.73, 0.39, 0.66, 0.04, 1.22, 0.4, 0.45, 0.84, 0.74, 0.83, 0.12, 0.09, 0.81, 0.63, -0.02, -0.03, 0.4, 0.39, -0.13, -0.08, 0.35, 0.31, 0.33, 0.08]} \ No newline at end of file diff --git a/annotations_filtered/-DqmTaUK-Ow_filtered.json b/annotations_filtered/-DqmTaUK-Ow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d37022a6c4cb9f8dc6753bd66e848eb62155559b --- /dev/null +++ b/annotations_filtered/-DqmTaUK-Ow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.33], [24.0, 25.73], [26.0, 34.1], [35.0, 38.38], [40.0, 49.4], [50.0, 52.25], [58.0, 59.34], [65.0, 65.52], [66.0, 66.92]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 73.51, 99.31, 68.41, 69.34, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.33, 1.73, 8.1, 3.38, 9.4, 2.25, 1.34, 0.52, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/-EZ9f-GgWVQ_filtered.json b/annotations_filtered/-EZ9f-GgWVQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e47c95f985c9ddc12a4d96584a9b60a918937c4 --- /dev/null +++ b/annotations_filtered/-EZ9f-GgWVQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.84], [9.0, 10.12], [12.0, 13.24], [16.0, 17.39], [19.0, 21.52], [23.0, 25.2], [33.0, 33.98], [35.0, 35.16], [38.0, 42.33], [43.0, 44.42], [46.0, 47.92], [48.0, 48.09], [49.0, 49.08], [52.0, 52.69], [54.0, 55.34], [57.0, 57.18], [60.0, 61.21], [62.0, 63.12], [65.0, 65.64], [66.0, 66.82], [68.0, 68.77], [70.0, 75.0], [78.0, 79.03], [81.0, 82.51], [84.0, 85.5], [88.0, 88.13], [90.0, 91.29], [96.0, 97.53], [99.0, 99.17], [101.0, 101.12], [102.0, 104.55], [112.0, 116.61], [117.0, 118.42], [120.0, 133.79], [134.0, 137.03], [138.0, 144.29], [147.0, 148.29], [150.0, 150.89], [156.0, 157.11], [159.0, 158.97], [160.0, 160.79], [163.0, 166.85]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [60.14, 0.0, 0.0, 0.0, 37.93, 41.87, 0.0, 0.0, 97.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.89, 38.59, 0.0, 33.98, 79.59, 77.36, 0.0, 0.0, 0.0, 0.0, 0.0, 78.38], "audiomae_on_audioset": [null, null, null, null, [["water", 19.27], ["speech", 13.46], ["liquid", 13.21]], [["sidetone", 74.54], ["speech", 17.17], ["radio", 1.19]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["thunk", 32.92], ["speech", 13.75], ["chirp tone", 6.37]], null, [["speech", 42.61], ["thunk", 6.13], ["goat", 3.46]], null, null, null, null, null, null, null, null], "duration": [2.84, 1.12, 1.24, 1.39, 2.52, 2.2, 0.98, 0.16, 4.33, 1.42, 1.92, 0.09, 0.08, 0.69, 1.34, 0.18, 1.21, 1.12, 0.64, 0.82, 0.77, 5.0, 1.03, 1.51, 1.5, 0.13, 1.29, 1.53, 0.17, 0.12, 2.55, 4.61, 1.42, 13.79, 3.03, 6.29, 1.29, 0.89, 1.11, -0.03, 0.79, 3.85]} \ No newline at end of file diff --git a/annotations_filtered/-EuO6OFypLo_filtered.json b/annotations_filtered/-EuO6OFypLo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad6b3e0b1d34f02bfce3f9da7d4e9c7c31e193c5 --- /dev/null +++ b/annotations_filtered/-EuO6OFypLo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.07], [11.0, 11.15], [15.0, 23.67], [25.0, 25.49], [27.0, 27.65], [29.0, 29.76], [34.0, 35.68], [42.0, 42.43], [45.0, 45.66], [47.0, 48.09], [54.0, 55.29], [60.0, 61.33], [66.0, 68.93], [70.0, 71.46], [72.0, 72.93], [85.0, 85.43], [87.0, 89.18], [95.0, 98.56], [102.0, 105.31], [109.0, 111.15], [114.0, 121.85], [122.0, 126.89], [128.0, 130.74], [132.0, 145.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true], "silence_prob": [0.0, 0.0, 31.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.15, 0.0, 0.0, 0.0, 59.15, 56.33, 54.43, 50.76, 39.69, 48.23, 53.72, 36.71], "audiomae_on_audioset": [null, null, [["didgeridoo", 54.15], ["music", 22.74], ["speech", 14.44]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 17.55], ["sidetone", 13.26], ["sine wave", 9.82]], [["sidetone", 36.27], ["speech", 7.18], ["hum", 6.21]], null, [["electric shaver, electric razor", 43.36], ["hum", 7.11], ["music", 4.27]]], "duration": [0.07, 0.15, 8.67, 0.49, 0.65, 0.76, 1.68, 0.43, 0.66, 1.09, 1.29, 1.33, 2.93, 1.46, 0.93, 0.43, 2.18, 3.56, 3.31, 2.15, 7.85, 4.89, 2.74, 13.89]} \ No newline at end of file diff --git a/annotations_filtered/-F1-sTyGvwA_filtered.json b/annotations_filtered/-F1-sTyGvwA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17432c4b76c13d4686c227c777232bf63000b327 --- /dev/null +++ b/annotations_filtered/-F1-sTyGvwA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.67], [12.0, 14.07], [15.0, 16.65], [18.0, 31.94], [35.0, 36.56], [38.0, 40.61], [41.0, 42.6], [43.0, 57.03], [58.0, 60.25], [61.0, 66.48], [68.0, 69.15], [69.0, 71.79], [73.0, 76.81], [77.0, 79.84], [81.0, 85.78], [86.0, 88.13], [90.0, 92.79], [94.0, 96.55], [97.0, 96.69], [97.0, 100.08], [100.0, 114.72], [116.0, 118.49], [119.0, 120.24], [121.0, 120.8], [121.0, 120.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.44, 0.0, 99.56, 0.0, 99.78, 0.0, 96.77, 98.66, 99.26, 0.0, 89.9, 93.6, 97.73, 88.83, 91.3, 97.33, 94.22, 0.0, 91.13, 78.55, 65.79, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.67, 2.07, 1.65, 13.94, 1.56, 2.61, 1.6, 14.03, 2.25, 5.48, 1.15, 2.79, 3.81, 2.84, 4.78, 2.13, 2.79, 2.55, -0.31, 3.08, 14.72, 2.49, 1.24, -0.2, -0.08]} \ No newline at end of file diff --git a/annotations_filtered/-FQOaUEE69I_filtered.json b/annotations_filtered/-FQOaUEE69I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99b2fd5fdac71c95187c9a0091f61a3a7ba29df0 --- /dev/null +++ b/annotations_filtered/-FQOaUEE69I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.71], [4.0, 5.95], [15.0, 20.61], [22.0, 22.4], [23.0, 23.7], [24.0, 25.81], [26.0, 27.08], [28.0, 28.34], [30.0, 30.72], [31.0, 34.33], [35.0, 35.33], [40.0, 43.02], [44.0, 46.09], [48.0, 48.52], [50.0, 50.82], [52.0, 52.96], [57.0, 58.06], [62.0, 62.46], [64.0, 64.47], [66.0, 66.34], [68.0, 71.2], [73.0, 73.8], [75.0, 75.46], [77.0, 78.14], [79.0, 81.5], [84.0, 85.72], [87.0, 87.69], [91.0, 91.62], [93.0, 96.11], [97.0, 97.6], [99.0, 100.25], [104.0, 104.4], [107.0, 107.91], [110.0, 110.25], [111.0, 118.81], [120.0, 122.07], [123.0, 137.61], [139.0, 140.41], [143.0, 143.26], [148.0, 151.63], [152.0, 153.86], [154.0, 156.12], [156.0, 157.47], [158.0, 158.62], [160.0, 161.38], [162.0, 165.4], [166.0, 166.48], [167.0, 167.64], [175.0, 180.82]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 39.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.45, 0.0, 99.44, 91.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.14, 0.0, 0.0, 0.0, 34.43, 0.0, 0.0, 0.0, 84.43, 0.0, 0.0, 0.0, 0.0, 0.0, 79.07, 56.1, 35.47, 0.0, 0.0, 52.39, 0.0, 47.12, 0.0, 0.0, 0.0, 30.41, 0.0, 0.0, 46.02], "audiomae_on_audioset": [null, null, [["speech", 44.89], ["sidetone", 13.71], ["chirp tone", 11.39]], null, null, null, null, null, null, [["speech", 42.88], ["crackle", 7.42], ["crushing", 4.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 56.83], ["sine wave", 15.21], ["sidetone", 8.1]], null, null, null, null, null, null, null, null, null, null, null, [["hum", 32.18], ["music", 29.24], ["mains hum", 12.57]], null, null, null, null, [["speech", 36.44], ["sidetone", 31.39], ["music", 8.37]], null, null, null, [["speech", 27.73], ["livestock, farm animals, working animals", 11.15], ["cattle, bovinae", 5.06]], null, null, [["music", 18.98], ["chirp tone", 13.64], ["crushing", 12.95]]], "duration": [0.71, 1.95, 5.61, 0.4, 0.7, 1.81, 1.08, 0.34, 0.72, 3.33, 0.33, 3.02, 2.09, 0.52, 0.82, 0.96, 1.06, 0.46, 0.47, 0.34, 3.2, 0.8, 0.46, 1.14, 2.5, 1.72, 0.69, 0.62, 3.11, 0.6, 1.25, 0.4, 0.91, 0.25, 7.81, 2.07, 14.61, 1.41, 0.26, 3.63, 1.86, 2.12, 1.47, 0.62, 1.38, 3.4, 0.48, 0.64, 5.82]} \ No newline at end of file diff --git a/annotations_filtered/-FU65KX7aJs_filtered.json b/annotations_filtered/-FU65KX7aJs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09fa577aa9881c06d9cfe6230358c13bdaa9713b --- /dev/null +++ b/annotations_filtered/-FU65KX7aJs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.58], [14.0, 15.28], [17.0, 16.95], [19.0, 39.48], [41.0, 52.96], [54.0, 69.43], [70.0, 74.93], [76.0, 77.58], [78.0, 97.44], [98.0, 98.88], [99.0, 100.03], [102.0, 103.03], [104.0, 105.33], [111.0, 111.0], [116.0, 117.07], [121.0, 122.52], [125.0, 125.81], [126.0, 126.32], [126.0, 130.45], [132.0, 132.93], [134.0, 137.42], [138.0, 138.32], [139.0, 139.85], [141.0, 141.89], [145.0, 148.1], [149.0, 149.18], [171.0, 171.22], [171.0, 171.36], [175.0, 174.77]], "keep_status": [false, false, false, true, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, true, false, false, false, false], "silence_prob": [59.24, 0.0, 0.0, 30.61, 32.83, 30.67, 39.7, 0.0, 36.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.69, 0.0, 49.54, 0.0, 0.0, 0.0, 41.34, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 39.55], ["didgeridoo", 17.69], ["fly, housefly", 10.38]], [["music", 58.18], ["synthesizer", 12.1], ["hum", 7.36]], [["music", 54.02], ["didgeridoo", 24.44], ["synthesizer", 4.28]], [["wheeze", 12.09], ["speech", 7.39], ["frog", 6.24]], null, [["speech", 38.1], ["animal", 17.99], ["livestock, farm animals, working animals", 12.74]], null, null, null, null, null, null, null, null, null, [["speech", 55.95], ["animal", 9.45], ["whale vocalization", 4.16]], null, [["hum", 29.43], ["mains hum", 18.48], ["music", 9.87]], null, null, null, [["mains hum", 28.61], ["hum", 27.62], ["radio", 8.48]], null, null, null, null], "duration": [4.58, 1.28, -0.05, 20.48, 11.96, 15.43, 4.93, 1.58, 19.44, 0.88, 1.03, 1.03, 1.33, 0.0, 1.07, 1.52, 0.81, 0.32, 4.45, 0.93, 3.42, 0.32, 0.85, 0.89, 3.1, 0.18, 0.22, 0.36, -0.23]} \ No newline at end of file diff --git a/annotations_filtered/-G7OPYUlnT0_filtered.json b/annotations_filtered/-G7OPYUlnT0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29b58ce6615e635f88882f33bc4ddbf4180d3b14 --- /dev/null +++ b/annotations_filtered/-G7OPYUlnT0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.89], [23.0, 23.26], [25.0, 25.29], [31.0, 30.89], [93.0, 93.24]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [-0.11, 0.26, 0.29, -0.11, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/-GSZwG_s-8A_filtered.json b/annotations_filtered/-GSZwG_s-8A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80d1032edd542d8390bbfa6ecc5a6fa936df62d3 --- /dev/null +++ b/annotations_filtered/-GSZwG_s-8A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.44], [3.0, 4.26], [7.0, 9.54], [10.0, 12.87], [13.0, 13.39], [17.0, 17.25], [20.0, 23.23], [24.0, 28.97], [29.0, 40.56], [41.0, 43.71], [45.0, 58.67], [59.0, 60.76], [61.0, 63.29], [64.0, 65.31], [67.0, 71.14], [72.0, 74.7], [75.0, 75.73], [77.0, 78.6], [80.0, 82.22], [84.0, 90.17], [90.0, 90.21], [94.0, 96.48], [98.0, 114.37], [117.0, 142.94], [146.0, 167.85], [171.0, 180.91], [181.0, 182.66], [183.0, 195.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true], "silence_prob": [0.0, 0.0, 99.99, 94.81, 0.0, 0.0, 100.0, 97.43, 75.55, 100.0, 85.17, 0.0, 85.72, 0.0, 99.98, 100.0, 0.0, 0.0, 100.0, 98.01, 0.0, 50.11, 39.91, 37.24, 38.84, 52.86, 0.0, 38.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["ding", 21.15], ["cattle, bovinae", 20.11], ["livestock, farm animals, working animals", 16.65]], [["clang", 18.96], ["ding", 15.69], ["fly, housefly", 13.34]], [["fly, housefly", 56.08], ["insect", 19.37], ["mosquito", 9.11]], null, null, [["speech", 43.07], ["explosion", 7.66], ["buzz", 7.05]]], "duration": [1.44, 1.26, 2.54, 2.87, 0.39, 0.25, 3.23, 4.97, 11.56, 2.71, 13.67, 1.76, 2.29, 1.31, 4.14, 2.7, 0.73, 1.6, 2.22, 6.17, 0.21, 2.48, 16.37, 25.94, 21.85, 9.91, 1.66, 12.0]} \ No newline at end of file diff --git a/annotations_filtered/-G_I8dQHN5s_filtered.json b/annotations_filtered/-G_I8dQHN5s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a49d86f0063c3d373e52acf55677352fa2cc78da --- /dev/null +++ b/annotations_filtered/-G_I8dQHN5s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.31], [20.0, 20.29], [33.0, 33.71], [35.0, 36.98], [38.0, 39.53], [40.0, 44.63], [46.0, 47.28], [48.0, 48.51], [49.0, 51.38], [54.0, 55.81], [57.0, 57.55], [60.0, 60.18], [62.0, 66.29], [70.0, 71.96], [76.0, 76.5], [79.0, 78.8], [81.0, 82.83], [83.0, 85.87], [87.0, 88.23], [90.0, 91.45], [94.0, 93.92], [105.0, 104.6], [105.0, 105.83], [107.0, 107.18], [108.0, 108.48], [113.0, 113.0], [115.0, 116.68], [121.0, 120.85], [123.0, 128.02], [129.0, 129.46], [142.0, 141.67], [147.0, 150.2], [152.0, 152.66], [154.0, 156.52], [161.0, 173.03], [187.0, 187.62], [193.0, 193.21], [193.0, 193.41], [193.0, 194.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 81.35, 0.0, 0.0, 79.94, 0.0, 0.0, 0.0, 78.38, 0.0, 0.0, 0.0, 0.0, 49.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.78, 0.0, 0.0, 59.96, 0.0, 64.18, 55.11, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 22.34], ["mains hum", 18.99], ["hum", 7.49]], null, null, null, null, null, null, null, null, null, null, [["mains hum", 50.48], ["hum", 24.6], ["music", 16.73]], null, null, null, null, null, null, null, null, null, null], "duration": [0.31, 0.29, 0.71, 1.98, 1.53, 4.63, 1.28, 0.51, 2.38, 1.81, 0.55, 0.18, 4.29, 1.96, 0.5, -0.2, 1.83, 2.87, 1.23, 1.45, -0.08, -0.4, 0.83, 0.18, 0.48, 0.0, 1.68, -0.15, 5.02, 0.46, -0.33, 3.2, 0.66, 2.52, 12.03, 0.62, 0.21, 0.41, 1.86]} \ No newline at end of file diff --git a/annotations_filtered/-GaJPgI3jh4_filtered.json b/annotations_filtered/-GaJPgI3jh4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc15c0082c4eabe473e54fdb64b8b495dd5b7585 --- /dev/null +++ b/annotations_filtered/-GaJPgI3jh4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.45], [17.0, 17.36], [22.0, 22.01], [27.0, 27.5], [30.0, 33.29], [48.0, 48.27], [74.0, 74.56], [77.0, 79.41], [106.0, 105.6], [107.0, 108.58], [114.0, 113.71], [129.0, 130.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 58.47, 0.0, 0.0, 93.29, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 0.36, 0.01, 0.5, 3.29, 0.27, 0.56, 2.41, -0.4, 1.58, -0.29, 1.42]} \ No newline at end of file diff --git a/annotations_filtered/-H6l6-_elF0_filtered.json b/annotations_filtered/-H6l6-_elF0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c01e2c0c035ff57a527d11c6468e11aa68e16e51 --- /dev/null +++ b/annotations_filtered/-H6l6-_elF0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.13], [13.0, 14.25], [17.0, 17.69], [20.0, 21.29], [26.0, 37.62], [39.0, 48.19], [52.0, 52.44], [57.0, 57.79], [62.0, 62.53], [66.0, 67.32], [76.0, 76.86], [81.0, 81.7], [85.0, 86.36], [95.0, 96.08], [103.0, 105.76], [114.0, 115.53], [120.0, 120.78], [125.0, 125.81], [133.0, 133.24], [133.0, 138.7], [141.0, 142.01], [144.0, 145.56], [146.0, 148.44], [150.0, 150.35], [154.0, 154.97], [158.0, 157.72], [159.0, 159.95], [163.0, 163.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [96.17, 0.0, 0.0, 0.0, 78.55, 90.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 0.0, 0.0, 0.0, 48.02, 0.0, 0.0, 56.78, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 10.24], ["thunk", 7.46], ["speech", 7.36]], null, null, null, null, null, null, null, null], "duration": [2.13, 1.25, 0.69, 1.29, 11.62, 9.19, 0.44, 0.79, 0.53, 1.32, 0.86, 0.7, 1.36, 1.08, 2.76, 1.53, 0.78, 0.81, 0.24, 5.7, 1.01, 1.56, 2.44, 0.35, 0.97, -0.28, 0.95, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/-HPjEz0u-9Q_filtered.json b/annotations_filtered/-HPjEz0u-9Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d138c893701bac7605eccba9180f734e6c8a43b8 --- /dev/null +++ b/annotations_filtered/-HPjEz0u-9Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 38.57], [40.0, 40.49], [42.0, 41.72], [45.0, 46.25], [48.0, 57.18], [61.0, 62.72], [65.0, 65.13], [67.0, 67.19], [67.0, 67.22], [67.0, 71.83], [73.0, 74.14], [83.0, 92.16], [94.0, 115.52], [116.0, 117.41], [119.0, 119.35], [121.0, 123.85]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 53.53, 0.0, 0.0, 0.0, 0.0, 36.97, 0.0, 39.12, 37.65, 0.0, 0.0, 81.71], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["sidetone", 33.75], ["speech", 26.88], ["electric shaver, electric razor", 3.88]], null, [["speech", 51.44], ["music", 13.26], ["hum", 5.03]], [["speech", 27.98], ["thump, thud", 15.85], ["whack, thwack", 7.97]], null, null, null], "duration": [0.57, 0.49, -0.28, 1.25, 9.18, 1.72, 0.13, 0.19, 0.22, 4.83, 1.14, 9.16, 21.52, 1.41, 0.35, 2.85]} \ No newline at end of file diff --git a/annotations_filtered/-HTF_tAUtkQ_filtered.json b/annotations_filtered/-HTF_tAUtkQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35b47b23a810ae5aa0bab20d149656a19478c2b5 --- /dev/null +++ b/annotations_filtered/-HTF_tAUtkQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.56], [16.0, 16.7], [24.0, 25.49], [37.0, 37.74], [42.0, 44.02], [49.0, 49.55], [60.0, 61.55], [65.0, 66.5], [85.0, 86.61], [89.0, 96.99], [105.0, 107.99], [108.0, 108.82], [116.0, 120.75]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 49.87, 0.0, 0.0, 0.0, 0.0, 30.8, 31.19, 0.0, 31.46], "audiomae_on_audioset": [null, null, null, null, [["music", 42.14], ["throbbing", 7.54], ["hum", 7.23]], null, null, null, null, [["speech", 38.58], ["music", 33.33], ["musical instrument", 2.41]], [["music", 30.55], ["speech", 12.0], ["fly, housefly", 9.55]], null, [["speech", 33.82], ["music", 24.08], ["musical instrument", 9.47]]], "duration": [1.56, 0.7, 1.49, 0.74, 2.02, 0.55, 1.55, 1.5, 1.61, 7.99, 2.99, 0.82, 4.75]} \ No newline at end of file diff --git a/annotations_filtered/-HwMH2_-oKA_filtered.json b/annotations_filtered/-HwMH2_-oKA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/-HwMH2_-oKA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/-IIHYIZSFbk_filtered.json b/annotations_filtered/-IIHYIZSFbk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c93ec9f798a641fd5fa2974402b164e0ea29befa --- /dev/null +++ b/annotations_filtered/-IIHYIZSFbk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.31], [16.0, 16.65], [18.0, 18.32], [20.0, 22.0], [24.0, 25.14], [26.0, 29.02], [30.0, 31.62], [33.0, 35.58], [39.0, 40.61], [42.0, 42.04], [43.0, 44.49], [45.0, 45.32], [46.0, 46.6], [48.0, 49.4], [50.0, 50.63], [55.0, 56.03], [57.0, 58.41], [61.0, 62.33], [63.0, 66.8], [68.0, 68.54], [71.0, 85.16], [86.0, 86.97], [90.0, 91.61], [93.0, 93.66], [97.0, 98.49], [100.0, 100.18]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.68, 0.0, 48.27, 0.0, 56.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 63.96, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["tuning fork", 56.11], ["speech", 7.42], ["singing bowl", 4.34]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.31, 0.65, 0.32, 2.0, 1.14, 3.02, 1.62, 2.58, 1.61, 0.04, 1.49, 0.32, 0.6, 1.4, 0.63, 1.03, 1.41, 1.33, 3.8, 0.54, 14.16, 0.97, 1.61, 0.66, 1.49, 0.18]} \ No newline at end of file diff --git a/annotations_filtered/-IV-ZZwXUkw_filtered.json b/annotations_filtered/-IV-ZZwXUkw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af85df172e7e75acb26c186d4c1e0eeb169fff24 --- /dev/null +++ b/annotations_filtered/-IV-ZZwXUkw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 26.13], [29.0, 30.69], [35.0, 40.22], [41.0, 43.88], [47.0, 52.44], [52.0, 116.23], [118.0, 124.95], [125.0, 163.73]], "keep_status": [false, false, true, true, true, false, true, false], "silence_prob": [30.6, 0.0, 28.97, 29.44, 28.46, 0.0, 28.72, 0.0], "audiomae_on_audioset": [[["throbbing", 56.58], ["hum", 10.19], ["music", 9.05]], null, [["music", 33.25], ["grunt", 15.2], ["fart", 12.17]], [["breaking", 28.12], ["whack, thwack", 15.12], ["music", 8.46]], [["zipper (clothing)", 30.8], ["whack, thwack", 11.18], ["smash, crash", 7.28]], null, [["groan", 18.26], ["music", 13.46], ["whack, thwack", 11.18]], null], "duration": [17.13, 1.69, 5.22, 2.88, 5.44, 64.23, 6.95, 38.73]} \ No newline at end of file diff --git a/annotations_filtered/-IZv4Jfl6ZQ_filtered.json b/annotations_filtered/-IZv4Jfl6ZQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..462706e07ab34a221f35806bae22a99408fe689a --- /dev/null +++ b/annotations_filtered/-IZv4Jfl6ZQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.48], [11.0, 17.63], [23.0, 24.68], [28.0, 29.08], [34.0, 35.72], [38.0, 40.26], [46.0, 51.06], [58.0, 60.24], [62.0, 65.47], [67.0, 70.7], [73.0, 74.11], [80.0, 81.73], [94.0, 96.13], [98.0, 99.57], [100.0, 100.63], [102.0, 104.08]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 36.3, 0.0, 0.0, 0.0, 30.35, 30.95, 30.75, 30.32, 30.31, 0.0, 0.0, 49.64, 0.0, 0.0, 50.11], "audiomae_on_audioset": [null, [["music", 43.89], ["guitar", 13.73], ["musical instrument", 10.76]], null, null, null, [["music", 40.42], ["fart", 11.53], ["fly, housefly", 7.98]], [["music", 64.97], ["didgeridoo", 9.36], ["guitar", 3.49]], [["music", 65.27], ["musical instrument", 6.16], ["guitar", 4.76]], [["music", 74.18], ["musical instrument", 3.03], ["psychedelic rock", 2.24]], [["music", 79.02], ["theremin", 10.26], ["musical instrument", 1.99]], null, null, [["hum", 34.48], ["eruption", 10.34], ["throbbing", 10.06]], null, null, null], "duration": [0.48, 6.63, 1.68, 1.08, 1.72, 2.26, 5.06, 2.24, 3.47, 3.7, 1.11, 1.73, 2.13, 1.57, 0.63, 2.08]} \ No newline at end of file diff --git a/annotations_filtered/-Ixi48TxkaA_filtered.json b/annotations_filtered/-Ixi48TxkaA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9753da9dd391c15e775ca2d38f5761cc53365d14 --- /dev/null +++ b/annotations_filtered/-Ixi48TxkaA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.91], [4.0, 5.59], [13.0, 13.83], [17.0, 16.88], [20.0, 21.09], [23.0, 23.65], [25.0, 25.74], [27.0, 28.02], [28.0, 28.92], [29.0, 39.31], [40.0, 46.18], [48.0, 49.89], [50.0, 50.62], [52.0, 55.26], [58.0, 60.71], [62.0, 62.65], [67.0, 70.12], [76.0, 76.67], [80.0, 80.13], [83.0, 83.61], [85.0, 95.0], [96.0, 97.06], [100.0, 101.01], [103.0, 107.92], [108.0, 111.57], [113.0, 113.32], [115.0, 115.3], [117.0, 118.5], [119.0, 120.53], [123.0, 123.08], [124.0, 125.61], [127.0, 128.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.23, 80.64, 0.0, 0.0, 98.44, 65.32, 0.0, 100.0, 0.0, 0.0, 0.0, 72.16, 0.0, 0.0, 100.0, 99.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.91, 1.59, 0.83, -0.12, 1.09, 0.65, 0.74, 1.02, 0.92, 10.31, 6.18, 1.89, 0.62, 3.26, 2.71, 0.65, 3.12, 0.67, 0.13, 0.61, 10.0, 1.06, 1.01, 4.92, 3.57, 0.32, 0.3, 1.5, 1.53, 0.08, 1.61, 1.95]} \ No newline at end of file diff --git a/annotations_filtered/-JERO2LQSKc_filtered.json b/annotations_filtered/-JERO2LQSKc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2cea8436fd9602075022dea10917cd6cf9f93195 --- /dev/null +++ b/annotations_filtered/-JERO2LQSKc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.93], [4.0, 7.53], [8.0, 10.66], [12.0, 15.62], [17.0, 17.76], [21.0, 21.88], [35.0, 37.71], [44.0, 44.91], [73.0, 74.12], [76.0, 76.25], [77.0, 76.99], [87.0, 89.36], [90.0, 92.11], [105.0, 105.76], [106.0, 111.28], [112.0, 116.87], [119.0, 119.62], [120.0, 121.78], [125.0, 126.17], [128.0, 130.15], [131.0, 132.04], [138.0, 139.63], [140.0, 140.39], [147.0, 149.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 96.17, 89.54, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 77.7, 87.74, 0.0, 99.8, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.07, 3.53, 2.66, 3.62, 0.76, 0.88, 2.71, 0.91, 1.12, 0.25, -0.01, 2.36, 2.11, 0.76, 5.28, 4.87, 0.62, 1.78, 1.17, 2.15, 1.04, 1.63, 0.39, 2.17]} \ No newline at end of file diff --git a/annotations_filtered/-JNyHnAi8zk_filtered.json b/annotations_filtered/-JNyHnAi8zk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7038be175df2b36f1954f88fb078ade8fde0e50 --- /dev/null +++ b/annotations_filtered/-JNyHnAi8zk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 20.11], [20.0, 20.73], [22.0, 23.35], [24.0, 25.44], [26.0, 35.33], [39.0, 40.05], [42.0, 53.35], [54.0, 55.71], [57.0, 57.11], [59.0, 65.6], [68.0, 85.14], [91.0, 100.55], [103.0, 119.28], [121.0, 123.5], [126.0, 148.81], [149.0, 150.21], [151.0, 151.56], [153.0, 170.6]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [28.69, 0.0, 0.0, 0.0, 28.99, 0.0, 29.89, 0.0, 0.0, 28.67, 28.77, 28.61, 28.68, 29.78, 28.67, 0.0, 0.0, 29.53], "audiomae_on_audioset": [[["music", 45.86], ["speech", 33.8], ["crowd", 1.63]], null, null, null, [["music", 48.28], ["speech", 5.84], ["buzz", 2.5]], null, [["music", 56.42], ["musical instrument", 3.38], ["middle eastern music", 3.11]], null, null, [["music", 55.47], ["speech", 22.82], ["electronic music", 4.18]], [["music", 61.66], ["speech", 7.65], ["vehicle", 5.05]], [["music", 91.63], ["ice cream truck, ice cream van", 1.27], ["speech", 1.13]], [["music", 83.45], ["speech", 12.02], ["electronic music", 0.56]], [["music", 44.67], ["middle eastern music", 9.38], ["musical instrument", 6.41]], [["music", 85.64], ["electronic music", 5.03], ["speech", 1.37]], null, null, [["music", 60.08], ["speech", 15.87], ["vehicle", 1.54]]], "duration": [12.11, 0.73, 1.35, 1.44, 9.33, 1.05, 11.35, 1.71, 0.11, 6.6, 17.14, 9.55, 16.28, 2.5, 22.81, 1.21, 0.56, 17.6]} \ No newline at end of file diff --git a/annotations_filtered/-J_tiDK1tEA_filtered.json b/annotations_filtered/-J_tiDK1tEA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be1edafdf19a4549c3ea99c9fda0fe43fc0bb129 --- /dev/null +++ b/annotations_filtered/-J_tiDK1tEA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.96], [15.0, 15.3], [17.0, 17.69], [23.0, 23.55], [24.0, 25.24], [29.0, 43.02], [47.0, 46.94], [51.0, 51.53], [53.0, 53.92], [55.0, 54.78], [55.0, 54.92], [59.0, 60.49], [65.0, 65.04], [69.0, 69.97], [71.0, 71.95], [80.0, 81.5], [85.0, 85.8], [90.0, 91.18], [99.0, 99.06], [104.0, 104.5], [107.0, 108.36], [111.0, 111.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [70.3, 0.0, 0.0, 0.0, 0.0, 95.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.96, 0.3, 0.69, 0.55, 1.24, 14.02, -0.06, 0.53, 0.92, -0.22, -0.08, 1.49, 0.04, 0.97, 0.95, 1.5, 0.8, 1.18, 0.06, 0.5, 1.36, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/-JbSkxI2DrY_filtered.json b/annotations_filtered/-JbSkxI2DrY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39ed9b0ccf53148305379d01d27121c50e11da93 --- /dev/null +++ b/annotations_filtered/-JbSkxI2DrY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.03], [18.0, 18.1], [18.0, 19.09], [48.0, 48.42], [52.0, 53.38], [56.0, 56.96], [59.0, 59.91], [60.0, 61.86], [82.0, 82.59], [83.0, 88.16], [118.0, 118.99], [137.0, 140.41], [143.0, 148.85], [152.0, 153.25], [159.0, 159.76], [162.0, 162.13]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.6, 0.0, 30.31, 34.28, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 47.49], ["sidetone", 8.16], ["stomach rumble", 4.92]], null, [["music", 50.4], ["boing", 11.41], ["fart", 9.1]], [["music", 39.37], ["speech", 21.8], ["sidetone", 3.68]], null, null, null], "duration": [1.03, 0.1, 1.09, 0.42, 1.38, 0.96, 0.91, 1.86, 0.59, 5.16, 0.99, 3.41, 5.85, 1.25, 0.76, 0.13]} \ No newline at end of file diff --git a/annotations_filtered/-Jf-E7oEguU_filtered.json b/annotations_filtered/-Jf-E7oEguU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1cd507b521785b9cd717b45b43c4bd6a429b3224 --- /dev/null +++ b/annotations_filtered/-Jf-E7oEguU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 94.05]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [88.05]} \ No newline at end of file diff --git a/annotations_filtered/-JhNO_E3aEE_filtered.json b/annotations_filtered/-JhNO_E3aEE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45bc1e7124ee5fe53fe1920cf55cb47b12142924 --- /dev/null +++ b/annotations_filtered/-JhNO_E3aEE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.03], [7.0, 7.7], [8.0, 8.18], [10.0, 10.69], [12.0, 12.23], [14.0, 14.5], [24.0, 24.92], [26.0, 29.08], [30.0, 29.83], [31.0, 31.11], [32.0, 31.85], [33.0, 33.91], [38.0, 44.12], [45.0, 45.59], [46.0, 47.22], [48.0, 49.91], [51.0, 52.44], [54.0, 67.9], [69.0, 73.95], [76.0, 76.25], [77.0, 82.76], [84.0, 83.98], [85.0, 88.94], [91.0, 93.24], [94.0, 94.91], [96.0, 96.23], [97.0, 100.84], [102.0, 102.86], [104.0, 104.73], [106.0, 107.47], [112.0, 113.88], [115.0, 116.78], [118.0, 118.57], [119.0, 121.81], [123.0, 132.49], [134.0, 134.79], [135.0, 180.39], [181.0, 185.43], [187.0, 191.66], [193.0, 196.94], [200.0, 204.26], [209.0, 211.94], [214.0, 218.13], [218.0, 220.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.56, 0.0, 0.0, 0.0, 0.0, 45.65, 0.0, 0.0, 0.0, 0.0, 64.52, 45.75, 0.0, 96.77, 0.0, 58.89, 82.61, 0.0, 0.0, 99.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.0, 97.83, 0.0, 0.0, 99.31, 94.37, 81.71, 79.94, 81.17, 72.75, 65.32], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 73.25], ["thunk", 3.4], ["inside, small room", 1.41]], null, null, null, null, [["speech", 48.32], ["heart sounds, heartbeat", 12.75], ["stomach rumble", 11.88]], null, null, null, null, null, [["hum", 46.92], ["mains hum", 17.11], ["speech", 7.97]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.03, 0.7, 0.18, 0.69, 0.23, 0.5, 0.92, 3.08, -0.17, 0.11, -0.15, 0.91, 6.12, 0.59, 1.22, 1.91, 1.44, 13.9, 4.95, 0.25, 5.76, -0.02, 3.94, 2.24, 0.91, 0.23, 3.84, 0.86, 0.73, 1.47, 1.88, 1.78, 0.57, 2.81, 9.49, 0.79, 45.39, 4.43, 4.66, 3.94, 4.26, 2.94, 4.13, 2.75]} \ No newline at end of file diff --git a/annotations_filtered/-Jzi-2lYWEw_filtered.json b/annotations_filtered/-Jzi-2lYWEw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d95c9abd6eb3180185be09b220290ab0c10158a --- /dev/null +++ b/annotations_filtered/-Jzi-2lYWEw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.66], [11.0, 12.65], [13.0, 13.29], [16.0, 16.85], [22.0, 21.78], [25.0, 26.16], [27.0, 27.26], [29.0, 29.83], [31.0, 31.82], [32.0, 33.02], [36.0, 37.88], [39.0, 42.28], [44.0, 43.73], [50.0, 51.53], [61.0, 63.36], [66.0, 67.0], [75.0, 77.52], [91.0, 93.48], [98.0, 97.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 0.0, 0.0, 100.0, 0.0, 99.84, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.66, 1.65, 0.29, 0.85, -0.22, 1.16, 0.26, 0.83, 0.82, 1.02, 1.88, 3.28, -0.27, 1.53, 2.36, 1.0, 2.52, 2.48, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/-KOG8edoC00_filtered.json b/annotations_filtered/-KOG8edoC00_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a78a18a175486aefb11c8514feb06fce084ee0b --- /dev/null +++ b/annotations_filtered/-KOG8edoC00_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 26.15], [29.0, 31.62], [33.0, 32.86], [35.0, 50.65], [57.0, 58.72], [60.0, 63.93], [66.0, 66.95], [67.0, 67.83], [68.0, 69.96], [70.0, 70.61], [72.0, 74.58], [75.0, 87.12], [88.0, 89.9], [94.0, 94.8], [98.0, 101.04], [102.0, 102.84], [111.0, 111.4], [115.0, 115.45], [116.0, 116.65], [118.0, 120.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [99.99, 100.0, 0.0, 99.21, 0.0, 56.03, 0.0, 0.0, 0.0, 0.0, 99.26, 68.54, 0.0, 0.0, 95.91, 0.0, 0.0, 0.0, 0.0, 31.48], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.13], ["foghorn", 13.24], ["musical instrument", 7.35]]], "duration": [3.15, 2.62, -0.14, 15.65, 1.72, 3.93, 0.95, 0.83, 1.96, 0.61, 2.58, 12.12, 1.9, 0.8, 3.04, 0.84, 0.4, 0.45, 0.65, 2.39]} \ No newline at end of file diff --git a/annotations_filtered/-KVNfZo-cfc_filtered.json b/annotations_filtered/-KVNfZo-cfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2466a276d874959d071383550cfa5929ce89bc95 --- /dev/null +++ b/annotations_filtered/-KVNfZo-cfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.86], [4.0, 5.04], [6.0, 6.08], [10.0, 10.3], [11.0, 11.26], [12.0, 12.56], [15.0, 15.16], [18.0, 18.81], [21.0, 22.84], [23.0, 25.29], [26.0, 29.89], [33.0, 34.5], [36.0, 36.78], [37.0, 37.98], [39.0, 39.39], [40.0, 43.23], [46.0, 46.89], [48.0, 48.2], [49.0, 49.25], [50.0, 50.18], [50.0, 52.25], [55.0, 55.22], [56.0, 58.29], [60.0, 60.27], [63.0, 63.54], [66.0, 66.61], [71.0, 71.76], [91.0, 91.54], [93.0, 94.46], [95.0, 96.9], [98.0, 99.03], [100.0, 101.51], [102.0, 104.38], [106.0, 107.45], [109.0, 111.77], [113.0, 116.13], [118.0, 118.77], [120.0, 120.95], [122.0, 123.48], [126.0, 127.28], [128.0, 129.29], [131.0, 133.98], [136.0, 137.96], [139.0, 147.39], [151.0, 152.29], [155.0, 155.92], [158.0, 161.6], [168.0, 169.25], [171.0, 171.21], [173.0, 173.45], [175.0, 176.98], [180.0, 184.87], [186.0, 188.87], [190.0, 191.42], [193.0, 194.78], [196.0, 196.45], [198.0, 199.35], [201.0, 201.55], [203.0, 204.31], [205.0, 206.95], [209.0, 209.39], [210.0, 224.24], [228.0, 229.17], [231.0, 235.28], [236.0, 239.79], [241.0, 242.06], [244.0, 248.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.05, 94.37, 0.0, 0.0, 0.0, 0.0, 56.93, 0.0, 0.0, 0.0, 0.0, 96.29, 0.0, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.33, 0.0, 99.59, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 0.0, 96.42, 0.0, 0.0, 97.73, 0.0, 0.0, 0.0, 0.0, 99.95, 65.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.2, 0.0, 85.17, 92.15, 0.0, 84.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["whale vocalization", 60.93], ["speech", 6.52], ["sidetone", 5.62]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 38.5], ["mains hum", 24.84], ["throbbing", 16.21]], null, null, null, null, null], "duration": [0.86, 1.04, 0.08, 0.3, 0.26, 0.56, 0.16, 0.81, 1.84, 2.29, 3.89, 1.5, 0.78, 0.98, 0.39, 3.23, 0.89, 0.2, 0.25, 0.18, 2.25, 0.22, 2.29, 0.27, 0.54, 0.61, 0.76, 0.54, 1.46, 1.9, 1.03, 1.51, 2.38, 1.45, 2.77, 3.13, 0.77, 0.95, 1.48, 1.28, 1.29, 2.98, 1.96, 8.39, 1.29, 0.92, 3.6, 1.25, 0.21, 0.45, 1.98, 4.87, 2.87, 1.42, 1.78, 0.45, 1.35, 0.55, 1.31, 1.95, 0.39, 14.24, 1.17, 4.28, 3.79, 1.06, 4.41]} \ No newline at end of file diff --git a/annotations_filtered/-KW0wz1xBfw_filtered.json b/annotations_filtered/-KW0wz1xBfw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..624dedb84608a1e595f1dd53512b2cbb9acca7af --- /dev/null +++ b/annotations_filtered/-KW0wz1xBfw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.09], [17.0, 19.9], [20.0, 26.03], [26.0, 26.5], [27.0, 27.62], [28.0, 27.89], [29.0, 29.64], [32.0, 96.55], [100.0, 121.73], [122.0, 127.13], [128.0, 130.57], [132.0, 134.91], [136.0, 138.37]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 63.53, 39.72, 0.0, 0.0, 0.0, 0.0, 0.0, 36.15, 99.99, 90.95, 99.26, 60.6], "audiomae_on_audioset": [null, null, [["music", 51.35], ["theremin", 7.7], ["singing bowl", 5.05]], null, null, null, null, null, [["rumble", 19.05], ["explosion", 14.27], ["hum", 9.71]], null, null, null, null], "duration": [0.09, 2.9, 6.03, 0.5, 0.62, -0.11, 0.64, 64.55, 21.73, 5.13, 2.57, 2.91, 2.37]} \ No newline at end of file diff --git a/annotations_filtered/-Kd5zqw24S4_filtered.json b/annotations_filtered/-Kd5zqw24S4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c486c302c2843f031db152cc621c98caa59bc445 --- /dev/null +++ b/annotations_filtered/-Kd5zqw24S4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.61], [11.0, 12.63], [14.0, 15.26], [18.0, 18.74], [22.0, 22.25], [25.0, 26.42], [31.0, 34.1], [35.0, 37.03], [38.0, 41.4], [44.0, 44.29], [44.0, 47.55], [48.0, 49.1], [50.0, 55.9], [58.0, 62.18], [63.0, 70.04], [70.0, 74.61], [76.0, 79.19], [80.0, 81.18], [82.0, 88.69], [90.0, 92.37], [93.0, 95.39], [96.0, 97.53], [98.0, 100.28], [102.0, 105.97], [108.0, 110.02], [114.0, 119.18], [122.0, 125.61], [127.0, 141.07], [142.0, 146.97], [149.0, 151.78], [153.0, 153.71], [155.0, 156.49], [157.0, 159.46], [160.0, 166.94]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [48.65, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 93.45, 100.0, 0.0, 100.0, 0.0, 100.0, 99.99, 100.0, 96.04, 100.0, 0.0, 100.0, 100.0, 98.01, 0.0, 99.99, 100.0, 100.0, 99.98, 99.48, 99.76, 96.54, 99.73, 0.0, 0.0, 99.1, 99.52], "audiomae_on_audioset": [[["music", 19.87], ["smash, crash", 11.37], ["whack, thwack", 9.9]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.61, 1.63, 1.26, 0.74, 0.25, 1.42, 3.1, 2.03, 3.4, 0.29, 3.55, 1.1, 5.9, 4.18, 7.04, 4.61, 3.19, 1.18, 6.69, 2.37, 2.39, 1.53, 2.28, 3.97, 2.02, 5.18, 3.61, 14.07, 4.97, 2.78, 0.71, 1.49, 2.46, 6.94]} \ No newline at end of file diff --git a/annotations_filtered/-Koj9hvcBMk_filtered.json b/annotations_filtered/-Koj9hvcBMk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1450859ed17638a1d8bcfa004f964f709591061 --- /dev/null +++ b/annotations_filtered/-Koj9hvcBMk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.63], [25.0, 26.52], [27.0, 28.17], [37.0, 38.55], [43.0, 46.13], [47.0, 47.44], [48.0, 48.81], [51.0, 51.66], [53.0, 53.89], [56.0, 56.54], [58.0, 58.01], [59.0, 59.56], [61.0, 61.11], [77.0, 82.56], [85.0, 86.1], [86.0, 86.97], [89.0, 90.24], [98.0, 98.22], [99.0, 99.0], [104.0, 104.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.63, 1.52, 1.17, 1.55, 3.13, 0.44, 0.81, 0.66, 0.89, 0.54, 0.01, 0.56, 0.11, 5.56, 1.1, 0.97, 1.24, 0.22, 0.0, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/-Kztqrjp2yw_filtered.json b/annotations_filtered/-Kztqrjp2yw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..870359429a856e8e507fad8d094cc9d7f271302b --- /dev/null +++ b/annotations_filtered/-Kztqrjp2yw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.75], [3.0, 3.5], [5.0, 5.48], [6.0, 6.67], [8.0, 90.78], [92.0, 92.53], [94.0, 97.19], [99.0, 102.49], [106.0, 107.77], [111.0, 114.93], [116.0, 117.59], [119.0, 122.47], [127.0, 129.19], [133.0, 133.78], [136.0, 140.86], [144.0, 144.32], [147.0, 160.79], [162.0, 175.36], [177.0, 184.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.55, 99.84, 0.0, 100.0, 0.0, 99.76, 81.0, 0.0, 59.15, 0.0, 30.67, 32.25, 55.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 38.68], ["cattle, bovinae", 31.7], ["moo", 22.6]], [["music", 14.27], ["fly, housefly", 11.78], ["sidetone", 7.68]], null], "duration": [-0.25, 0.5, 0.48, 0.67, 82.78, 0.53, 3.19, 3.49, 1.77, 3.93, 1.59, 3.47, 2.19, 0.78, 4.86, 0.32, 13.79, 13.36, 7.47]} \ No newline at end of file diff --git a/annotations_filtered/-L3D0BL9ieA_filtered.json b/annotations_filtered/-L3D0BL9ieA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4a3bf4dcc65828bcbfd5e909a7d4c7b4069c930 --- /dev/null +++ b/annotations_filtered/-L3D0BL9ieA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 22.15], [23.0, 24.81], [27.0, 33.07], [36.0, 36.37], [38.0, 40.42], [42.0, 46.63], [50.0, 64.93], [70.0, 70.21], [76.0, 94.61], [95.0, 95.2], [95.0, 120.33], [122.0, 122.59]], "keep_status": [false, false, true, false, false, true, true, false, true, false, true, false], "silence_prob": [30.99, 0.0, 46.54, 0.0, 51.88, 38.17, 29.6, 0.0, 30.21, 0.0, 29.99, 0.0], "audiomae_on_audioset": [[["speech", 58.47], ["hum", 8.76], ["music", 4.16]], null, [["music", 59.63], ["synthesizer", 5.1], ["electronic music", 3.78]], null, null, [["speech", 20.54], ["cattle, bovinae", 18.53], ["livestock, farm animals, working animals", 8.28]], [["speech", 30.74], ["music", 11.83], ["buzz", 8.28]], null, [["music", 30.74], ["animal", 17.42], ["speech", 7.46]], null, [["music", 34.72], ["whip", 10.58], ["whack, thwack", 10.3]], null], "duration": [15.15, 1.81, 6.07, 0.37, 2.42, 4.63, 14.93, 0.21, 18.61, 0.2, 25.33, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/-L9EZRMgmXM_filtered.json b/annotations_filtered/-L9EZRMgmXM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e87244e6d2ee32900fb1791a4bb65552f1ab8c89 --- /dev/null +++ b/annotations_filtered/-L9EZRMgmXM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 45.27], [54.0, 64.81], [68.0, 68.98], [73.0, 73.9], [74.0, 76.77], [80.0, 82.16], [83.0, 85.77], [89.0, 89.38], [91.0, 91.59], [94.0, 95.0], [97.0, 97.31], [100.0, 101.7], [104.0, 104.58], [107.0, 108.09], [110.0, 110.91], [112.0, 113.34], [117.0, 117.37], [119.0, 119.72]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [42.58, 39.82, 0.0, 0.0, 69.07, 82.97, 66.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 35.7], ["speech", 26.83], ["throbbing", 5.76]], [["insect", 17.09], ["hum", 15.07], ["fly, housefly", 11.83]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.27, 10.81, 0.98, 0.9, 2.77, 2.16, 2.77, 0.38, 0.59, 1.0, 0.31, 1.7, 0.58, 1.09, 0.91, 1.34, 0.37, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/-LCqZeb1de0_filtered.json b/annotations_filtered/-LCqZeb1de0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ff95584a343a0a3669a7a61562dbee0d3425469 --- /dev/null +++ b/annotations_filtered/-LCqZeb1de0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.48], [9.0, 10.02], [14.0, 15.04], [16.0, 20.28], [23.0, 23.09], [26.0, 26.22], [28.0, 28.29], [33.0, 35.14], [36.0, 38.13], [46.0, 47.95], [54.0, 62.11], [69.0, 69.99], [75.0, 88.37], [90.0, 90.59], [92.0, 92.67], [95.0, 103.05], [106.0, 108.55], [112.0, 113.0], [116.0, 123.25], [126.0, 127.82], [134.0, 135.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 88.83, 0.0, 0.0, 0.0, 89.9, 60.89, 0.0, 92.97, 0.0, 99.98, 0.0, 0.0, 99.88, 99.95, 0.0, 83.7, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.48, 1.02, 1.04, 4.28, 0.09, 0.22, 0.29, 2.14, 2.13, 1.95, 8.11, 0.99, 13.37, 0.59, 0.67, 8.05, 2.55, 1.0, 7.25, 1.82, 1.94]} \ No newline at end of file diff --git a/annotations_filtered/-LjxKR0q7Yo_filtered.json b/annotations_filtered/-LjxKR0q7Yo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef1b6a322f6e9a4481e1b317bc7466ecd312f104 --- /dev/null +++ b/annotations_filtered/-LjxKR0q7Yo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.89], [23.0, 29.73], [32.0, 38.91], [41.0, 42.5], [43.0, 59.48], [60.0, 63.26], [64.0, 67.22], [69.0, 83.34], [87.0, 91.47], [97.0, 109.29], [113.0, 114.61]], "keep_status": [false, true, true, false, true, true, false, true, true, true, false], "silence_prob": [0.0, 36.16, 31.91, 0.0, 34.94, 39.4, 30.5, 32.06, 44.57, 32.75, 0.0], "audiomae_on_audioset": [null, [["speech", 31.97], ["animal", 22.74], ["livestock, farm animals, working animals", 5.04]], [["speech", 34.84], ["fly, housefly", 11.78], ["insect", 8.35]], null, [["animal", 41.98], ["livestock, farm animals, working animals", 6.87], ["goose", 6.03]], [["speech", 25.44], ["music", 15.09], ["animal", 8.5]], [["speech", 61.0], ["music", 19.53], ["hum", 1.19]], [["speech", 45.54], ["mosquito", 5.83], ["explosion", 4.28]], [["mosquito", 29.76], ["whale vocalization", 17.4], ["fly, housefly", 16.54]], [["speech", 30.9], ["animal", 27.47], ["bow-wow", 3.91]], null], "duration": [0.89, 6.73, 6.91, 1.5, 16.48, 3.26, 3.22, 14.34, 4.47, 12.29, 1.61]} \ No newline at end of file diff --git a/annotations_filtered/-Lrndfrc9yU_filtered.json b/annotations_filtered/-Lrndfrc9yU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/-Lrndfrc9yU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/-Luy502C920_filtered.json b/annotations_filtered/-Luy502C920_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..03d39c31b44cb837becad5eea59fb910b63726ef --- /dev/null +++ b/annotations_filtered/-Luy502C920_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.57], [29.0, 29.66], [49.0, 49.69], [57.0, 58.35], [62.0, 62.55], [67.0, 71.07], [72.0, 72.4], [78.0, 93.34], [94.0, 122.05]], "keep_status": [false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 50.66, 0.0, 32.88, 31.5], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 59.67], ["trance music", 7.81], ["techno", 5.64]], [["music", 35.67], ["skidding", 18.6], ["vehicle", 13.64]]], "duration": [1.57, 0.66, 0.69, 1.35, 0.55, 4.07, 0.4, 15.34, 28.05]} \ No newline at end of file diff --git a/annotations_filtered/-MEOfLvOuas_filtered.json b/annotations_filtered/-MEOfLvOuas_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ddb969369a0c1ba9ae1fe66e82e1cc8e41f99d8 --- /dev/null +++ b/annotations_filtered/-MEOfLvOuas_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.54], [19.0, 20.06], [21.0, 21.56], [22.0, 25.19], [30.0, 29.98], [33.0, 33.34], [37.0, 38.06], [42.0, 42.42], [47.0, 48.37], [50.0, 51.14], [52.0, 53.22], [67.0, 67.91], [69.0, 82.17], [87.0, 87.34], [90.0, 91.18]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.21, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 20.6], ["hum", 16.94], ["music", 10.94]], null, null, null, null, null, null, null, null, [["music", 47.94], ["theremin", 15.21], ["hum", 6.29]], null, null], "duration": [1.54, 1.06, 0.56, 3.19, -0.02, 0.34, 1.06, 0.42, 1.37, 1.14, 1.22, 0.91, 13.17, 0.34, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/-MNpOKICOx8_filtered.json b/annotations_filtered/-MNpOKICOx8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f57ea9414141946842d323b760118425160aab3 --- /dev/null +++ b/annotations_filtered/-MNpOKICOx8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.3], [5.0, 7.89], [10.0, 9.78], [11.0, 11.89], [18.0, 19.74], [22.0, 25.59], [26.0, 26.35], [34.0, 35.4], [38.0, 37.99], [48.0, 49.69], [50.0, 50.25], [51.0, 52.41], [54.0, 57.33], [59.0, 60.99], [63.0, 63.59], [64.0, 64.35], [66.0, 77.57], [80.0, 81.77], [86.0, 93.02], [93.0, 94.74], [96.0, 96.84], [97.0, 100.74], [103.0, 103.17], [106.0, 106.57], [112.0, 113.22], [114.0, 117.83], [118.0, 119.85], [121.0, 121.36], [122.0, 123.42], [124.0, 132.61], [133.0, 134.64], [138.0, 138.86], [140.0, 140.0]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 44.26, 0.0, 0.0, 0.0, 36.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.71, 0.0, 0.0, 0.0, 45.49, 0.0, 67.13, 0.0, 0.0, 95.78, 0.0, 0.0, 0.0, 74.29, 0.0, 0.0, 0.0, 65.32, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["sidetone", 27.19], ["speech", 12.83], ["fly, housefly", 12.71]], null, null, null, [["music", 22.44], ["speech", 13.4], ["frog", 11.1]], null, null, null, null, null, null, null, null, null, null, [["thunk", 77.32], ["music", 10.1], ["mosquito", 3.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.3, 2.89, -0.22, 0.89, 1.74, 3.59, 0.35, 1.4, -0.01, 1.69, 0.25, 1.41, 3.33, 1.99, 0.59, 0.35, 11.57, 1.77, 7.02, 1.74, 0.84, 3.74, 0.17, 0.57, 1.22, 3.83, 1.85, 0.36, 1.42, 8.61, 1.64, 0.86, 0.0]} \ No newline at end of file diff --git a/annotations_filtered/-MQNNzaEt2s_filtered.json b/annotations_filtered/-MQNNzaEt2s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71325a7c5cd5fc7d250cb411e19a4af76a90c59d --- /dev/null +++ b/annotations_filtered/-MQNNzaEt2s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.77], [28.0, 28.26], [29.0, 30.54], [33.0, 33.91]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.77, 0.26, 1.54, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/-Mmq6Kmd75I_filtered.json b/annotations_filtered/-Mmq6Kmd75I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..484a0a18769e9a405b8716e52f98c667d88da1d4 --- /dev/null +++ b/annotations_filtered/-Mmq6Kmd75I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.46], [19.0, 19.16], [21.0, 21.29], [24.0, 24.81], [27.0, 29.86], [41.0, 43.6], [44.0, 45.33], [47.0, 49.3], [51.0, 53.65], [56.0, 56.27], [66.0, 67.2], [69.0, 70.85], [73.0, 74.56], [76.0, 77.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 42.06, 62.78, 0.0, 95.23, 83.88, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 63.04], ["music", 8.18], ["hum", 2.86]], null, null, null, null, null, null, null, null, null], "duration": [1.46, 0.16, 0.29, 0.81, 2.86, 2.6, 1.33, 2.3, 2.65, 0.27, 1.2, 1.85, 1.56, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/-N2mhlvygq0_filtered.json b/annotations_filtered/-N2mhlvygq0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91f79c787c19bfb7207caccd5868b1952589e183 --- /dev/null +++ b/annotations_filtered/-N2mhlvygq0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.8], [12.0, 16.65], [24.0, 27.16], [36.0, 36.05], [36.0, 38.15], [45.0, 45.74], [56.0, 57.01], [69.0, 75.0], [75.0, 109.05], [121.0, 121.68], [122.0, 122.82], [125.0, 125.04], [126.0, 125.98]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 45.98, 66.51, 0.0, 87.37, 0.0, 0.0, 78.89, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 23.09], ["cattle, bovinae", 22.59], ["animal", 16.78]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.8, 4.65, 3.16, 0.05, 2.15, 0.74, 1.01, 6.0, 34.05, 0.68, 0.82, 0.04, -0.02]} \ No newline at end of file diff --git a/annotations_filtered/-NW-w5Z_vpk_filtered.json b/annotations_filtered/-NW-w5Z_vpk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e62efd9fdb5e352644ddf8f47754ef178c0e6d6c --- /dev/null +++ b/annotations_filtered/-NW-w5Z_vpk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.64], [12.0, 12.09], [13.0, 15.82], [19.0, 20.21], [22.0, 28.75], [31.0, 34.01], [35.0, 35.26], [36.0, 36.46], [40.0, 43.39], [45.0, 53.7], [55.0, 80.23], [83.0, 83.4], [88.0, 113.09], [119.0, 120.56], [121.0, 122.3]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 99.92, 0.0, 81.53, 99.96, 0.0, 0.0, 42.28, 50.11, 46.33, 0.0, 40.11, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 24.14], ["hum", 23.5], ["throbbing", 15.63]], null, [["music", 44.83], ["synthesizer", 17.53], ["ambient music", 6.2]], null, [["speech", 26.87], ["music", 17.49], ["hum", 10.92]], null, null], "duration": [0.64, 0.09, 2.82, 1.21, 6.75, 3.01, 0.26, 0.46, 3.39, 8.7, 25.23, 0.4, 25.09, 1.56, 1.3]} \ No newline at end of file diff --git a/annotations_filtered/-NeY5tqk1N8_filtered.json b/annotations_filtered/-NeY5tqk1N8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f98a64d99d5a30067ea602640357fef3cf250d6 --- /dev/null +++ b/annotations_filtered/-NeY5tqk1N8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.57], [3.0, 4.56], [9.0, 15.72], [17.0, 18.54], [19.0, 21.86], [23.0, 25.0], [29.0, 30.74], [36.0, 36.93], [38.0, 39.39], [42.0, 43.24], [44.0, 44.98], [53.0, 54.16], [55.0, 58.24], [61.0, 64.37], [68.0, 68.77], [70.0, 69.74], [73.0, 74.98], [77.0, 78.46], [80.0, 84.87], [85.0, 86.86], [90.0, 91.12], [96.0, 95.82], [98.0, 98.1], [98.0, 99.3], [106.0, 105.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.99, 0.0, 91.47, 90.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.44, 62.37, 0.0, 0.0, 0.0, 0.0, 98.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.57, 1.56, 6.72, 1.54, 2.86, 2.0, 1.74, 0.93, 1.39, 1.24, 0.98, 1.16, 3.24, 3.37, 0.77, -0.26, 1.98, 1.46, 4.87, 1.86, 1.12, -0.18, 0.1, 1.3, -0.39]} \ No newline at end of file diff --git a/annotations_filtered/-NgmhVRFApQ_filtered.json b/annotations_filtered/-NgmhVRFApQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a48d4de11b2e7ba2d57e54531027047acab5b974 --- /dev/null +++ b/annotations_filtered/-NgmhVRFApQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.31], [5.0, 5.71], [10.0, 12.53], [14.0, 14.77], [16.0, 19.43], [21.0, 21.83], [22.0, 28.83], [31.0, 31.9], [33.0, 33.17], [33.0, 35.9], [36.0, 44.36], [46.0, 46.85], [48.0, 49.13], [52.0, 54.5], [56.0, 57.69], [59.0, 60.45], [62.0, 62.83], [69.0, 70.38], [71.0, 73.55], [75.0, 76.5], [81.0, 81.55], [84.0, 85.4], [86.0, 87.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 99.05, 0.0, 70.02, 0.0, 0.0, 99.68, 57.89, 0.0, 0.0, 99.71, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.31, 0.71, 2.53, 0.77, 3.43, 0.83, 6.83, 0.9, 0.17, 2.9, 8.36, 0.85, 1.13, 2.5, 1.69, 1.45, 0.83, 1.38, 2.55, 1.5, 0.55, 1.4, 1.24]} \ No newline at end of file diff --git a/annotations_filtered/-Nr56-RD_g8_filtered.json b/annotations_filtered/-Nr56-RD_g8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42e1726f7ff987c84ec2dd5aa61f8277ebdbf078 --- /dev/null +++ b/annotations_filtered/-Nr56-RD_g8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.44], [14.0, 14.91], [16.0, 15.84], [29.0, 37.56], [53.0, 55.14], [64.0, 65.15]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 91.3, 62.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.44, 0.91, -0.16, 8.56, 2.14, 1.15]} \ No newline at end of file diff --git a/annotations_filtered/-NtpPdMGluE_filtered.json b/annotations_filtered/-NtpPdMGluE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5117dd494e46138f7042642d2058c11769b66a8b --- /dev/null +++ b/annotations_filtered/-NtpPdMGluE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.98], [4.0, 5.85], [6.0, 7.08], [8.0, 8.63], [10.0, 17.52], [20.0, 31.73], [33.0, 34.79], [36.0, 59.04], [60.0, 62.6], [64.0, 64.74], [66.0, 66.56], [68.0, 76.98], [77.0, 86.95], [88.0, 91.39], [93.0, 95.61], [97.0, 114.03], [116.0, 119.45], [121.0, 135.67], [140.0, 142.15], [146.0, 147.72], [152.0, 152.54], [157.0, 158.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 71.43, 59.51, 0.0, 88.46, 98.27, 0.0, 0.0, 92.15, 99.1, 48.48, 51.6, 60.32, 67.51, 73.97, 60.51, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["radio", 21.87], ["sidetone", 21.61], ["speech", 17.95]], null, null, null, null, null, null, null, null], "duration": [-0.02, 1.85, 1.08, 0.63, 7.52, 11.73, 1.79, 23.04, 2.6, 0.74, 0.56, 8.98, 9.95, 3.39, 2.61, 17.03, 3.45, 14.67, 2.15, 1.72, 0.54, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/-Nzbwerwks8_filtered.json b/annotations_filtered/-Nzbwerwks8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcd6fecc044274505cb2ecf33e3948d318967d6a --- /dev/null +++ b/annotations_filtered/-Nzbwerwks8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.93], [5.0, 5.86], [6.0, 12.97], [18.0, 19.21], [20.0, 23.06], [26.0, 28.95], [34.0, 39.63], [42.0, 42.09], [43.0, 44.83], [50.0, 54.41], [55.0, 73.7], [79.0, 82.31], [84.0, 84.86], [86.0, 92.77], [98.0, 101.33], [105.0, 108.51], [115.0, 119.62]], "keep_status": [false, false, false, false, true, true, true, false, false, false, false, false, false, true, true, true, false], "silence_prob": [0.0, 0.0, 39.11, 0.0, 34.11, 33.41, 31.43, 0.0, 0.0, 31.21, 30.91, 30.75, 0.0, 31.68, 47.54, 36.56, 32.04], "audiomae_on_audioset": [null, null, [["speech", 47.52], ["music", 15.35], ["hum", 12.1]], null, [["speech", 52.2], ["music", 8.99], ["sidetone", 8.27]], [["speech", 57.53], ["fly, housefly", 6.35], ["music", 3.85]], [["speech", 22.43], ["fart", 12.6], ["cattle, bovinae", 9.65]], null, null, [["speech", 71.3], ["music", 6.04], ["explosion", 2.52]], [["speech", 70.13], ["breaking", 8.66], ["music", 4.96]], [["speech", 63.9], ["music", 4.9], ["explosion", 3.03]], null, [["whack, thwack", 26.01], ["music", 22.96], ["groan", 9.42]], [["throbbing", 19.86], ["fly, housefly", 16.49], ["music", 11.74]], [["music", 42.78], ["hum", 13.51], ["didgeridoo", 6.94]], [["music", 41.78], ["speech", 22.02], ["drum machine", 6.29]]], "duration": [0.93, 0.86, 6.97, 1.21, 3.06, 2.95, 5.63, 0.09, 1.83, 4.41, 18.7, 3.31, 0.86, 6.77, 3.33, 3.51, 4.62]} \ No newline at end of file diff --git a/annotations_filtered/-O3_WO63fhU_filtered.json b/annotations_filtered/-O3_WO63fhU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d32906f4241e2d6d94a52e7e84003882015195bf --- /dev/null +++ b/annotations_filtered/-O3_WO63fhU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.96], [6.0, 5.81], [11.0, 11.48], [15.0, 14.79], [23.0, 28.34], [35.0, 38.77], [41.0, 43.11], [50.0, 54.35], [59.0, 61.91], [67.0, 72.91], [75.0, 75.74], [78.0, 78.73], [80.0, 87.57], [89.0, 89.16], [95.0, 97.93], [101.0, 101.56], [107.0, 115.45], [119.0, 121.22], [125.0, 126.23], [130.0, 130.22], [133.0, 133.29], [134.0, 135.7], [140.0, 176.47], [178.0, 178.19], [182.0, 185.33], [187.0, 191.17], [192.0, 192.94], [194.0, 194.85], [204.0, 204.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.07, 44.99, 37.25, 39.18, 40.38, 37.86, 0.0, 0.0, 40.38, 0.0, 40.88, 0.0, 38.09, 38.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.11, 36.88, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 79.66], ["musical instrument", 2.0], ["didgeridoo", 0.96]], [["music", 65.05], ["hum", 8.31], ["musical instrument", 2.7]], [["music", 68.88], ["synthesizer", 4.56], ["musical instrument", 2.29]], [["music", 61.69], ["carnatic music", 11.77], ["singing", 2.48]], [["music", 74.92], ["didgeridoo", 1.85], ["middle eastern music", 1.02]], [["music", 78.6], ["middle eastern music", 2.74], ["singing", 1.72]], null, null, [["music", 78.02], ["didgeridoo", 1.96], ["throbbing", 1.77]], null, [["music", 54.3], ["synthesizer", 5.09], ["hum", 4.18]], null, [["music", 84.71], ["synthetic singing", 2.81], ["male singing", 1.42]], [["music", 83.54], ["singing", 2.6], ["christian music", 0.79]], null, null, null, null, null, null, [["music", 57.63], ["didgeridoo", 7.66], ["theremin", 4.37]], [["music", 65.22], ["carnatic music", 15.29], ["musical instrument", 4.53]], null, null, null], "duration": [0.96, -0.19, 0.48, -0.21, 5.34, 3.77, 2.11, 4.35, 2.91, 5.91, 0.74, 0.73, 7.57, 0.16, 2.93, 0.56, 8.45, 2.22, 1.23, 0.22, 0.29, 1.7, 36.47, 0.19, 3.33, 4.17, 0.94, 0.85, 0.11]} \ No newline at end of file diff --git a/annotations_filtered/-OMiOIbouaA_filtered.json b/annotations_filtered/-OMiOIbouaA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a5e4d69b700409de6d051cb8cac0bfa73cd2450 --- /dev/null +++ b/annotations_filtered/-OMiOIbouaA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.3], [12.0, 13.78], [15.0, 16.83], [17.0, 26.6], [29.0, 41.88], [43.0, 44.95], [46.0, 48.12], [57.0, 61.13], [62.0, 63.8], [76.0, 76.89], [80.0, 80.7], [83.0, 85.8], [89.0, 89.38], [90.0, 90.83], [92.0, 92.16], [97.0, 98.05], [98.0, 102.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [96.17, 0.0, 0.0, 96.29, 91.64, 0.0, 93.76, 81.53, 0.0, 0.0, 0.0, 87.55, 0.0, 0.0, 0.0, 0.0, 46.02], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.53], ["speech", 9.03], ["telephone", 2.99]]], "duration": [3.3, 1.78, 1.83, 9.6, 12.88, 1.95, 2.12, 4.13, 1.8, 0.89, 0.7, 2.8, 0.38, 0.83, 0.16, 1.05, 4.69]} \ No newline at end of file diff --git a/annotations_filtered/-ON8ZTCiuYo_filtered.json b/annotations_filtered/-ON8ZTCiuYo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..075a770f0b5a1d786258cbf7c132015196f070d0 --- /dev/null +++ b/annotations_filtered/-ON8ZTCiuYo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.47], [22.0, 22.92], [25.0, 30.74], [32.0, 38.31], [39.0, 39.31], [41.0, 52.03], [55.0, 57.35], [60.0, 65.16], [65.0, 66.8], [69.0, 72.5], [73.0, 75.17], [76.0, 81.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 80.82, 85.17, 0.0, 86.82, 38.59, 56.33, 0.0, 66.15, 57.09, 68.15], "audiomae_on_audioset": [null, null, null, null, null, null, [["sine wave", 32.95], ["chirp tone", 25.13], ["tuning fork", 17.12]], null, null, null, null, null], "duration": [1.47, 0.92, 5.74, 6.31, 0.31, 11.03, 2.35, 5.16, 1.8, 3.5, 2.17, 5.53]} \ No newline at end of file diff --git a/annotations_filtered/-OUuZojE3aM_filtered.json b/annotations_filtered/-OUuZojE3aM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa20e5defcd05ad72501ff83db73a29986ee2e84 --- /dev/null +++ b/annotations_filtered/-OUuZojE3aM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 33.02], [33.0, 35.07], [36.0, 100.26], [101.0, 101.66], [102.0, 104.99], [106.0, 132.7], [133.0, 144.86], [146.0, 161.6], [162.0, 161.64], [162.0, 161.72], [162.0, 161.77], [162.0, 162.01], [162.0, 162.06], [162.0, 162.13], [162.0, 162.16], [162.0, 162.3], [162.0, 162.45], [162.0, 162.48], [164.0, 168.07]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 70.16, 0.0, 0.0, 38.05, 44.2, 63.74, 43.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.26], "audiomae_on_audioset": [null, null, null, null, [["speech", 65.43], ["music", 11.35], ["inside, small room", 3.15]], [["music", 33.49], ["synthesizer", 10.78], ["sine wave", 7.62]], null, [["music", 49.94], ["theremin", 12.22], ["singing bowl", 7.74]], null, null, null, null, null, null, null, null, null, null, [["whimper", 30.1], ["speech", 8.43], ["groan", 7.73]]], "duration": [1.02, 2.07, 64.26, 0.66, 2.99, 26.7, 11.86, 15.6, -0.36, -0.28, -0.23, 0.01, 0.06, 0.13, 0.16, 0.3, 0.45, 0.48, 4.07]} \ No newline at end of file diff --git a/annotations_filtered/-Ot948zIr0s_filtered.json b/annotations_filtered/-Ot948zIr0s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26b9d326e2c5cdcc358bdfc769e8dd43c7850603 --- /dev/null +++ b/annotations_filtered/-Ot948zIr0s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.79], [4.0, 4.46], [13.0, 13.61], [16.0, 16.61], [17.0, 17.76], [19.0, 18.94], [20.0, 20.75], [23.0, 24.22], [26.0, 28.92], [30.0, 30.1], [32.0, 32.12], [47.0, 48.84], [55.0, 56.08], [59.0, 59.44], [62.0, 63.66], [69.0, 69.03], [84.0, 84.84], [88.0, 88.77], [94.0, 94.91], [97.0, 97.97], [103.0, 103.13], [106.0, 107.01], [109.0, 110.37], [116.0, 117.56], [119.0, 120.41], [123.0, 124.75], [127.0, 128.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.79, 0.46, 0.61, 0.61, 0.76, -0.06, 0.75, 1.22, 2.92, 0.1, 0.12, 1.84, 1.08, 0.44, 1.66, 0.03, 0.84, 0.77, 0.91, 0.97, 0.13, 1.01, 1.37, 1.56, 1.41, 1.75, 1.75]} \ No newline at end of file diff --git a/annotations_filtered/-PFdr0SiAEw_filtered.json b/annotations_filtered/-PFdr0SiAEw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..beeee57ece8bd730dfece209dd8d4de4b0f7f675 --- /dev/null +++ b/annotations_filtered/-PFdr0SiAEw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.21], [10.0, 11.33], [13.0, 12.66], [26.0, 26.08], [28.0, 28.86], [30.0, 30.94], [34.0, 35.23], [36.0, 40.73], [41.0, 41.5], [43.0, 44.02], [45.0, 45.74], [49.0, 49.33], [52.0, 53.27], [56.0, 56.39], [58.0, 94.22], [96.0, 96.28], [97.0, 101.33], [102.0, 103.15], [104.0, 106.51], [116.0, 116.51], [118.0, 120.24], [123.0, 125.09], [128.0, 129.51], [136.0, 137.54], [145.0, 148.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.43, 0.0, 98.8, 0.0, 65.67, 90.95, 0.0, 0.0, 86.27], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 49.53], ["double bass", 17.3], ["musical instrument", 7.61]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.21, 1.33, -0.34, 0.08, 0.86, 0.94, 1.23, 4.73, 0.5, 1.02, 0.74, 0.33, 1.27, 0.39, 36.22, 0.28, 4.33, 1.15, 2.51, 0.51, 2.24, 2.09, 1.51, 1.54, 3.53]} \ No newline at end of file diff --git a/annotations_filtered/-Pf1f0pZdnQ_filtered.json b/annotations_filtered/-Pf1f0pZdnQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbc5b456314009e4b726b885d6cb79b8523a680e --- /dev/null +++ b/annotations_filtered/-Pf1f0pZdnQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 101.44], [103.0, 103.62], [105.0, 106.83], [107.0, 107.69], [111.0, 124.53]], "keep_status": [false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 44.12], "audiomae_on_audioset": [null, null, null, null, [["music", 47.32], ["hum", 8.78], ["synthesizer", 7.92]]], "duration": [99.44, 0.62, 1.83, 0.69, 13.53]} \ No newline at end of file diff --git a/annotations_filtered/-QB2gXiOAKc_filtered.json b/annotations_filtered/-QB2gXiOAKc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9fa3c706b858c5d3ded27170bcc2b4f5f3e647a3 --- /dev/null +++ b/annotations_filtered/-QB2gXiOAKc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.13], [11.0, 12.26], [13.0, 14.57], [17.0, 22.94], [29.0, 32.91], [35.0, 47.33]], "keep_status": [false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 59.59, 47.98, 45.3], "audiomae_on_audioset": [null, null, null, null, [["singing bowl", 58.17], ["music", 4.91], ["tuning fork", 4.51]], [["hum", 25.52], ["speech", 16.82], ["didgeridoo", 13.0]]], "duration": [1.13, 1.26, 1.57, 5.94, 3.91, 12.33]} \ No newline at end of file diff --git a/annotations_filtered/-QJsljIDKkk_filtered.json b/annotations_filtered/-QJsljIDKkk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b58f9d3c0028268368142eacca9b5dbeb4860895 --- /dev/null +++ b/annotations_filtered/-QJsljIDKkk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.46], [9.0, 9.32], [12.0, 12.82], [20.0, 21.05], [22.0, 23.08], [24.0, 25.62], [27.0, 27.67], [29.0, 29.89], [31.0, 31.6], [33.0, 33.47], [37.0, 37.45], [42.0, 42.89], [44.0, 44.1], [50.0, 50.79], [51.0, 52.66], [53.0, 54.6], [55.0, 56.35], [61.0, 62.24], [63.0, 64.83], [67.0, 66.65], [76.0, 78.39], [80.0, 80.7], [82.0, 82.73], [84.0, 84.67], [85.0, 86.36], [88.0, 89.28], [90.0, 90.85], [95.0, 96.48], [99.0, 99.99], [100.0, 105.12], [107.0, 108.35], [110.0, 110.07], [111.0, 112.56], [113.0, 113.66], [116.0, 116.5], [118.0, 119.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.46, 0.32, 0.82, 1.05, 1.08, 1.62, 0.67, 0.89, 0.6, 0.47, 0.45, 0.89, 0.1, 0.79, 1.66, 1.6, 1.35, 1.24, 1.83, -0.35, 2.39, 0.7, 0.73, 0.67, 1.36, 1.28, 0.85, 1.48, 0.99, 5.12, 1.35, 0.07, 1.56, 0.66, 0.5, 1.58]} \ No newline at end of file diff --git a/annotations_filtered/-QNxYSDdpig_filtered.json b/annotations_filtered/-QNxYSDdpig_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..910d4229dd3d213ab887fdd8afc0bebd46c43b8b --- /dev/null +++ b/annotations_filtered/-QNxYSDdpig_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.97], [9.0, 8.73], [19.0, 20.98], [22.0, 25.22], [26.0, 28.49], [31.0, 31.7], [35.0, 35.14], [36.0, 38.74], [41.0, 43.17], [44.0, 44.54], [46.0, 46.36], [48.0, 48.0], [50.0, 50.45], [51.0, 51.58], [56.0, 56.32], [60.0, 60.44], [66.0, 66.31], [71.0, 71.2], [72.0, 72.79], [76.0, 75.88], [78.0, 78.65], [91.0, 91.64], [92.0, 92.6], [93.0, 95.01], [108.0, 109.05], [110.0, 111.72], [113.0, 115.05], [118.0, 118.79], [125.0, 125.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 97.73, 89.19, 0.0, 0.0, 69.74, 97.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.54, 0.0, 0.0, 43.35, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 48.31], ["sidetone", 25.91], ["dial tone", 6.77]], null, null], "duration": [1.97, -0.27, 1.98, 3.22, 2.49, 0.7, 0.14, 2.74, 2.17, 0.54, 0.36, 0.0, 0.45, 0.58, 0.32, 0.44, 0.31, 0.2, 0.79, -0.12, 0.65, 0.64, 0.6, 2.01, 1.05, 1.72, 2.05, 0.79, 0.15]} \ No newline at end of file diff --git a/annotations_filtered/-QOahlrO8Yo_filtered.json b/annotations_filtered/-QOahlrO8Yo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24892188af2f2b20b65c2a738b2172b6d0c49d05 --- /dev/null +++ b/annotations_filtered/-QOahlrO8Yo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 46.85], [48.0, 55.66], [56.0, 55.8], [56.0, 55.95], [56.0, 154.8]], "keep_status": [false, true, false, false, false], "silence_prob": [0.0, 30.29, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["noise", 24.48], ["music", 20.3], ["speech", 9.45]], null, null, null], "duration": [40.85, 7.66, -0.2, -0.05, 98.8]} \ No newline at end of file diff --git a/annotations_filtered/-QT_Af7RLjU_filtered.json b/annotations_filtered/-QT_Af7RLjU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7788ef1ed1d4e273f4874a283cc243ea98b543b8 --- /dev/null +++ b/annotations_filtered/-QT_Af7RLjU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 16.73], [17.0, 18.45], [23.0, 24.22], [34.0, 34.18], [38.0, 38.35], [42.0, 41.71], [42.0, 42.01], [48.0, 52.41], [57.0, 57.13], [58.0, 59.0], [66.0, 66.19], [69.0, 68.91], [74.0, 76.0], [79.0, 80.03], [82.0, 83.15], [84.0, 94.04], [102.0, 101.65], [102.0, 101.76], [113.0, 113.32], [122.0, 130.72], [133.0, 133.84]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [52.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.95, 0.0, 0.0, 0.0, 0.0, 61.77, 0.0, 0.0, 51.28, 0.0, 0.0, 0.0, 37.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 27.06], ["animal", 11.71], ["whale vocalization", 10.93]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 79.45], ["whack, thwack", 3.97], ["breaking", 2.23]], null], "duration": [8.73, 1.45, 1.22, 0.18, 0.35, -0.29, 0.01, 4.41, 0.13, 1.0, 0.19, -0.09, 2.0, 1.03, 1.15, 10.04, -0.35, -0.24, 0.32, 8.72, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/-QWL-FwX4t4_filtered.json b/annotations_filtered/-QWL-FwX4t4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed47653c79b2867cd36add35d27fa2ec0b93bdc7 --- /dev/null +++ b/annotations_filtered/-QWL-FwX4t4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 26.25], [27.0, 29.24], [30.0, 34.38], [35.0, 35.45], [36.0, 37.29], [38.0, 39.31], [40.0, 44.25], [45.0, 52.74], [54.0, 56.64], [58.0, 60.64], [61.0, 61.92], [63.0, 64.84], [67.0, 68.67], [70.0, 72.62], [75.0, 76.27], [77.0, 77.8], [78.0, 80.2], [80.0, 88.87], [100.0, 100.16], [101.0, 101.51], [110.0, 112.35], [113.0, 118.02]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [68.41, 63.64, 87.0, 0.0, 0.0, 0.0, 49.36, 71.57, 90.25, 68.02, 0.0, 0.0, 0.0, 92.8, 0.0, 0.0, 61.47, 62.99, 0.0, 0.0, 90.25, 45.3], "audiomae_on_audioset": [null, null, null, null, null, null, [["sidetone", 20.14], ["noise", 10.95], ["hum", 9.3]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 36.91], ["hum", 21.39], ["music", 9.18]]], "duration": [2.25, 2.24, 4.38, 0.45, 1.29, 1.31, 4.25, 7.74, 2.64, 2.64, 0.92, 1.84, 1.67, 2.62, 1.27, 0.8, 2.2, 8.87, 0.16, 0.51, 2.35, 5.02]} \ No newline at end of file diff --git a/annotations_filtered/-QZzReak2Ck_filtered.json b/annotations_filtered/-QZzReak2Ck_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f501243593b30206a753e9cba39bc3e03a6c6c6 --- /dev/null +++ b/annotations_filtered/-QZzReak2Ck_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[73.0, 93.02], [96.0, 97.28], [98.0, 101.12], [101.0, 103.42], [104.0, 104.9], [106.0, 107.84], [109.0, 113.1], [114.0, 114.67], [118.0, 120.85], [122.0, 121.85], [123.0, 151.38], [151.0, 151.41], [151.0, 151.44], [151.0, 151.48], [153.0, 156.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.12, 0.0, 66.03, 54.17, 0.0, 0.0, 72.31, 0.0, 35.37, 0.0, 32.58, 0.0, 0.0, 0.0, 81.71], "audiomae_on_audioset": [[["music", 43.13], ["throbbing", 20.27], ["hum", 15.46]], null, null, null, null, null, null, null, [["music", 73.1], ["speech", 5.41], ["didgeridoo", 4.54]], null, [["music", 50.95], ["speech", 24.54], ["whack, thwack", 2.62]], null, null, null, null], "duration": [20.02, 1.28, 3.12, 2.42, 0.9, 1.84, 4.1, 0.67, 2.85, -0.15, 28.38, 0.41, 0.44, 0.48, 3.09]} \ No newline at end of file diff --git a/annotations_filtered/-QfKnft9uWY_filtered.json b/annotations_filtered/-QfKnft9uWY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f9ad0e8bb42e557f458ba1e211ad1579195c763 --- /dev/null +++ b/annotations_filtered/-QfKnft9uWY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[76.0, 76.37], [76.0, 76.4], [83.0, 87.86], [90.0, 95.49], [100.0, 141.94], [144.0, 149.89]], "keep_status": [false, false, true, true, false, true], "silence_prob": [0.0, 0.0, 35.27, 39.77, 0.0, 31.75], "audiomae_on_audioset": [null, null, [["speech", 42.89], ["radio", 15.68], ["sidetone", 7.55]], [["fart", 25.2], ["speech", 23.95], ["fly, housefly", 8.6]], null, [["fart", 49.09], ["music", 8.72], ["sound effect", 4.1]]], "duration": [0.37, 0.4, 4.86, 5.49, 41.94, 5.89]} \ No newline at end of file diff --git a/annotations_filtered/-Qq6ZZy0yGg_filtered.json b/annotations_filtered/-Qq6ZZy0yGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49b0e01737c527b5ab3fa59f2e7d8433c7af6517 --- /dev/null +++ b/annotations_filtered/-Qq6ZZy0yGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.61], [3.0, 2.98], [7.0, 7.15], [13.0, 16.6], [17.0, 18.42], [22.0, 23.35], [26.0, 30.0], [36.0, 37.71], [45.0, 50.68], [61.0, 85.45], [85.0, 85.51], [88.0, 121.51], [127.0, 166.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.34, 0.0, 0.0, 29.25, 0.0, 29.51, 29.13, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 54.78], ["speech", 24.0], ["sidetone", 3.84]], null, null, [["music", 76.68], ["musical instrument", 4.58], ["speech", 2.85]], null, [["music", 74.26], ["boing", 4.46], ["musical instrument", 4.37]], [["music", 81.65], ["didgeridoo", 3.24], ["musical instrument", 1.66]], null, null, null], "duration": [0.61, -0.02, 0.15, 3.6, 1.42, 1.35, 4.0, 1.71, 5.68, 24.45, 0.51, 33.51, 39.8]} \ No newline at end of file diff --git a/annotations_filtered/-RBjiJto4hc_filtered.json b/annotations_filtered/-RBjiJto4hc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d24195a12f36c399830a7193998b81cd53b0e26a --- /dev/null +++ b/annotations_filtered/-RBjiJto4hc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.34], [19.0, 20.38], [36.0, 41.17], [42.0, 42.63], [43.0, 42.67], [43.0, 43.65], [44.0, 44.31], [44.0, 44.34], [44.0, 45.1], [49.0, 49.45], [50.0, 52.78], [54.0, 55.65], [56.0, 61.65], [63.0, 66.11], [68.0, 80.84]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [30.34, 0.0, 30.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.75, 0.0, 84.98, 46.64, 35.07], "audiomae_on_audioset": [[["vehicle", 17.86], ["moo", 14.13], ["speech", 10.38]], null, [["foghorn", 34.48], ["speech", 20.86], ["music", 12.71]], null, null, null, null, null, null, null, null, null, null, [["music", 40.1], ["ambient music", 7.64], ["foghorn", 6.24]], [["music", 53.31], ["theremin", 10.71], ["musical instrument", 5.24]]], "duration": [3.34, 1.38, 5.17, 0.63, -0.33, 0.65, 0.31, 0.34, 1.1, 0.45, 2.78, 1.65, 5.65, 3.11, 12.84]} \ No newline at end of file diff --git a/annotations_filtered/-RJ6USD2nEU_filtered.json b/annotations_filtered/-RJ6USD2nEU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec8a87e4867da461dce256b41476ea691ac50e8e --- /dev/null +++ b/annotations_filtered/-RJ6USD2nEU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.91], [8.0, 15.75], [30.0, 31.4], [33.0, 33.1], [34.0, 34.64], [38.0, 38.38], [43.0, 43.6], [45.0, 45.54], [56.0, 63.9], [76.0, 80.3], [83.0, 83.96], [84.0, 89.95], [90.0, 90.44], [90.0, 91.13], [93.0, 100.65], [102.0, 103.64], [107.0, 109.39], [115.0, 120.77], [127.0, 127.68], [131.0, 133.57], [137.0, 138.64], [139.0, 139.29], [149.0, 149.86], [152.0, 154.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 51.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.79, 62.37, 0.0, 33.04, 0.0, 0.0, 47.54, 0.0, 45.69, 46.05, 0.0, 46.61, 0.0, 0.0, 0.0, 58.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 39.21], ["animal", 10.42], ["breaking", 5.16]], null, null, [["fly, housefly", 38.31], ["bee, wasp, etc.", 35.73], ["insect", 14.6]], null, [["music", 49.28], ["throbbing", 5.06], ["hum", 3.83]], [["fly, housefly", 17.39], ["noise", 15.69], ["hum", 7.02]], null, [["hum", 43.42], ["mains hum", 18.79], ["music", 9.52]], null, null, null, null], "duration": [-0.09, 7.75, 1.4, 0.1, 0.64, 0.38, 0.6, 0.54, 7.9, 4.3, 0.96, 5.95, 0.44, 1.13, 7.65, 1.64, 2.39, 5.77, 0.68, 2.57, 1.64, 0.29, 0.86, 2.84]} \ No newline at end of file diff --git a/annotations_filtered/-RhmDUj_GJs_filtered.json b/annotations_filtered/-RhmDUj_GJs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3dd638db8da00da96e713bbcded882355e50d903 --- /dev/null +++ b/annotations_filtered/-RhmDUj_GJs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 29.02], [31.0, 32.09], [36.0, 37.83], [51.0, 52.07], [54.0, 55.29], [58.0, 60.89], [77.0, 77.67], [80.0, 80.86], [88.0, 89.55]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 52.62, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.02, 1.09, 1.83, 1.07, 1.29, 2.89, 0.67, 0.86, 1.55]} \ No newline at end of file diff --git a/annotations_filtered/-RuK7XKbefY_filtered.json b/annotations_filtered/-RuK7XKbefY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b3fe28878d4c62dd661fa15a7a0bd8989f5fbc6 --- /dev/null +++ b/annotations_filtered/-RuK7XKbefY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.27], [6.0, 8.7], [12.0, 14.44], [17.0, 19.04], [23.0, 25.37], [27.0, 28.95], [31.0, 33.98], [43.0, 43.75], [48.0, 48.12], [73.0, 110.79], [113.0, 113.64], [118.0, 118.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.68, 99.96, 94.66, 98.51, 90.08, 0.0, 87.74, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.27, 2.7, 2.44, 2.04, 2.37, 1.95, 2.98, 0.75, 0.12, 37.79, 0.64, 0.0]} \ No newline at end of file diff --git a/annotations_filtered/-SJAzpHg4s8_filtered.json b/annotations_filtered/-SJAzpHg4s8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/-SJAzpHg4s8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/-SKfkvvtqN0_filtered.json b/annotations_filtered/-SKfkvvtqN0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da3b7be8a150d281e33da2dfdf2dd54c73d3cc91 --- /dev/null +++ b/annotations_filtered/-SKfkvvtqN0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 21.68], [35.0, 35.43], [39.0, 39.92], [42.0, 42.45], [47.0, 49.1], [49.0, 49.15], [49.0, 49.92], [55.0, 57.03], [70.0, 70.28], [74.0, 74.6], [76.0, 76.52], [81.0, 104.11], [106.0, 105.8], [108.0, 108.43], [135.0, 135.43], [145.0, 145.49], [147.0, 149.57], [152.0, 154.5], [161.0, 161.89], [163.0, 163.65]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, true, true, false, false], "silence_prob": [32.24, 0.0, 0.0, 0.0, 34.15, 0.0, 0.0, 35.0, 0.0, 0.0, 0.0, 37.07, 0.0, 0.0, 0.0, 0.0, 35.74, 37.56, 0.0, 0.0], "audiomae_on_audioset": [[["music", 34.06], ["brass instrument", 17.19], ["saxophone", 9.1]], null, null, null, [["mosquito", 35.35], ["fly, housefly", 31.42], ["insect", 13.07]], null, null, [["hum", 36.85], ["throbbing", 19.46], ["music", 12.17]], null, null, null, [["music", 53.1], ["buzz", 12.2], ["bleat", 3.12]], null, null, null, null, [["music", 25.42], ["carnatic music", 24.13], ["speech", 7.78]], [["music", 42.27], ["chant", 6.75], ["musical instrument", 4.14]], null, null], "duration": [15.68, 0.43, 0.92, 0.45, 2.1, 0.15, 0.92, 2.03, 0.28, 0.6, 0.52, 23.11, -0.2, 0.43, 0.43, 0.49, 2.57, 2.5, 0.89, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/-SkeK7t74oo_filtered.json b/annotations_filtered/-SkeK7t74oo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dcf489bd3df204f55f91965ad7f8abeae845625e --- /dev/null +++ b/annotations_filtered/-SkeK7t74oo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.29], [14.0, 15.6], [16.0, 16.36], [17.0, 23.04], [33.0, 33.61], [40.0, 41.99], [45.0, 44.93], [47.0, 51.95], [60.0, 72.52], [82.0, 83.03], [88.0, 94.61], [99.0, 104.11], [105.0, 114.79], [118.0, 119.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.73, 0.0, 0.0, 0.0, 31.13, 32.7, 0.0, 33.21, 33.52, 34.03, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 53.63], ["speech", 13.05], ["saxophone", 3.62]], null, null, null, [["sidetone", 62.27], ["music", 15.8], ["throbbing", 3.05]], [["music", 47.52], ["speech", 27.62], ["sidetone", 5.08]], null, [["music", 61.33], ["sidetone", 11.47], ["speech", 6.25]], [["music", 60.48], ["house music", 4.09], ["sampler", 2.07]], [["music", 57.62], ["hum", 9.52], ["saxophone", 3.15]], null], "duration": [1.29, 1.6, 0.36, 6.04, 0.61, 1.99, -0.07, 4.95, 12.52, 1.03, 6.61, 5.11, 9.79, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/-Svsz19yyPM_filtered.json b/annotations_filtered/-Svsz19yyPM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a14767bfb84cdc1d7c5e205bbffecf99bf5639f --- /dev/null +++ b/annotations_filtered/-Svsz19yyPM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.4], [9.0, 9.22], [11.0, 18.03], [19.0, 19.53], [21.0, 28.49], [31.0, 76.1], [78.0, 81.51], [84.0, 92.16], [94.0, 99.94], [102.0, 102.32], [103.0, 103.5], [106.0, 105.85], [106.0, 106.84], [109.0, 109.0], [111.0, 111.48], [112.0, 114.94], [120.0, 121.19], [123.0, 124.21], [126.0, 140.12], [141.0, 149.39], [153.0, 155.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.51, 0.0, 96.04, 0.0, 51.39, 0.0, 89.54, 68.67, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 0.0, 0.0, 45.46, 42.88, 45.14], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 76.66], ["sampler", 4.29], ["drum machine", 4.04]], [["music", 46.72], ["hum", 17.85], ["throbbing", 13.36]], [["beatboxing", 56.92], ["music", 17.26], ["speech", 6.22]]], "duration": [2.4, 0.22, 7.03, 0.53, 7.49, 45.1, 3.51, 8.16, 5.94, 0.32, 0.5, -0.15, 0.84, 0.0, 0.48, 2.94, 1.19, 1.21, 14.12, 8.39, 2.07]} \ No newline at end of file diff --git a/annotations_filtered/-T16rxR-nCo_filtered.json b/annotations_filtered/-T16rxR-nCo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08732ecd88d7a220469605234056a87105b4a049 --- /dev/null +++ b/annotations_filtered/-T16rxR-nCo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.39], [15.0, 15.09], [17.0, 17.2], [19.0, 20.14], [27.0, 26.97], [34.0, 35.04], [40.0, 42.89], [46.0, 46.11], [49.0, 49.94], [53.0, 53.5], [56.0, 56.83], [59.0, 59.95], [61.0, 63.02], [69.0, 70.11], [76.0, 76.42], [78.0, 78.61], [86.0, 86.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.27, 0.0, 0.0, 0.0, 0.0, 0.0, 73.82, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.39, 0.09, 0.2, 1.14, -0.03, 1.04, 2.89, 0.11, 0.94, 0.5, 0.83, 0.95, 2.02, 1.11, 0.42, 0.61, 0.26]} \ No newline at end of file diff --git a/annotations_filtered/-TLCaDbBv_s_filtered.json b/annotations_filtered/-TLCaDbBv_s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3f9fd8d7790e6d2209b837a62fa4699b21708c7 --- /dev/null +++ b/annotations_filtered/-TLCaDbBv_s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.74], [9.0, 10.42], [12.0, 13.61], [16.0, 16.6], [18.0, 18.71], [20.0, 21.46], [22.0, 23.6], [26.0, 26.33], [29.0, 30.47], [31.0, 32.48], [34.0, 35.75], [38.0, 38.77], [41.0, 42.48], [45.0, 45.49], [47.0, 47.38], [49.0, 49.81], [51.0, 52.07], [54.0, 55.17], [61.0, 61.67], [65.0, 67.56], [69.0, 71.22], [74.0, 74.36], [76.0, 76.44], [77.0, 77.04], [77.0, 79.3], [82.0, 82.22], [94.0, 95.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.29, 57.72, 0.0, 0.0, 0.0, 45.56, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.55], ["music", 22.67], ["hum", 3.02]], null, null], "duration": [2.74, 1.42, 1.61, 0.6, 0.71, 1.46, 1.6, 0.33, 1.47, 1.48, 1.75, 0.77, 1.48, 0.49, 0.38, 0.81, 1.07, 1.17, 0.67, 2.56, 2.22, 0.36, 0.44, 0.04, 2.3, 0.22, 1.86]} \ No newline at end of file diff --git a/annotations_filtered/-TPRG6Yqzf4_filtered.json b/annotations_filtered/-TPRG6Yqzf4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed9992f7ae8cce3c04d11965b6803a1ce4bcb5b6 --- /dev/null +++ b/annotations_filtered/-TPRG6Yqzf4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.67], [3.0, 9.21], [16.0, 19.08], [20.0, 21.47], [23.0, 23.75], [36.0, 37.0], [40.0, 40.76], [44.0, 45.01], [47.0, 48.54], [50.0, 53.23], [54.0, 67.8], [73.0, 83.81], [84.0, 83.84], [85.0, 96.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 87.19, 97.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 46.02, 35.46, 0.0, 34.03], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 37.04], ["music", 23.48], ["hum", 4.3]], [["music", 43.05], ["musical instrument", 14.6], ["speech", 6.81]], null, [["livestock, farm animals, working animals", 43.97], ["cattle, bovinae", 38.13], ["moo", 17.4]]], "duration": [0.67, 6.21, 3.08, 1.47, 0.75, 1.0, 0.76, 1.01, 1.54, 3.23, 13.8, 10.81, -0.16, 11.15]} \ No newline at end of file diff --git a/annotations_filtered/-TWsZukTS4Q_filtered.json b/annotations_filtered/-TWsZukTS4Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/-TWsZukTS4Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/-TogGxzlfhM_filtered.json b/annotations_filtered/-TogGxzlfhM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91af0000c918eb9ae29ea21404d2bca9e6a1a899 --- /dev/null +++ b/annotations_filtered/-TogGxzlfhM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [14.0, 15.04], [16.0, 16.5], [19.0, 18.99], [27.0, 27.19], [30.0, 30.23], [32.0, 32.88], [35.0, 35.33], [37.0, 37.3], [42.0, 43.48], [53.0, 53.74], [78.0, 78.38], [109.0, 109.7], [111.0, 111.4], [118.0, 117.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 1.04, 0.5, -0.01, 0.19, 0.23, 0.88, 0.33, 0.3, 1.48, 0.74, 0.38, 0.7, 0.4, -0.22]} \ No newline at end of file diff --git a/annotations_filtered/-TzrPYcpPvY_filtered.json b/annotations_filtered/-TzrPYcpPvY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f26210b5b96df24dc46f20ee25b366181223a38f --- /dev/null +++ b/annotations_filtered/-TzrPYcpPvY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 21.07], [23.0, 24.63], [25.0, 25.14], [29.0, 37.81], [49.0, 57.82], [60.0, 60.83], [68.0, 68.54], [69.0, 76.45], [78.0, 89.45], [93.0, 92.65], [95.0, 96.72], [105.0, 121.69], [124.0, 132.73]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [48.52, 0.0, 0.0, 39.98, 38.9, 0.0, 0.0, 44.55, 40.66, 0.0, 0.0, 42.15, 69.34], "audiomae_on_audioset": [[["music", 25.92], ["musical instrument", 14.38], ["guitar", 10.44]], null, null, [["music", 74.16], ["theremin", 4.42], ["musical instrument", 2.98]], [["music", 82.24], ["theremin", 4.65], ["musical instrument", 1.81]], null, null, [["music", 69.25], ["musical instrument", 6.25], ["guitar", 2.75]], [["music", 77.09], ["musical instrument", 3.0], ["theremin", 2.49]], null, null, [["music", 79.09], ["theremin", 4.04], ["singing", 2.97]], null], "duration": [2.07, 1.63, 0.14, 8.81, 8.82, 0.83, 0.54, 7.45, 11.45, -0.35, 1.72, 16.69, 8.73]} \ No newline at end of file diff --git a/annotations_filtered/-U9v7Nz6hOs_filtered.json b/annotations_filtered/-U9v7Nz6hOs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56cf3546c26581878023e636a38a6bda01c7c784 --- /dev/null +++ b/annotations_filtered/-U9v7Nz6hOs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.0], [9.0, 10.74], [12.0, 12.11], [13.0, 14.52], [17.0, 23.11], [34.0, 55.49], [56.0, 64.27], [65.0, 67.34], [69.0, 68.91], [70.0, 70.88], [72.0, 85.77], [90.0, 89.95], [91.0, 91.0], [93.0, 98.34], [105.0, 120.36], [125.0, 126.33], [128.0, 134.54], [140.0, 140.73], [155.0, 155.34]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.42, 28.95, 29.06, 29.26, 0.0, 0.0, 29.05, 0.0, 0.0, 30.22, 30.86, 0.0, 31.8, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 63.5], ["quack", 6.9], ["livestock, farm animals, working animals", 2.75]], [["music", 53.48], ["speech", 18.34], ["electronic music", 10.32]], [["music", 12.99], ["vehicle", 11.55], ["whale vocalization", 8.26]], [["boing", 37.71], ["moo", 26.01], ["cattle, bovinae", 22.73]], null, null, [["music", 24.18], ["speech", 15.5], ["whip", 11.98]], null, null, [["speech", 60.38], ["hum", 12.69], ["music", 5.85]], [["music", 22.26], ["hum", 18.96], ["throbbing", 14.4]], null, [["music", 69.37], ["theremin", 10.04], ["musical instrument", 4.35]], null, null], "duration": [1.0, 1.74, 0.11, 1.52, 6.11, 21.49, 8.27, 2.34, -0.09, 0.88, 13.77, -0.05, 0.0, 5.34, 15.36, 1.33, 6.54, 0.73, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/-UAElWXbk3I_filtered.json b/annotations_filtered/-UAElWXbk3I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76275b947851958bae07e84d737f968a55300991 --- /dev/null +++ b/annotations_filtered/-UAElWXbk3I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.39], [16.0, 33.0], [35.0, 34.94], [37.0, 37.44], [39.0, 38.97], [40.0, 41.45], [44.0, 47.7], [48.0, 49.54], [50.0, 50.79], [58.0, 59.21], [61.0, 61.28], [65.0, 66.12], [67.0, 67.59], [69.0, 74.24], [76.0, 84.28], [87.0, 86.9], [90.0, 90.42], [93.0, 98.51], [99.0, 101.39], [102.0, 107.89], [109.0, 112.82], [114.0, 115.13], [116.0, 116.72], [118.0, 118.89], [121.0, 121.59], [124.0, 123.99], [125.0, 125.71], [126.0, 126.35], [128.0, 127.6], [128.0, 127.75], [129.0, 128.88], [131.0, 131.08], [139.0, 139.97], [142.0, 142.87], [143.0, 143.48], [147.0, 146.99], [148.0, 149.54], [152.0, 152.46], [161.0, 160.74], [166.0, 166.28], [170.0, 170.21], [172.0, 173.58], [175.0, 176.54], [177.0, 178.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.88, 29.83, 0.0, 0.0, 0.0, 0.0, 69.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.86, 31.21, 0.0, 0.0, 62.58, 74.76, 75.07, 71.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 55.08], ["speech", 14.77], ["crack", 4.28]], [["music", 69.76], ["speech", 11.07], ["sampler", 1.87]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.63], ["speech", 6.21], ["livestock, farm animals, working animals", 4.36]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.39, 17.0, -0.06, 0.44, -0.03, 1.45, 3.7, 1.54, 0.79, 1.21, 0.28, 1.12, 0.59, 5.24, 8.28, -0.1, 0.42, 5.51, 2.39, 5.89, 3.82, 1.13, 0.72, 0.89, 0.59, -0.01, 0.71, 0.35, -0.4, -0.25, -0.12, 0.08, 0.97, 0.87, 0.48, -0.01, 1.54, 0.46, -0.26, 0.28, 0.21, 1.58, 1.54, 1.8]} \ No newline at end of file diff --git a/annotations_filtered/-UAV4O9oZy0_filtered.json b/annotations_filtered/-UAV4O9oZy0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4bb2165d42aee4bfdd1b069bb20c2d35607f1fe7 --- /dev/null +++ b/annotations_filtered/-UAV4O9oZy0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 33.24], [37.0, 37.1]], "keep_status": [true, false], "silence_prob": [34.61, 0.0], "audiomae_on_audioset": [[["music", 34.97], ["guitar", 16.89], ["effects unit", 6.65]], null], "duration": [6.24, 0.1]} \ No newline at end of file diff --git a/annotations_filtered/-UJ9K8lMxPA_filtered.json b/annotations_filtered/-UJ9K8lMxPA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..885f0eae95dd59d3d0e8c459def74f7906823794 --- /dev/null +++ b/annotations_filtered/-UJ9K8lMxPA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.99], [15.0, 15.82], [17.0, 22.67], [25.0, 25.93], [29.0, 123.5], [124.0, 128.92], [132.0, 170.87], [171.0, 172.81]], "keep_status": [false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 32.65, 0.0, 0.0, 30.62, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 46.87], ["effects unit", 8.81], ["synthesizer", 6.87]], null, null, [["music", 47.12], ["speech", 10.17], ["cacophony", 3.97]], null, null], "duration": [1.99, 0.82, 5.67, 0.93, 94.5, 4.92, 38.87, 1.81]} \ No newline at end of file diff --git a/annotations_filtered/-UZY16_K3Pw_filtered.json b/annotations_filtered/-UZY16_K3Pw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7aa3d2cd0d08cfcbf89261180e03364ece4162a0 --- /dev/null +++ b/annotations_filtered/-UZY16_K3Pw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 26.69], [28.0, 29.56], [32.0, 32.32], [37.0, 37.86], [41.0, 43.46], [46.0, 46.58], [48.0, 48.25], [48.0, 51.29], [53.0, 53.15], [57.0, 57.5], [61.0, 60.98], [78.0, 78.41], [82.0, 83.34], [85.0, 85.56], [88.0, 89.02], [93.0, 96.85], [98.0, 98.31], [99.0, 99.44], [101.0, 101.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [60.7, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.69, 1.56, 0.32, 0.86, 2.46, 0.58, 0.25, 3.29, 0.15, 0.5, -0.02, 0.41, 1.34, 0.56, 1.02, 3.85, 0.31, 0.44, 0.17]} \ No newline at end of file diff --git a/annotations_filtered/-U_IRXhodds_filtered.json b/annotations_filtered/-U_IRXhodds_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cfcfb5b9a8201a2e174d79d66ce56d6fc449e395 --- /dev/null +++ b/annotations_filtered/-U_IRXhodds_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.08], [5.0, 5.0], [7.0, 7.75], [9.0, 18.4], [19.0, 19.16], [27.0, 27.36], [29.0, 34.64], [35.0, 69.42], [71.0, 73.89], [75.0, 75.37], [80.0, 84.37], [85.0, 85.16], [87.0, 87.34], [87.0, 87.51], [88.0, 88.15], [93.0, 95.88], [97.0, 97.75], [99.0, 102.03], [108.0, 112.36], [116.0, 115.89], [118.0, 129.71], [137.0, 150.94], [153.0, 176.5]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.04, 0.0, 0.0, 32.82, 0.0, 32.13, 0.0, 68.54, 0.0, 0.0, 0.0, 0.0, 29.02, 0.0, 32.54, 29.63, 0.0, 29.76, 30.02, 30.68], "audiomae_on_audioset": [null, null, null, [["speech", 68.53], ["music", 17.4], ["explosion", 3.7]], null, null, [["cattle, bovinae", 40.79], ["moo", 30.43], ["livestock, farm animals, working animals", 24.18]], null, [["music", 39.65], ["throbbing", 19.19], ["hum", 5.86]], null, null, null, null, null, null, [["music", 51.01], ["throbbing", 8.86], ["electronic music", 3.87]], null, [["music", 56.1], ["throbbing", 7.76], ["speech", 5.67]], [["music", 29.31], ["throbbing", 13.46], ["speech", 6.56]], null, [["music", 55.2], ["speech", 19.25], ["fly, housefly", 2.99]], [["music", 44.89], ["speech", 42.66], ["synthesizer", 1.72]], [["music", 72.26], ["throbbing", 7.18], ["electronic music", 4.65]]], "duration": [0.08, 0.0, 0.75, 9.4, 0.16, 0.36, 5.64, 34.42, 2.89, 0.37, 4.37, 0.16, 0.34, 0.51, 0.15, 2.88, 0.75, 3.03, 4.36, -0.11, 11.71, 13.94, 23.5]} \ No newline at end of file diff --git a/annotations_filtered/-VnQ_KpOBm4_filtered.json b/annotations_filtered/-VnQ_KpOBm4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f079584b443ce674c1baac66acb4876a298c1645 --- /dev/null +++ b/annotations_filtered/-VnQ_KpOBm4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.13], [4.0, 6.37], [13.0, 13.83], [17.0, 18.18], [19.0, 19.92], [27.0, 27.75], [29.0, 30.13], [34.0, 34.05], [35.0, 35.58], [41.0, 42.55], [46.0, 46.6], [49.0, 50.14], [51.0, 51.14], [52.0, 52.86], [54.0, 55.53], [57.0, 57.16], [62.0, 62.06], [63.0, 64.45], [66.0, 66.7], [69.0, 69.74], [72.0, 72.62], [76.0, 76.57], [79.0, 80.2], [82.0, 84.45], [88.0, 88.94], [91.0, 91.25], [92.0, 92.21], [94.0, 94.34], [96.0, 96.82], [100.0, 100.18], [103.0, 103.4], [106.0, 106.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 47.03], ["musical instrument", 13.94], ["guitar", 13.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 38.35], ["speech", 8.29], ["musical instrument", 4.71]], null, null, null, null, null, null, null, null], "duration": [0.13, 2.37, 0.83, 1.18, 0.92, 0.75, 1.13, 0.05, 0.58, 1.55, 0.6, 1.14, 0.14, 0.86, 1.53, 0.16, 0.06, 1.45, 0.7, 0.74, 0.62, 0.57, 1.2, 2.45, 0.94, 0.25, 0.21, 0.34, 0.82, 0.18, 0.4, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/-W8pOz1fsD0_filtered.json b/annotations_filtered/-W8pOz1fsD0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01c367440a68d880637feb64392e6740bd31d09c --- /dev/null +++ b/annotations_filtered/-W8pOz1fsD0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 44.96], [45.0, 45.08], [46.0, 63.59], [65.0, 70.41], [72.0, 73.09]], "keep_status": [false, false, true, true, false], "silence_prob": [0.0, 0.0, 29.42, 32.94, 0.0], "audiomae_on_audioset": [null, null, [["music", 54.68], ["throbbing", 6.95], ["hum", 5.56]], [["music", 33.15], ["throbbing", 20.68], ["hum", 14.39]], null], "duration": [40.96, 0.08, 17.59, 5.41, 1.09]} \ No newline at end of file diff --git a/annotations_filtered/-WN4uZXOltk_filtered.json b/annotations_filtered/-WN4uZXOltk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f81123a2b5097a2cbe9f5c7c8ef50ce827f7c6fb --- /dev/null +++ b/annotations_filtered/-WN4uZXOltk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 29.46], [31.0, 37.72], [38.0, 51.81], [54.0, 55.26], [55.0, 55.32], [56.0, 83.78], [85.0, 96.55], [99.0, 135.14], [136.0, 137.94], [139.0, 139.9], [142.0, 142.97], [145.0, 148.14], [150.0, 168.15], [170.0, 170.16]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.99, 36.11, 66.76, 0.0, 0.0, 53.97, 39.75, 0.0, 0.0, 0.0, 0.0, 100.0, 83.52, 0.0], "audiomae_on_audioset": [[["hum", 37.66], ["mains hum", 24.96], ["music", 22.75]], [["speech", 22.58], ["vehicle", 21.04], ["car", 9.59]], null, null, null, null, [["mosquito", 58.28], ["fly, housefly", 25.06], ["fart", 6.16]], null, null, null, null, null, null, null], "duration": [26.46, 6.72, 13.81, 1.26, 0.32, 27.78, 11.55, 36.14, 1.94, 0.9, 0.97, 3.14, 18.15, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/-WOw8ePUCEo_filtered.json b/annotations_filtered/-WOw8ePUCEo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10a2827c0d4e6812d2136c0049bab67a33005a92 --- /dev/null +++ b/annotations_filtered/-WOw8ePUCEo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.23], [15.0, 19.38], [21.0, 24.78], [26.0, 27.87], [31.0, 30.74], [32.0, 33.07], [35.0, 35.36], [37.0, 36.96], [39.0, 39.14], [40.0, 41.81], [43.0, 43.75], [47.0, 46.95], [48.0, 49.06], [51.0, 51.14], [55.0, 56.12], [58.0, 58.83], [61.0, 61.99], [64.0, 65.7], [68.0, 68.54], [70.0, 77.82], [84.0, 85.55], [91.0, 95.57], [97.0, 101.26], [104.0, 106.66], [110.0, 113.04], [117.0, 119.33]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.73, 51.12, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.32, 0.0, 97.33, 98.27, 99.78, 100.0, 93.45], "audiomae_on_audioset": [[["speech", 35.98], ["music", 17.92], ["percussion", 11.48]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.23, 4.38, 3.78, 1.87, -0.26, 1.07, 0.36, -0.04, 0.14, 1.81, 0.75, -0.05, 1.06, 0.14, 1.12, 0.83, 0.99, 1.7, 0.54, 7.82, 1.55, 4.57, 4.26, 2.66, 3.04, 2.33]} \ No newline at end of file diff --git a/annotations_filtered/-WW51YaWO-4_filtered.json b/annotations_filtered/-WW51YaWO-4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f029a5dda90fba4122f1cb53df96365513416ee --- /dev/null +++ b/annotations_filtered/-WW51YaWO-4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.55], [13.0, 15.69], [17.0, 17.36], [18.0, 23.85], [24.0, 30.16], [31.0, 31.26], [32.0, 32.61], [34.0, 34.72], [35.0, 36.83], [38.0, 39.56], [42.0, 42.23], [43.0, 46.03], [51.0, 51.26], [61.0, 63.19], [68.0, 69.9], [73.0, 75.78], [81.0, 84.54], [86.0, 87.03], [91.0, 91.86], [93.0, 98.78], [99.0, 100.5], [101.0, 103.3], [104.0, 105.93]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [41.54, 99.59, 0.0, 95.51, 37.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.43, 0.0, 99.96, 0.0, 98.44, 98.36, 0.0, 0.0, 45.88, 0.0, 88.28, 0.0], "audiomae_on_audioset": [[["chirp tone", 52.4], ["speech", 23.71], ["sine wave", 19.76]], null, null, null, [["speech", 40.96], ["burping, eructation", 7.72], ["dial tone", 7.47]], null, null, null, null, null, null, [["speech", 20.86], ["sine wave", 17.51], ["tuning fork", 12.43]], null, null, null, null, null, null, null, [["sidetone", 38.06], ["hum", 7.18], ["music", 6.3]], null, null, null], "duration": [3.55, 2.69, 0.36, 5.85, 6.16, 0.26, 0.61, 0.72, 1.83, 1.56, 0.23, 3.03, 0.26, 2.19, 1.9, 2.78, 3.54, 1.03, 0.86, 5.78, 1.5, 2.3, 1.93]} \ No newline at end of file diff --git a/annotations_filtered/-W_4EZvbrEI_filtered.json b/annotations_filtered/-W_4EZvbrEI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7238aeacf2a7e7b9ea7ef36681980041ec78499 --- /dev/null +++ b/annotations_filtered/-W_4EZvbrEI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 42.5], [44.0, 47.21], [49.0, 63.21], [70.0, 69.99], [81.0, 85.89], [87.0, 92.74], [93.0, 95.5], [97.0, 98.49], [101.0, 112.33]], "keep_status": [true, true, false, false, true, true, true, false, true], "silence_prob": [31.31, 30.0, 31.25, 0.0, 29.86, 30.14, 30.23, 0.0, 30.53], "audiomae_on_audioset": [[["speech", 46.94], ["music", 13.86], ["throbbing", 5.54]], [["music", 16.28], ["vehicle", 12.39], ["car", 11.42]], [["didgeridoo", 50.47], ["music", 36.43], ["electronic music", 1.59]], null, [["speech", 37.59], ["vehicle", 15.24], ["car", 10.97]], [["music", 24.08], ["boing", 18.44], ["speech", 17.03]], [["music", 22.51], ["speech", 8.93], ["jet engine", 5.49]], null, [["music", 51.01], ["fly, housefly", 5.83], ["buzz", 4.53]]], "duration": [8.5, 3.21, 14.21, -0.01, 4.89, 5.74, 2.5, 1.49, 11.33]} \ No newline at end of file diff --git a/annotations_filtered/-WbsnXGKkIg_filtered.json b/annotations_filtered/-WbsnXGKkIg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84766d04e9c58bed6759a11a75fa5e518483cbcf --- /dev/null +++ b/annotations_filtered/-WbsnXGKkIg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 24.54], [26.0, 27.08], [27.0, 28.39], [31.0, 30.96], [32.0, 33.29], [35.0, 35.78], [37.0, 38.47], [39.0, 43.34], [44.0, 45.79], [47.0, 48.37], [50.0, 51.6], [53.0, 54.72], [56.0, 56.54], [59.0, 67.93], [70.0, 79.41], [80.0, 91.52], [92.0, 92.7], [95.0, 95.1], [96.0, 96.2], [98.0, 111.57], [113.0, 174.36], [177.0, 177.08], [178.0, 179.17], [180.0, 181.04], [184.0, 186.83], [187.0, 195.49], [197.0, 199.15], [200.0, 201.23], [202.0, 202.95], [206.0, 206.61], [207.0, 209.07], [210.0, 211.82], [212.0, 214.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 0.0, 0.0, 0.0, 0.0, 96.42, 74.76, 60.89, 0.0, 0.0, 0.0, 42.13, 0.0, 0.0, 0.0, 0.0, 93.29, 59.86, 100.0, 0.0, 0.0, 0.0, 51.5, 0.0, 96.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 50.01], ["beatboxing", 6.09], ["fart", 5.77]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.54, 1.08, 1.39, -0.04, 1.29, 0.78, 1.47, 4.34, 1.79, 1.37, 1.6, 1.72, 0.54, 8.93, 9.41, 11.52, 0.7, 0.1, 0.2, 13.57, 61.36, 0.08, 1.17, 1.04, 2.83, 8.49, 2.15, 1.23, 0.95, 0.61, 2.07, 1.82, 2.49]} \ No newline at end of file diff --git a/annotations_filtered/-WmDszVxti0_filtered.json b/annotations_filtered/-WmDszVxti0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dbf83642700d18a813035890ea060df5699b3533 --- /dev/null +++ b/annotations_filtered/-WmDszVxti0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.38], [2.0, 2.57], [5.0, 6.3], [8.0, 20.53], [27.0, 27.28], [32.0, 63.17], [66.0, 92.16], [94.0, 98.81], [100.0, 108.26], [109.0, 109.16], [110.0, 115.79], [118.0, 118.17], [119.0, 119.33], [124.0, 133.29], [135.0, 160.39]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 29.78, 0.0, 0.0, 30.05, 31.56, 31.15, 0.0, 29.67, 0.0, 0.0, 31.69, 29.55], "audiomae_on_audioset": [null, null, null, [["music", 65.44], ["didgeridoo", 7.32], ["explosion", 7.01]], null, null, [["music", 44.41], ["hum", 18.83], ["mains hum", 9.54]], [["music", 40.66], ["didgeridoo", 18.48], ["speech", 8.89]], [["music", 49.83], ["speech", 33.37], ["foghorn", 3.65]], null, [["hum", 18.94], ["whip", 18.22], ["music", 14.56]], null, null, [["music", 44.49], ["throbbing", 11.28], ["didgeridoo", 9.82]], [["music", 51.43], ["speech", 22.12], ["throbbing", 4.32]]], "duration": [0.38, 0.57, 1.3, 12.53, 0.28, 31.17, 26.16, 4.81, 8.26, 0.16, 5.79, 0.17, 0.33, 9.29, 25.39]} \ No newline at end of file diff --git a/annotations_filtered/-WrDbBvPN00_filtered.json b/annotations_filtered/-WrDbBvPN00_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/-WrDbBvPN00_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/-Ww_Bo5ghiw_filtered.json b/annotations_filtered/-Ww_Bo5ghiw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..005024017920beaf27fba0428f1c240ef686e839 --- /dev/null +++ b/annotations_filtered/-Ww_Bo5ghiw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.64], [8.0, 9.22], [10.0, 11.28], [12.0, 12.92], [16.0, 15.97], [21.0, 21.25], [26.0, 27.67], [29.0, 30.77], [33.0, 39.51], [41.0, 47.46], [48.0, 51.44], [54.0, 57.99], [59.0, 65.1], [68.0, 70.41], [78.0, 79.32], [81.0, 81.53], [83.0, 83.19], [84.0, 86.43], [89.0, 88.65], [91.0, 93.97], [95.0, 99.84], [103.0, 112.46], [116.0, 123.08], [125.0, 125.51], [127.0, 139.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.47, 74.13, 79.07, 72.46, 56.25, 68.41, 0.0, 0.0, 0.0, 59.24, 0.0, 57.4, 71.57, 73.67, 42.28, 0.0, 46.33], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 78.88], ["music", 8.69], ["hum", 2.18]], null, [["music", 55.1], ["hum", 16.62], ["electronic music", 4.06]]], "duration": [1.64, 1.22, 1.28, 0.92, -0.03, 0.25, 1.67, 1.77, 6.51, 6.46, 3.44, 3.99, 6.1, 2.41, 1.32, 0.53, 0.19, 2.43, -0.35, 2.97, 4.84, 9.46, 7.08, 0.51, 12.9]} \ No newline at end of file diff --git a/annotations_filtered/-XCvw6NPfVM_filtered.json b/annotations_filtered/-XCvw6NPfVM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae093e14af5fd05638a6e4682f53b7f7e4e67eb1 --- /dev/null +++ b/annotations_filtered/-XCvw6NPfVM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.05], [6.0, 7.15], [13.0, 14.84], [16.0, 16.61], [17.0, 19.74], [23.0, 25.61], [26.0, 29.46], [31.0, 47.65], [49.0, 70.5], [73.0, 73.28], [74.0, 86.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [57.32, 0.0, 0.0, 0.0, 100.0, 99.92, 100.0, 99.99, 99.16, 0.0, 84.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [3.05, 1.15, 1.84, 0.61, 2.74, 2.61, 3.46, 16.65, 21.5, 0.28, 12.32]} \ No newline at end of file diff --git a/annotations_filtered/-Xb-ryuTDlE_filtered.json b/annotations_filtered/-Xb-ryuTDlE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47a7f9a56490b0c8fdb7a24e5eeeb289af417827 --- /dev/null +++ b/annotations_filtered/-Xb-ryuTDlE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.86], [16.0, 16.36], [17.0, 18.15], [19.0, 19.6], [21.0, 21.83], [24.0, 27.33], [28.0, 34.35], [36.0, 38.74]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 76.37, 75.55, 74.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.86, 0.36, 1.15, 0.6, 0.83, 3.33, 6.35, 2.74]} \ No newline at end of file diff --git a/annotations_filtered/-XggDv2QdHg_filtered.json b/annotations_filtered/-XggDv2QdHg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49153d9b2492cddd70320dd543776634fc0c2d27 --- /dev/null +++ b/annotations_filtered/-XggDv2QdHg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 16.68], [17.0, 19.75], [23.0, 28.88], [32.0, 33.79], [36.0, 36.27], [38.0, 38.5], [40.0, 40.29], [52.0, 53.86], [55.0, 55.98], [58.0, 60.4], [62.0, 63.96], [65.0, 67.1], [69.0, 69.36], [70.0, 74.36], [82.0, 83.05], [84.0, 84.7], [86.0, 86.04], [87.0, 89.13], [91.0, 92.06], [95.0, 95.42], [98.0, 99.69], [100.0, 103.92], [107.0, 108.97], [111.0, 113.73], [114.0, 113.83], [114.0, 117.31], [119.0, 122.15], [124.0, 125.19], [126.0, 129.69], [131.0, 132.04], [132.0, 133.12], [134.0, 134.15], [136.0, 138.18], [138.0, 139.77], [141.0, 143.8], [145.0, 148.2], [149.0, 150.13], [151.0, 151.53], [154.0, 154.5], [155.0, 156.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.85, 99.96, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.84, 0.0, 99.59, 0.0, 100.0, 0.0, 0.0, 0.0, 99.88, 0.0, 0.0, 0.0, 100.0, 0.0, 99.95, 0.0, 81.0, 99.52, 0.0, 83.52, 0.0, 0.0, 0.0, 99.36, 0.0, 98.27, 95.09, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.68, 2.75, 5.88, 1.79, 0.27, 0.5, 0.29, 1.86, 0.98, 2.4, 1.96, 2.1, 0.36, 4.36, 1.05, 0.7, 0.04, 2.13, 1.06, 0.42, 1.69, 3.92, 1.97, 2.73, -0.17, 3.31, 3.15, 1.19, 3.69, 1.04, 1.12, 0.15, 2.18, 1.77, 2.8, 3.2, 1.13, 0.53, 0.5, 1.96]} \ No newline at end of file diff --git a/annotations_filtered/-Y1lyQpBVJI_filtered.json b/annotations_filtered/-Y1lyQpBVJI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c78b753b938d2fbf6b601e8df37eab9432bc4066 --- /dev/null +++ b/annotations_filtered/-Y1lyQpBVJI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.77], [1.0, 1.49], [4.0, 4.75], [5.0, 5.51], [8.0, 8.43], [9.0, 9.51], [11.0, 11.55], [27.0, 27.41]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [-0.23, 0.49, 0.75, 0.51, 0.43, 0.51, 0.55, 0.41]} \ No newline at end of file diff --git a/annotations_filtered/-Y2wqkD2KVM_filtered.json b/annotations_filtered/-Y2wqkD2KVM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..efb4b8382e1fdf55e313dbce928c3991e4a7e209 --- /dev/null +++ b/annotations_filtered/-Y2wqkD2KVM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 32.98], [33.0, 33.03], [35.0, 75.47], [77.0, 77.31], [77.0, 99.5], [100.0, 100.89], [102.0, 130.76]], "keep_status": [true, false, false, false, false, false, true], "silence_prob": [31.67, 0.0, 0.0, 0.0, 34.18, 0.0, 30.13], "audiomae_on_audioset": [[["music", 50.93], ["trombone", 9.19], ["brass instrument", 5.2]], null, null, null, [["music", 70.11], ["musical instrument", 6.2], ["synthesizer", 4.52]], null, [["livestock, farm animals, working animals", 18.37], ["moo", 9.83], ["cattle, bovinae", 9.47]]], "duration": [24.98, 0.03, 40.47, 0.31, 22.5, 0.89, 28.76]} \ No newline at end of file diff --git a/annotations_filtered/-Y3tZpAdWTc_filtered.json b/annotations_filtered/-Y3tZpAdWTc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6fda5f53bf42d7d09edd07fe915a8e13c3889736 --- /dev/null +++ b/annotations_filtered/-Y3tZpAdWTc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.7], [5.0, 6.34], [7.0, 9.32], [10.0, 10.37], [11.0, 11.58], [12.0, 12.51], [18.0, 21.41], [26.0, 26.08], [29.0, 30.33], [32.0, 33.03], [35.0, 35.72], [37.0, 38.97], [40.0, 40.27], [47.0, 47.21], [51.0, 52.44], [53.0, 54.33], [56.0, 55.97], [57.0, 57.38], [62.0, 62.38], [65.0, 65.72], [68.0, 68.45], [71.0, 71.68], [74.0, 73.94], [81.0, 81.94], [84.0, 84.42], [85.0, 85.6], [90.0, 90.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 76.37, 0.0, 0.0, 0.0, 85.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.7, 1.34, 2.32, 0.37, 0.58, 0.51, 3.41, 0.08, 1.33, 1.03, 0.72, 1.97, 0.27, 0.21, 1.44, 1.33, -0.03, 0.38, 0.38, 0.72, 0.45, 0.68, -0.06, 0.94, 0.42, 0.6, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/-YGxccN_j6o_filtered.json b/annotations_filtered/-YGxccN_j6o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b112b11aba0f4fbf0dd298c11c3b9b926023e052 --- /dev/null +++ b/annotations_filtered/-YGxccN_j6o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.22], [12.0, 12.18], [13.0, 13.19], [16.0, 16.63], [19.0, 19.26], [20.0, 19.77], [20.0, 20.51], [21.0, 21.96], [23.0, 23.35], [25.0, 25.44], [27.0, 27.41], [29.0, 30.0], [32.0, 32.7], [35.0, 36.75], [37.0, 37.22], [37.0, 38.48], [39.0, 40.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.22, 0.18, 0.19, 0.63, 0.26, -0.23, 0.51, 0.96, 0.35, 0.44, 0.41, 1.0, 0.7, 1.75, 0.22, 1.48, 1.53]} \ No newline at end of file diff --git a/annotations_filtered/-YTLGLeKoJQ_filtered.json b/annotations_filtered/-YTLGLeKoJQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d7981f92c0c4e35728d13dd5801d8ad1d69b651 --- /dev/null +++ b/annotations_filtered/-YTLGLeKoJQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 49.44], [50.0, 57.15], [58.0, 58.99], [61.0, 61.4], [64.0, 65.03], [66.0, 67.81], [70.0, 73.97], [75.0, 95.4], [96.0, 99.05], [102.0, 103.87], [105.0, 112.5], [114.0, 114.2], [114.0, 118.96], [120.0, 120.88], [122.0, 127.08], [128.0, 128.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 62.17, 0.0, 0.0, 0.0, 0.0, 82.07, 36.25, 99.94, 0.0, 72.75, 0.0, 58.3, 0.0, 67.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 66.25], ["burst, pop", 3.06], ["explosion", 2.92]], null, null, null, null, null, null, null, null], "duration": [1.44, 7.15, 0.99, 0.4, 1.03, 1.81, 3.97, 20.4, 3.05, 1.87, 7.5, 0.2, 4.96, 0.88, 5.08, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/-YV8tJhGojY_filtered.json b/annotations_filtered/-YV8tJhGojY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9ae3fec7a2d801934c5d3725971d38d0c69564d --- /dev/null +++ b/annotations_filtered/-YV8tJhGojY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.41], [9.0, 9.71], [10.0, 10.44], [12.0, 12.87], [18.0, 18.96], [24.0, 25.24], [26.0, 30.42], [32.0, 32.22], [33.0, 34.11], [37.0, 37.32], [40.0, 40.22], [41.0, 41.88], [45.0, 45.82], [47.0, 47.9], [52.0, 52.42], [53.0, 54.31], [55.0, 55.75], [57.0, 56.91], [87.0, 86.63], [87.0, 87.79], [90.0, 93.02], [94.0, 97.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 99.4], "audiomae_on_audioset": [null, null, null, null, null, null, [["cattle, bovinae", 38.46], ["moo", 34.48], ["livestock, farm animals, working animals", 13.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.41, 0.71, 0.44, 0.87, 0.96, 1.24, 4.42, 0.22, 1.11, 0.32, 0.22, 0.88, 0.82, 0.9, 0.42, 1.31, 0.75, -0.09, -0.37, 0.79, 3.02, 3.12]} \ No newline at end of file diff --git a/annotations_filtered/-YaPh7shnWQ_filtered.json b/annotations_filtered/-YaPh7shnWQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..731184072009e93618da028a18f41f99eb0e7247 --- /dev/null +++ b/annotations_filtered/-YaPh7shnWQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.15], [3.0, 4.04], [5.0, 6.81], [7.0, 9.46], [24.0, 24.38], [25.0, 25.84], [42.0, 42.62], [51.0, 51.16], [58.0, 58.77], [59.0, 60.22], [64.0, 65.62], [76.0, 78.95], [81.0, 81.6], [82.0, 81.63], [84.0, 83.67], [94.0, 96.15], [100.0, 101.06], [101.0, 101.49], [102.0, 101.6], [102.0, 104.01], [107.0, 110.05], [115.0, 116.82], [118.0, 119.94], [127.0, 128.19], [135.0, 142.99], [144.0, 148.29], [149.0, 149.5], [163.0, 164.91], [167.0, 173.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 57.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.66, 0.0, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 92.48, 99.95, 0.0, 0.0, 0.0, 99.95, 84.62, 0.0, 0.0, 52.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.15, 1.04, 1.81, 2.46, 0.38, 0.84, 0.62, 0.16, 0.77, 1.22, 1.62, 2.95, 0.6, -0.37, -0.33, 2.15, 1.06, 0.49, -0.4, 2.01, 3.05, 1.82, 1.94, 1.19, 7.99, 4.29, 0.5, 1.91, 6.23]} \ No newline at end of file diff --git a/annotations_filtered/-YiImyOVCj4_filtered.json b/annotations_filtered/-YiImyOVCj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55bbfbbb3e0f7724b51ad8ecf4c8d450d69a8653 --- /dev/null +++ b/annotations_filtered/-YiImyOVCj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.56], [3.0, 4.99], [6.0, 7.59], [9.0, 9.85], [11.0, 12.33], [15.0, 19.36], [20.0, 20.66], [24.0, 23.94], [25.0, 26.28], [27.0, 27.92], [32.0, 31.95], [35.0, 36.81], [39.0, 40.07], [42.0, 43.02], [43.0, 43.98], [45.0, 46.38], [47.0, 48.52], [52.0, 53.35], [54.0, 56.12], [57.0, 60.24], [62.0, 63.64], [66.0, 66.26], [71.0, 71.56], [77.0, 83.0], [86.0, 86.83], [90.0, 91.45], [94.0, 94.76], [101.0, 101.8], [109.0, 109.61], [110.0, 111.18], [114.0, 116.18], [127.0, 127.36], [129.0, 130.08], [132.0, 132.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 75.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.22, 51.44, 0.0, 0.0, 0.0, 74.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.42, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.56, 1.99, 1.59, 0.85, 1.33, 4.36, 0.66, -0.06, 1.28, 0.92, -0.05, 1.81, 1.07, 1.02, 0.98, 1.38, 1.52, 1.35, 2.12, 3.24, 1.64, 0.26, 0.56, 6.0, 0.83, 1.45, 0.76, 0.8, 0.61, 1.18, 2.18, 0.36, 1.08, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/-YykCz0f3Vk_filtered.json b/annotations_filtered/-YykCz0f3Vk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4455e559691228b7d6082d4fc6c127faef48b543 --- /dev/null +++ b/annotations_filtered/-YykCz0f3Vk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 12.77], [13.0, 93.95]], "keep_status": [false, false], "silence_prob": [100.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [5.77, 80.95]} \ No newline at end of file diff --git a/annotations_filtered/-ZRSgs6PHaY_filtered.json b/annotations_filtered/-ZRSgs6PHaY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48f43f8cbb60bf47c456cbea9ddd59f71781e60e --- /dev/null +++ b/annotations_filtered/-ZRSgs6PHaY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.95], [26.0, 26.81], [28.0, 28.27], [29.0, 29.94], [31.0, 31.7], [32.0, 33.78], [34.0, 35.5], [39.0, 40.63], [43.0, 43.71], [48.0, 48.2], [48.0, 49.52], [50.0, 51.38], [54.0, 58.73], [63.0, 81.97], [85.0, 85.58], [86.0, 86.32], [111.0, 116.7], [118.0, 117.95], [118.0, 118.05], [118.0, 121.81], [122.0, 123.57], [127.0, 127.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.0, 28.91, 0.0, 0.0, 30.01, 0.0, 0.0, 36.05, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 24.9], ["speech", 14.71], ["fly, housefly", 9.15]], [["speech", 54.11], ["music", 33.27], ["sound effect", 1.39]], null, null, [["mains hum", 49.27], ["hum", 34.45], ["throbbing", 5.39]], null, null, [["speech", 54.69], ["radio", 5.88], ["sneeze", 5.53]], null, null], "duration": [0.95, 0.81, 0.27, 0.94, 0.7, 1.78, 1.5, 1.63, 0.71, 0.2, 1.52, 1.38, 4.73, 18.97, 0.58, 0.32, 5.7, -0.05, 0.05, 3.81, 1.57, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/-ZlL0LLfjKY_filtered.json b/annotations_filtered/-ZlL0LLfjKY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d4420bf6d1a69f1a94b3cd11031d498ec709e2f --- /dev/null +++ b/annotations_filtered/-ZlL0LLfjKY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.64], [9.0, 9.58], [14.0, 14.74], [15.0, 15.85], [17.0, 17.39], [23.0, 23.53], [24.0, 27.21], [30.0, 31.77], [34.0, 37.05], [38.0, 39.26], [41.0, 42.87], [45.0, 45.42], [52.0, 52.32], [53.0, 53.47], [57.0, 57.65], [59.0, 60.35], [62.0, 62.75], [64.0, 68.13], [71.0, 71.46], [72.0, 72.77], [73.0, 83.94], [86.0, 89.9], [99.0, 99.06], [104.0, 106.39], [107.0, 107.86], [124.0, 124.39], [126.0, 126.45], [131.0, 132.34], [142.0, 143.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.16, 0.0, 0.0, 93.76, 51.23, 0.0, 63.53, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.36, 0.58, 0.74, 0.85, 0.39, 0.53, 3.21, 1.77, 3.05, 1.26, 1.87, 0.42, 0.32, 0.47, 0.65, 1.35, 0.75, 4.13, 0.46, 0.77, 10.94, 3.9, 0.06, 2.39, 0.86, 0.39, 0.45, 1.34, 1.4]} \ No newline at end of file diff --git a/annotations_filtered/-Zr-B5aIEvE_filtered.json b/annotations_filtered/-Zr-B5aIEvE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba9c1bfe42f59edeb39bc526f078c7d5002f4fd5 --- /dev/null +++ b/annotations_filtered/-Zr-B5aIEvE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 35.18], [38.0, 98.32], [101.0, 133.22], [140.0, 159.61], [161.0, 164.91], [167.0, 182.87]], "keep_status": [true, false, false, true, false, false], "silence_prob": [36.56, 0.0, 0.0, 37.62, 55.11, 41.62], "audiomae_on_audioset": [[["hum", 33.4], ["music", 14.43], ["mains hum", 13.8]], null, null, [["music", 50.64], ["throbbing", 9.83], ["electronic music", 8.58]], null, [["speech", 41.73], ["sidetone", 16.96], ["music", 11.56]]], "duration": [18.18, 60.32, 32.22, 19.61, 3.91, 15.87]} \ No newline at end of file diff --git a/annotations_filtered/-ZxtmDbqDRc_filtered.json b/annotations_filtered/-ZxtmDbqDRc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ee7befc5a36c161029c42bedef9014586caee25 --- /dev/null +++ b/annotations_filtered/-ZxtmDbqDRc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.53], [3.0, 4.9], [6.0, 6.13], [10.0, 10.88], [13.0, 13.29], [19.0, 30.13], [33.0, 33.49], [35.0, 35.5], [42.0, 42.55], [47.0, 47.01], [47.0, 47.22], [50.0, 50.82], [55.0, 55.73], [58.0, 57.74], [58.0, 62.56], [65.0, 66.07], [68.0, 67.86], [69.0, 69.85], [79.0, 79.68], [81.0, 81.21], [83.0, 83.71], [90.0, 90.31], [110.0, 110.13], [112.0, 112.04], [113.0, 113.83], [114.0, 114.54], [118.0, 118.47], [120.0, 120.85], [122.0, 123.43], [124.0, 124.71], [125.0, 125.61], [127.0, 129.79], [131.0, 136.93], [141.0, 144.46], [148.0, 155.85], [158.0, 158.28], [159.0, 163.66], [168.0, 170.16], [171.0, 172.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 28.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.38, 29.21, 30.81, 29.5, 0.0, 30.03, 29.75, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 80.42], ["music", 15.08], ["whack, thwack", 0.48]], null, null, null, null, null, null, null, null, [["speech", 55.72], ["whack, thwack", 7.75], ["music", 5.47]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 56.46], ["speech", 13.65], ["theremin", 3.32]], [["music", 32.61], ["speech", 24.87], ["throbbing", 5.52]], [["music", 47.35], ["throbbing", 29.94], ["electronic music", 4.61]], [["breaking", 33.03], ["music", 27.48], ["glass", 4.49]], null, [["music", 52.67], ["theremin", 21.57], ["hum", 3.74]], [["speech", 42.86], ["civil defense siren", 22.16], ["siren", 3.53]], null], "duration": [1.53, 1.9, 0.13, 0.88, 0.29, 11.13, 0.49, 0.5, 0.55, 0.01, 0.22, 0.82, 0.73, -0.26, 4.56, 1.07, -0.14, 0.85, 0.68, 0.21, 0.71, 0.31, 0.13, 0.04, 0.83, 0.54, 0.47, 0.85, 1.43, 0.71, 0.61, 2.79, 5.93, 3.46, 7.85, 0.28, 4.66, 2.16, 1.27]} \ No newline at end of file diff --git a/annotations_filtered/-_Bdf9C0SAU_filtered.json b/annotations_filtered/-_Bdf9C0SAU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a6d6df0f7c08b01fa35a47e665ba1f4d9cf17b5 --- /dev/null +++ b/annotations_filtered/-_Bdf9C0SAU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 11.65], [14.0, 18.57], [21.0, 26.25], [27.0, 28.39], [29.0, 30.32], [31.0, 33.03], [40.0, 40.73], [43.0, 45.94], [46.0, 46.67], [47.0, 48.61], [58.0, 58.62], [70.0, 70.61], [71.0, 74.85], [78.0, 78.41], [82.0, 83.17], [85.0, 85.48], [86.0, 87.0], [90.0, 90.51], [93.0, 93.65], [95.0, 107.45], [108.0, 110.05], [114.0, 115.33], [120.0, 123.4]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [47.08, 44.87, 47.23, 0.0, 0.0, 46.33, 0.0, 60.05, 0.0, 0.0, 0.0, 0.0, 38.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.48, 39.88, 0.0, 66.39], "audiomae_on_audioset": [[["hum", 34.01], ["throbbing", 20.71], ["mains hum", 6.84]], [["hum", 44.99], ["throbbing", 14.01], ["speech", 8.43]], [["hum", 56.51], ["throbbing", 17.52], ["mains hum", 15.5]], null, null, [["hum", 49.51], ["mains hum", 18.31], ["throbbing", 15.24]], null, null, null, null, null, null, [["hum", 60.07], ["mains hum", 23.13], ["throbbing", 8.43]], null, null, null, null, null, null, [["hum", 44.63], ["speech", 12.52], ["throbbing", 10.63]], [["hum", 31.92], ["music", 11.91], ["mains hum", 11.66]], null, null], "duration": [9.65, 4.57, 5.25, 1.39, 1.32, 2.03, 0.73, 2.94, 0.67, 1.61, 0.62, 0.61, 3.85, 0.41, 1.17, 0.48, 1.0, 0.51, 0.65, 12.45, 2.05, 1.33, 3.4]} \ No newline at end of file diff --git a/annotations_filtered/-_HlyIgHUa0_filtered.json b/annotations_filtered/-_HlyIgHUa0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b86b3adff26d74de769213cb044c64de66a108f --- /dev/null +++ b/annotations_filtered/-_HlyIgHUa0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.62], [7.0, 9.91], [13.0, 16.12], [17.0, 20.16], [21.0, 24.7], [25.0, 28.46], [30.0, 32.88], [35.0, 38.03], [38.0, 41.96], [46.0, 48.61], [50.0, 53.84], [55.0, 58.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.94, 99.98, 99.96, 99.98, 99.82, 85.35, 98.66, 99.95, 73.36, 100.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.62, 2.91, 3.12, 3.16, 3.7, 3.46, 2.88, 3.03, 3.96, 2.61, 3.84, 3.02]} \ No newline at end of file diff --git a/annotations_filtered/-_XIgfmDa1s_filtered.json b/annotations_filtered/-_XIgfmDa1s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8fba7b1ffcd4f41c30f07a474922e5ae8ae85fc9 --- /dev/null +++ b/annotations_filtered/-_XIgfmDa1s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.47], [8.0, 9.61], [18.0, 19.2], [25.0, 33.67], [34.0, 35.34], [40.0, 42.52], [45.0, 48.1], [49.0, 57.25], [61.0, 60.88], [63.0, 70.55], [76.0, 76.94], [77.0, 78.34], [80.0, 80.72], [85.0, 85.31], [86.0, 86.32], [88.0, 88.4], [89.0, 92.85], [95.0, 100.85], [101.0, 102.44], [104.0, 116.14], [117.0, 120.75], [129.0, 129.09], [130.0, 130.79]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [40.62, 0.0, 0.0, 32.85, 0.0, 98.86, 99.94, 99.44, 0.0, 96.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.18, 57.09, 0.0, 74.44, 44.12, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 67.11], ["tuning fork", 8.52], ["inside, small room", 3.12]], null, null, [["speech", 58.27], ["gong", 3.11], ["hum", 3.0]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 50.46], ["sidetone", 21.46], ["sine wave", 5.78]], null, null, null, [["sidetone", 32.51], ["speech", 19.18], ["hum", 14.1]], null, null], "duration": [2.47, 1.61, 1.2, 8.67, 1.34, 2.52, 3.1, 8.25, -0.12, 7.55, 0.94, 1.34, 0.72, 0.31, 0.32, 0.4, 3.85, 5.85, 1.44, 12.14, 3.75, 0.09, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/-_YHQheqKxE_filtered.json b/annotations_filtered/-_YHQheqKxE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b89668dd2b91ce6b9d9a76d5670f3f0987b382b --- /dev/null +++ b/annotations_filtered/-_YHQheqKxE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 55.22], [58.0, 58.87], [59.0, 60.62], [61.0, 79.95], [84.0, 101.41], [102.0, 117.64]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.78, 31.33, 30.37], "audiomae_on_audioset": [null, null, null, [["music", 59.67], ["synthesizer", 4.51], ["electronic music", 3.11]], [["music", 66.95], ["didgeridoo", 14.3], ["speech", 2.35]], [["buzz", 74.52], ["music", 8.58], ["insect", 2.19]]], "duration": [53.22, 0.87, 1.62, 18.95, 17.41, 15.64]} \ No newline at end of file diff --git a/annotations_filtered/-a1FAp677Vo_filtered.json b/annotations_filtered/-a1FAp677Vo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a9be38ace351788cd0637180600013ce65c055a --- /dev/null +++ b/annotations_filtered/-a1FAp677Vo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.05], [7.0, 28.19], [30.0, 35.92], [36.0, 42.69], [43.0, 44.41], [46.0, 48.46], [49.0, 51.11], [52.0, 90.58], [92.0, 94.59]], "keep_status": [false, false, false, false, false, false, false, false, true], "silence_prob": [100.0, 71.29, 96.17, 66.03, 0.0, 100.0, 99.96, 0.0, 39.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 19.67], ["synthesizer", 16.89], ["effects unit", 9.86]]], "duration": [3.05, 21.19, 5.92, 6.69, 1.41, 2.46, 2.11, 38.58, 2.59]} \ No newline at end of file diff --git a/annotations_filtered/-agdK2N5wX4_filtered.json b/annotations_filtered/-agdK2N5wX4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..611b60470ced1761cc3ea766efcaa94b840fd401 --- /dev/null +++ b/annotations_filtered/-agdK2N5wX4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.36], [23.0, 23.75], [25.0, 25.93], [28.0, 30.77], [31.0, 32.64], [34.0, 35.82], [37.0, 39.12], [41.0, 41.54], [43.0, 43.66], [46.0, 46.35], [47.0, 52.37], [54.0, 58.94], [60.0, 62.51], [63.0, 70.6], [71.0, 72.93], [77.0, 78.97], [80.0, 81.8], [82.0, 88.28], [91.0, 94.73], [95.0, 120.41], [121.0, 124.31], [125.0, 126.22], [128.0, 129.07], [130.0, 132.12], [133.0, 166.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 85.9, 0.0, 0.0, 72.6, 0.0, 0.0, 0.0, 70.86, 68.54, 69.47, 52.22, 0.0, 0.0, 0.0, 41.28, 41.5, 45.88, 61.77, 0.0, 0.0, 40.47, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 42.49], ["music", 26.07], ["quack", 4.73]], [["throbbing", 47.39], ["hum", 26.36], ["music", 9.93]], [["throbbing", 54.7], ["hum", 31.13], ["music", 5.59]], null, null, null, [["music", 16.53], ["sine wave", 13.52], ["sidetone", 6.44]], null], "duration": [0.36, 0.75, 0.93, 2.77, 1.64, 1.82, 2.12, 0.54, 0.66, 0.35, 5.37, 4.94, 2.51, 7.6, 1.93, 1.97, 1.8, 6.28, 3.73, 25.41, 3.31, 1.22, 1.07, 2.12, 33.24]} \ No newline at end of file diff --git a/annotations_filtered/-arTRBtT9d4_filtered.json b/annotations_filtered/-arTRBtT9d4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f22d5c10b4d5bbc6dc82a8bf1200f426ce0ecc1 --- /dev/null +++ b/annotations_filtered/-arTRBtT9d4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 13.44], [16.0, 17.22], [20.0, 23.63], [25.0, 24.98], [26.0, 27.04], [27.0, 28.05], [31.0, 32.61], [35.0, 39.68], [40.0, 42.11], [43.0, 45.79], [47.0, 47.51], [48.0, 49.96], [59.0, 65.91], [67.0, 73.35], [75.0, 74.9], [80.0, 81.92], [82.0, 88.8], [107.0, 107.18], [111.0, 113.09], [114.0, 115.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [42.46, 0.0, 35.34, 0.0, 0.0, 0.0, 0.0, 51.55, 91.64, 94.22, 0.0, 0.0, 30.09, 30.76, 0.0, 0.0, 29.75, 0.0, 35.35, 0.0], "audiomae_on_audioset": [[["speech", 60.81], ["fart", 27.92], ["fly, housefly", 1.66]], null, [["speech", 62.09], ["sidetone", 12.68], ["music", 5.46]], null, null, null, null, null, null, null, null, null, [["speech", 33.21], ["music", 26.39], ["boing", 13.13]], [["music", 61.79], ["speech", 18.46], ["boing", 2.09]], null, null, [["music", 35.71], ["boing", 31.4], ["speech", 11.65]], null, [["music", 45.77], ["dubstep", 10.8], ["electronic music", 8.43]], null], "duration": [7.44, 1.22, 3.63, -0.02, 1.04, 1.05, 1.61, 4.68, 2.11, 2.79, 0.51, 1.96, 6.91, 6.35, -0.1, 1.92, 6.8, 0.18, 2.09, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/-b-EFcA7ing_filtered.json b/annotations_filtered/-b-EFcA7ing_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cdd99c91558ded4503577b15199fb784c113782 --- /dev/null +++ b/annotations_filtered/-b-EFcA7ing_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.0], [25.0, 25.02], [28.0, 28.27], [33.0, 35.63], [49.0, 49.62], [53.0, 55.85], [67.0, 67.9], [71.0, 72.57], [82.0, 82.39], [87.0, 87.25], [99.0, 99.15], [100.0, 101.06], [106.0, 106.44]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.39, 0.0, 0.0, 48.74, 0.0, 67.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 38.43], ["fart", 14.23], ["door", 8.28]], null, null, [["music", 63.79], ["speech", 7.55], ["throbbing", 6.01]], null, null, null, null, null, null, null, null, null], "duration": [3.0, 0.02, 0.27, 2.63, 0.62, 2.85, 0.9, 1.57, 0.39, 0.25, 0.15, 1.06, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/-bG0iKaxQYM_filtered.json b/annotations_filtered/-bG0iKaxQYM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3024f2585776dcce397bcd0da3b58c2f672600e7 --- /dev/null +++ b/annotations_filtered/-bG0iKaxQYM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.64], [6.0, 7.53], [8.0, 10.88], [12.0, 14.61], [17.0, 19.79], [20.0, 24.75], [25.0, 27.72], [28.0, 30.64], [31.0, 32.76], [36.0, 37.64], [39.0, 40.47], [42.0, 45.37], [47.0, 48.57], [53.0, 52.57], [53.0, 55.61], [56.0, 58.8], [61.0, 62.56], [64.0, 65.82], [67.0, 66.77], [68.0, 69.38], [72.0, 75.19], [76.0, 77.38], [81.0, 92.75], [95.0, 96.72], [98.0, 100.57], [102.0, 104.82], [115.0, 115.7], [116.0, 116.83], [118.0, 119.72], [123.0, 127.38], [128.0, 132.49], [133.0, 138.0], [139.0, 141.66], [143.0, 145.08]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 87.0, 99.26, 87.92, 79.59, 43.18, 98.93, 0.0, 0.0, 0.0, 99.1, 0.0, 0.0, 89.19, 80.29, 0.0, 0.0, 0.0, 0.0, 98.59, 0.0, 62.07, 0.0, 47.58, 34.8, 0.0, 0.0, 0.0, 94.07, 100.0, 99.56, 99.98, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 33.73], ["music", 17.65], ["hum", 8.19]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 35.6], ["hum", 20.23], ["throbbing", 7.94]], [["music", 25.92], ["hum", 17.8], ["throbbing", 11.23]], null, null, null, null, null, null, null, null], "duration": [1.64, 1.53, 2.88, 2.61, 2.79, 4.75, 2.72, 2.64, 1.76, 1.64, 1.47, 3.37, 1.57, -0.43, 2.61, 2.8, 1.56, 1.82, -0.23, 1.38, 3.19, 1.38, 11.75, 1.72, 2.57, 2.82, 0.7, 0.83, 1.72, 4.38, 4.49, 5.0, 2.66, 2.08]} \ No newline at end of file diff --git a/annotations_filtered/-bzOzD2QShQ_filtered.json b/annotations_filtered/-bzOzD2QShQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8802e6f9b989b62e191711fbebd9c6afb35e6428 --- /dev/null +++ b/annotations_filtered/-bzOzD2QShQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 17.24], [21.0, 22.71], [24.0, 26.2], [27.0, 27.51], [36.0, 37.98], [39.0, 40.58], [42.0, 46.92], [50.0, 50.67], [53.0, 54.4], [58.0, 60.81], [62.0, 62.55], [66.0, 72.89], [74.0, 74.83], [76.0, 76.91], [78.0, 79.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.64, 0.0, 88.1, 0.0, 0.0, 0.0, 51.44, 0.0, 0.0, 45.85, 0.0, 55.89, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 51.46], ["music", 12.58], ["sidetone", 9.36]], null, null, null, null, null, null, null, null, [["speech", 69.92], ["sidetone", 15.75], ["radio", 4.39]], null, null, null, null, null], "duration": [4.24, 1.71, 2.2, 0.51, 1.98, 1.58, 4.92, 0.67, 1.4, 2.81, 0.55, 6.89, 0.83, 0.91, 1.62]} \ No newline at end of file diff --git a/annotations_filtered/-c9-2KcnLXI_filtered.json b/annotations_filtered/-c9-2KcnLXI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..863e0a9334f40392635940c8d243463b99f6b689 --- /dev/null +++ b/annotations_filtered/-c9-2KcnLXI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 21.64], [24.0, 24.39], [25.0, 33.61], [34.0, 38.94], [41.0, 46.18], [48.0, 100.06], [102.0, 102.93], [103.0, 105.41], [107.0, 106.84], [108.0, 108.89]], "keep_status": [false, false, true, false, false, false, false, true, false, false], "silence_prob": [33.0, 0.0, 32.67, 32.83, 32.34, 0.0, 0.0, 43.33, 0.0, 0.0], "audiomae_on_audioset": [[["music", 58.23], ["throbbing", 22.61], ["hum", 4.18]], null, [["music", 45.21], ["throbbing", 16.12], ["hum", 7.23]], [["music", 65.66], ["synthesizer", 8.42], ["theremin", 5.72]], [["music", 77.77], ["synthesizer", 4.02], ["musical instrument", 3.83]], null, null, [["croak", 19.01], ["frog", 16.97], ["animal", 16.62]], null, null], "duration": [19.64, 0.39, 8.61, 4.94, 5.18, 52.06, 0.93, 2.41, -0.16, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/-cBGthOZ-Ls_filtered.json b/annotations_filtered/-cBGthOZ-Ls_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..662e46680c183cec4fc9f998b8dd7bdf897bbebc --- /dev/null +++ b/annotations_filtered/-cBGthOZ-Ls_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.68], [2.0, 2.51], [3.0, 5.05], [9.0, 9.66], [10.0, 11.92], [12.0, 12.06], [13.0, 13.42], [14.0, 16.53], [19.0, 19.55], [20.0, 20.09], [20.0, 21.91], [23.0, 23.08], [24.0, 35.33], [37.0, 39.77], [47.0, 47.34], [48.0, 54.18], [55.0, 57.47], [59.0, 59.31], [60.0, 60.71], [63.0, 63.41], [69.0, 70.28], [72.0, 72.35], [77.0, 84.21], [102.0, 103.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 98.86, 0.0, 0.0, 0.0, 0.0, 76.53, 0.0, 0.0, 0.0, 0.0, 93.76, 58.22, 0.0, 40.93, 46.72, 0.0, 0.0, 0.0, 0.0, 0.0, 74.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 79.63], ["synthesizer", 7.3], ["musical instrument", 3.32]], [["music", 31.14], ["noise", 12.99], ["theremin", 10.22]], null, null, null, null, null, null, null], "duration": [-0.32, 0.51, 2.05, 0.66, 1.92, 0.06, 0.42, 2.53, 0.55, 0.09, 1.91, 0.08, 11.33, 2.77, 0.34, 6.18, 2.47, 0.31, 0.71, 0.41, 1.28, 0.35, 7.21, 1.86]} \ No newline at end of file diff --git a/annotations_filtered/-cFW3A13o8s_filtered.json b/annotations_filtered/-cFW3A13o8s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..521d4071e747c49b6407414373054f9914e397dc --- /dev/null +++ b/annotations_filtered/-cFW3A13o8s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.52], [10.0, 10.52], [11.0, 13.07], [17.0, 18.81], [20.0, 20.9], [26.0, 26.55], [27.0, 27.3], [28.0, 28.65], [30.0, 30.97], [32.0, 32.1], [34.0, 38.45], [41.0, 43.04], [44.0, 45.82], [51.0, 54.04], [55.0, 54.82], [56.0, 57.0], [58.0, 58.6], [62.0, 63.71], [65.0, 65.52], [72.0, 72.54], [75.0, 78.17], [82.0, 102.61], [104.0, 112.23], [113.0, 127.26], [130.0, 130.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 98.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.11, 84.43, 0.0, 57.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.72, 54.76, 93.45, 99.95, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.52, 0.52, 2.07, 1.81, 0.9, 0.55, 0.3, 0.65, 0.97, 0.1, 4.45, 2.04, 1.82, 3.04, -0.18, 1.0, 0.6, 1.71, 0.52, 0.54, 3.17, 20.61, 8.23, 14.26, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/-c_ctZ4lUCk_filtered.json b/annotations_filtered/-c_ctZ4lUCk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5d3eecec43d76937a4bae8fecb5550217da2563 --- /dev/null +++ b/annotations_filtered/-c_ctZ4lUCk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.64], [17.0, 18.22], [23.0, 24.09], [30.0, 30.89], [32.0, 32.49], [34.0, 34.06], [35.0, 35.8], [42.0, 45.76], [46.0, 47.26], [52.0, 53.97], [59.0, 60.03], [65.0, 64.91], [73.0, 75.41], [82.0, 82.58], [84.0, 83.94], [91.0, 93.85], [99.0, 100.36], [103.0, 106.03], [109.0, 113.04], [114.0, 115.53], [117.0, 118.29], [120.0, 121.71], [124.0, 124.58], [130.0, 132.51], [133.0, 134.1]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, true, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.43, 0.0, 0.0, 0.0, 0.0, 34.03, 0.0, 0.0, 33.51, 0.0, 33.73, 33.81, 0.0, 0.0, 0.0, 0.0, 34.26, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 39.85], ["hum", 12.14], ["mains hum", 4.95]], null, null, null, null, [["hum", 27.48], ["throbbing", 20.87], ["mains hum", 14.46]], null, null, [["hum", 36.34], ["music", 15.94], ["mains hum", 11.8]], null, [["hum", 30.73], ["music", 13.03], ["mains hum", 8.74]], [["hum", 58.12], ["throbbing", 15.11], ["mains hum", 14.6]], null, null, null, null, [["hum", 17.12], ["music", 12.08], ["mains hum", 10.27]], null], "duration": [0.64, 1.22, 1.09, 0.89, 0.49, 0.06, 0.8, 3.76, 1.26, 1.97, 1.03, -0.09, 2.41, 0.58, -0.06, 2.85, 1.36, 3.03, 4.04, 1.53, 1.29, 1.71, 0.58, 2.51, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/-cdk5mhKuWc_filtered.json b/annotations_filtered/-cdk5mhKuWc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fedf11a7dde5b59d41bdec82e51fdb204e1de615 --- /dev/null +++ b/annotations_filtered/-cdk5mhKuWc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.38], [14.0, 25.52], [29.0, 33.88], [35.0, 34.96], [35.0, 70.95], [71.0, 81.97], [86.0, 114.72], [115.0, 116.43], [117.0, 123.96], [127.0, 129.46]], "keep_status": [false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 49.4, 61.18, 0.0, 0.0, 37.38, 46.64, 0.0, 41.66, 39.21], "audiomae_on_audioset": [null, [["music", 67.95], ["musical instrument", 8.17], ["didgeridoo", 7.97]], null, null, null, [["music", 51.94], ["speech", 12.32], ["musical instrument", 9.97]], [["music", 25.42], ["gasp", 20.66], ["insect", 2.68]], null, [["music", 61.49], ["synthesizer", 8.01], ["effects unit", 7.18]], [["music", 66.92], ["sonar", 5.79], ["musical instrument", 4.29]]], "duration": [1.38, 11.52, 4.88, -0.04, 35.95, 10.97, 28.72, 1.43, 6.96, 2.46]} \ No newline at end of file diff --git a/annotations_filtered/-dMBMU9FCQU_filtered.json b/annotations_filtered/-dMBMU9FCQU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae38164d7d68f92829d88821be5174142bbe8718 --- /dev/null +++ b/annotations_filtered/-dMBMU9FCQU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.74], [8.0, 8.97], [11.0, 13.96], [16.0, 18.4], [20.0, 58.33], [64.0, 64.35], [65.0, 73.23], [74.0, 75.37], [76.0, 78.49], [79.0, 81.41], [87.0, 87.94], [89.0, 89.48], [90.0, 115.18], [117.0, 118.08], [120.0, 120.29], [121.0, 132.7]], "keep_status": [false, false, true, true, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 48.61, 40.81, 0.0, 0.0, 38.5, 0.0, 37.39, 39.61, 0.0, 0.0, 29.66, 0.0, 0.0, 30.67], "audiomae_on_audioset": [null, null, [["music", 30.98], ["hum", 8.38], ["didgeridoo", 5.43]], [["speech", 21.04], ["hum", 19.83], ["music", 17.35]], null, null, [["whack, thwack", 21.52], ["hum", 10.72], ["mains hum", 7.14]], null, [["speech", 58.92], ["music", 10.83], ["sidetone", 3.64]], [["boing", 38.62], ["music", 14.26], ["throbbing", 8.56]], null, null, [["buzz", 67.79], ["music", 13.47], ["grunt", 4.99]], null, null, [["music", 32.97], ["speech", 25.54], ["mains hum", 16.12]]], "duration": [1.74, 0.97, 2.96, 2.4, 38.33, 0.35, 8.23, 1.37, 2.49, 2.41, 0.94, 0.48, 25.18, 1.08, 0.29, 11.7]} \ No newline at end of file diff --git a/annotations_filtered/-dUYR2apxdA_filtered.json b/annotations_filtered/-dUYR2apxdA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e4f48841ab379ae393c19f31678580b9acc3093 --- /dev/null +++ b/annotations_filtered/-dUYR2apxdA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.38], [6.0, 12.82], [13.0, 14.54], [15.0, 16.01], [18.0, 18.18], [34.0, 41.93], [43.0, 43.93], [45.0, 47.04], [48.0, 50.75], [52.0, 53.87], [55.0, 58.68], [59.0, 65.57], [67.0, 69.47], [70.0, 78.16], [78.0, 78.49], [79.0, 78.81], [81.0, 82.31], [85.0, 86.73], [89.0, 89.26], [89.0, 89.45], [90.0, 91.03]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 43.9, 0.0, 0.0, 0.0, 70.72, 0.0, 86.82, 83.34, 0.0, 77.03, 71.72, 69.74, 66.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 32.46], ["mains hum", 13.28], ["hum", 12.97]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.38, 6.82, 1.54, 1.01, 0.18, 7.93, 0.93, 2.04, 2.75, 1.87, 3.68, 6.57, 2.47, 8.16, 0.49, -0.19, 1.31, 1.73, 0.26, 0.45, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/-dWENMR2aag_filtered.json b/annotations_filtered/-dWENMR2aag_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9dbeb656791e8698fb208f0ed6c433164a15d9d8 --- /dev/null +++ b/annotations_filtered/-dWENMR2aag_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.34], [20.0, 23.53], [24.0, 24.61], [26.0, 26.64], [43.0, 53.23], [57.0, 57.03], [57.0, 57.94], [58.0, 58.38], [59.0, 59.53], [60.0, 61.13], [63.0, 63.42], [65.0, 65.72], [74.0, 76.3], [83.0, 83.51], [84.0, 83.61], [89.0, 91.02], [93.0, 93.41], [94.0, 94.91], [96.0, 96.43], [97.0, 97.6], [100.0, 99.64], [100.0, 100.7], [102.0, 102.64], [103.0, 113.07], [118.0, 118.15], [120.0, 120.14], [120.0, 121.31]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.55, 0.0, 0.0, 29.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.02, 0.0, 0.0, 35.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.5, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 54.8], ["didgeridoo", 29.74], ["musical instrument", 3.0]], null, null, [["music", 43.05], ["cattle, bovinae", 7.63], ["livestock, farm animals, working animals", 7.56]], null, null, null, null, null, null, null, [["speech", 22.27], ["music", 15.28], ["animal", 7.18]], null, null, [["speech", 28.75], ["livestock, farm animals, working animals", 9.55], ["boing", 9.05]], null, null, null, null, null, null, null, [["speech", 38.31], ["music", 32.51], ["didgeridoo", 7.01]], null, null, null], "duration": [1.34, 3.53, 0.61, 0.64, 10.23, 0.03, 0.94, 0.38, 0.53, 1.13, 0.42, 0.72, 2.3, 0.51, -0.39, 2.02, 0.41, 0.91, 0.43, 0.6, -0.36, 0.7, 0.64, 10.07, 0.15, 0.14, 1.31]} \ No newline at end of file diff --git a/annotations_filtered/-dlOM4ocKUM_filtered.json b/annotations_filtered/-dlOM4ocKUM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea07a6875f8c1e0788b85caa21e33659637a9f6b --- /dev/null +++ b/annotations_filtered/-dlOM4ocKUM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 17.96], [19.0, 20.38], [22.0, 43.95], [45.0, 44.95], [46.0, 54.77], [56.0, 58.06], [59.0, 59.71], [61.0, 61.82], [64.0, 65.28], [66.0, 66.53], [68.0, 68.72], [69.0, 72.28], [74.0, 73.63], [76.0, 77.3], [79.0, 84.69], [85.0, 84.77], [85.0, 91.77], [92.0, 103.01], [106.0, 110.47], [111.0, 111.91], [114.0, 116.56], [117.0, 117.32], [120.0, 123.47], [124.0, 131.7], [134.0, 134.91], [135.0, 136.43], [137.0, 138.13], [140.0, 140.26], [144.0, 152.73], [154.0, 159.44], [160.0, 162.72], [165.0, 165.99], [167.0, 167.76], [169.0, 169.4], [171.0, 171.0], [172.0, 176.86], [180.0, 182.78], [183.0, 184.64], [186.0, 185.67]], "keep_status": [false, false, true, false, true, true, false, false, false, false, false, true, false, false, true, false, false, true, false, false, true, false, true, true, false, false, false, false, true, true, true, false, false, false, false, true, true, false, false], "silence_prob": [34.78, 0.0, 30.36, 0.0, 39.4, 33.91, 0.0, 0.0, 0.0, 0.0, 0.0, 36.05, 0.0, 0.0, 29.88, 0.0, 29.45, 29.56, 32.06, 0.0, 34.12, 0.0, 30.17, 31.3, 0.0, 0.0, 0.0, 0.0, 30.87, 35.07, 35.94, 0.0, 0.0, 0.0, 0.0, 29.71, 29.89, 0.0, 0.0], "audiomae_on_audioset": [[["music", 32.51], ["mains hum", 27.84], ["hum", 12.36]], null, [["speech", 21.65], ["livestock, farm animals, working animals", 11.35], ["vehicle", 11.15]], null, [["music", 31.68], ["didgeridoo", 19.83], ["hum", 12.82]], [["music", 29.09], ["mains hum", 25.61], ["hum", 14.73]], null, null, null, null, null, [["hum", 23.8], ["mains hum", 23.76], ["speech", 15.3]], null, null, [["sidetone", 28.94], ["speech", 22.09], ["hum", 8.11]], null, [["music", 40.72], ["throbbing", 24.34], ["hum", 9.76]], [["speech", 46.18], ["music", 12.31], ["didgeridoo", 9.46]], [["sidetone", 53.08], ["speech", 13.66], ["music", 8.47]], null, [["speech", 24.13], ["music", 12.07], ["civil defense siren", 8.38]], null, [["explosion", 16.69], ["fart", 6.84], ["speech", 6.58]], [["speech", 21.64], ["music", 12.3], ["didgeridoo", 8.16]], null, null, null, null, [["music", 57.47], ["didgeridoo", 7.99], ["theremin", 3.71]], [["music", 31.24], ["hum", 17.93], ["throbbing", 16.31]], [["music", 52.7], ["theremin", 6.44], ["musical instrument", 5.65]], null, null, null, null, [["speech", 21.78], ["music", 15.32], ["animal", 10.53]], [["speech", 42.01], ["music", 7.49], ["fly, housefly", 4.68]], null, null], "duration": [3.96, 1.38, 21.95, -0.05, 8.77, 2.06, 0.71, 0.82, 1.28, 0.53, 0.72, 3.28, -0.37, 1.3, 5.69, -0.23, 6.77, 11.01, 4.47, 0.91, 2.56, 0.32, 3.47, 7.7, 0.91, 1.43, 1.13, 0.26, 8.73, 5.44, 2.72, 0.99, 0.76, 0.4, 0.0, 4.86, 2.78, 1.64, -0.33]} \ No newline at end of file diff --git a/annotations_filtered/-dzyuUNTwUo_filtered.json b/annotations_filtered/-dzyuUNTwUo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ef818ee316fa4d33a9ef7f1bdf556e3212650ab --- /dev/null +++ b/annotations_filtered/-dzyuUNTwUo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.99], [12.0, 12.11], [16.0, 17.58], [24.0, 24.24], [27.0, 31.16], [33.0, 43.31], [48.0, 51.48], [62.0, 62.4], [67.0, 67.9], [72.0, 72.55], [79.0, 81.13], [82.0, 84.03], [92.0, 92.7], [95.0, 97.09], [101.0, 102.0], [105.0, 105.31], [110.0, 112.77], [118.0, 118.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 54.23, 78.38, 85.9, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 94.66, 0.0, 0.0, 72.01, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.01, 0.11, 1.58, 0.24, 4.16, 10.31, 3.48, 0.4, 0.9, 0.55, 2.13, 2.03, 0.7, 2.09, 1.0, 0.31, 2.77, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/-e3HqC2rbQc_filtered.json b/annotations_filtered/-e3HqC2rbQc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21a610caca5347766aae1f1ab6f62a1c21ff027e --- /dev/null +++ b/annotations_filtered/-e3HqC2rbQc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.28], [6.0, 6.62], [8.0, 10.83], [13.0, 14.89], [16.0, 22.18], [23.0, 23.57], [25.0, 27.94], [30.0, 32.17], [32.0, 32.85], [38.0, 39.9], [42.0, 43.24], [47.0, 49.71], [51.0, 53.6], [54.0, 55.39], [59.0, 60.81], [61.0, 61.86], [62.0, 63.42], [65.0, 65.58], [68.0, 70.44], [71.0, 72.25], [74.0, 76.25], [77.0, 80.0], [80.0, 81.41], [83.0, 119.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 63.96, 0.0, 49.59, 0.0, 50.46, 72.6, 0.0, 0.0, 0.0, 69.88, 47.08, 0.0, 0.0, 0.0, 0.0, 0.0, 62.99, 0.0, 87.74, 51.82, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["hum", 45.09], ["mains hum", 16.65], ["fly, housefly", 14.39]], null, null, null, null, null, null, null, [["radio", 18.89], ["noise", 10.81], ["hum", 7.81]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.28, 0.62, 2.83, 1.89, 6.18, 0.57, 2.94, 2.17, 0.85, 1.9, 1.24, 2.71, 2.6, 1.39, 1.81, 0.86, 1.42, 0.58, 2.44, 1.25, 2.25, 3.0, 1.41, 36.92]} \ No newline at end of file diff --git a/annotations_filtered/-e6lEsIUf3U_filtered.json b/annotations_filtered/-e6lEsIUf3U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..112d37605f26eee718e9e16fb66758e6b2c1cf5b --- /dev/null +++ b/annotations_filtered/-e6lEsIUf3U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.26], [13.0, 13.29], [14.0, 14.93], [19.0, 19.45], [23.0, 25.3], [27.0, 26.72], [29.0, 29.27], [30.0, 30.48], [38.0, 39.66], [43.0, 46.43], [48.0, 50.23], [51.0, 53.11], [54.0, 55.78], [68.0, 71.86], [75.0, 77.65], [80.0, 80.64], [81.0, 81.84], [87.0, 86.86], [89.0, 90.04], [92.0, 92.45], [94.0, 94.12], [95.0, 95.61], [96.0, 96.7], [97.0, 97.43], [100.0, 100.3], [106.0, 106.79], [109.0, 111.57], [113.0, 114.15], [116.0, 118.12], [120.0, 120.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [86.82, 0.0, 0.0, 0.0, 82.25, 0.0, 0.0, 0.0, 0.0, 73.97, 77.53, 69.2, 0.0, 76.7, 56.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.63, 0.0, 95.23, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.26, 0.29, 0.93, 0.45, 2.3, -0.28, 0.27, 0.48, 1.66, 3.43, 2.23, 2.11, 1.78, 3.86, 2.65, 0.64, 0.84, -0.14, 1.04, 0.45, 0.12, 0.61, 0.7, 0.43, 0.3, 0.79, 2.57, 1.15, 2.12, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/-eIH1jFAGlY_filtered.json b/annotations_filtered/-eIH1jFAGlY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f956273a7639d874a1bf0df4511bcd0477868d2 --- /dev/null +++ b/annotations_filtered/-eIH1jFAGlY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 71.44], [73.0, 94.1], [96.0, 96.82], [98.0, 98.42]], "keep_status": [true, true, false, false], "silence_prob": [35.55, 31.99, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 17.18], ["mains hum", 15.01], ["speech", 13.24]], [["music", 30.78], ["fart", 8.25], ["livestock, farm animals, working animals", 7.79]], null, null], "duration": [26.44, 21.1, 0.82, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/-eXI4uy3Mlg_filtered.json b/annotations_filtered/-eXI4uy3Mlg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cf04fb4efb04497b2d31bb98b0ae5583f5a6bdd --- /dev/null +++ b/annotations_filtered/-eXI4uy3Mlg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.05], [24.0, 23.92], [29.0, 37.77], [40.0, 41.52], [45.0, 47.29], [73.0, 74.6], [77.0, 77.79]], "keep_status": [false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 33.96, 0.0, 36.09, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 68.14], ["vehicle", 12.81], ["radio", 4.14]], null, [["vehicle", 14.11], ["hum", 9.69], ["mains hum", 4.07]], null, null], "duration": [0.05, -0.08, 8.77, 1.52, 2.29, 1.6, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/-edZKfoS2V4_filtered.json b/annotations_filtered/-edZKfoS2V4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75ac5c7519d424cd3da849419b27aaa50de5570b --- /dev/null +++ b/annotations_filtered/-edZKfoS2V4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 22.45], [26.0, 26.27], [27.0, 27.6], [33.0, 32.83], [33.0, 33.74], [36.0, 37.99], [39.0, 43.31], [44.0, 45.08], [49.0, 63.64], [64.0, 69.11], [70.0, 78.88], [80.0, 82.07], [83.0, 84.45], [86.0, 94.31], [94.0, 97.19], [98.0, 98.79], [99.0, 100.55], [103.0, 102.83], [104.0, 104.53], [110.0, 110.86], [113.0, 113.93], [115.0, 121.47], [122.0, 122.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 98.44, 100.0, 100.0, 100.0, 0.0, 88.1, 99.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.85, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 38.9], ["animal", 17.83], ["didgeridoo", 15.27]], null], "duration": [5.45, 0.27, 0.6, -0.17, 0.74, 1.99, 4.31, 1.08, 14.64, 5.11, 8.88, 2.07, 1.45, 8.31, 3.19, 0.79, 1.55, -0.17, 0.53, 0.86, 0.93, 6.47, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/-eocP3-Ifag_filtered.json b/annotations_filtered/-eocP3-Ifag_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13a0988c7c4e49021560888abe71d5369c409485 --- /dev/null +++ b/annotations_filtered/-eocP3-Ifag_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.92], [5.0, 5.39], [6.0, 6.45], [7.0, 8.23], [13.0, 15.25], [16.0, 19.35], [21.0, 22.27], [23.0, 24.14], [25.0, 25.64], [27.0, 28.09], [31.0, 32.7], [33.0, 35.28], [41.0, 43.55], [44.0, 46.75], [47.0, 47.63], [63.0, 64.3], [68.0, 68.99], [71.0, 72.25], [76.0, 76.96], [78.0, 82.81], [85.0, 85.68], [87.0, 88.52], [91.0, 92.53], [93.0, 94.04], [96.0, 95.91], [96.0, 95.94], [96.0, 95.99], [96.0, 96.09], [98.0, 98.83], [99.0, 100.67], [101.0, 124.38], [126.0, 126.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.54, 33.25, 0.0, 0.0, 0.0, 0.0, 0.0, 34.78, 34.27, 35.41, 0.0, 0.0, 0.0, 0.0, 0.0, 35.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.5, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 64.07], ["musical instrument", 11.06], ["percussion", 3.78]], [["music", 41.42], ["hum", 18.78], ["throbbing", 15.32]], null, null, null, null, null, [["throbbing", 22.64], ["music", 22.49], ["hum", 22.27]], [["music", 65.56], ["throbbing", 4.81], ["hum", 4.69]], [["music", 31.39], ["speech", 28.95], ["didgeridoo", 19.4]], null, null, null, null, null, [["music", 66.48], ["didgeridoo", 17.46], ["musical instrument", 3.86]], null, null, null, null, null, null, null, null, null, null, [["music", 75.47], ["harmonic", 3.4], ["musical instrument", 2.67]], null], "duration": [0.92, 0.39, 0.45, 1.23, 2.25, 3.35, 1.27, 1.14, 0.64, 1.09, 1.7, 2.28, 2.55, 2.75, 0.63, 1.3, 0.99, 1.25, 0.96, 4.81, 0.68, 1.52, 1.53, 1.04, -0.09, -0.06, -0.01, 0.09, 0.83, 1.67, 23.38, 0.81]} \ No newline at end of file diff --git a/annotations_filtered/-fL94BTrFhs_filtered.json b/annotations_filtered/-fL94BTrFhs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50f0b216967300878deab66b92b3ee903a4e27e9 --- /dev/null +++ b/annotations_filtered/-fL94BTrFhs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.4], [5.0, 5.8], [11.0, 30.2], [41.0, 47.63], [50.0, 55.98], [56.0, 56.03], [56.0, 56.1], [56.0, 56.13], [56.0, 56.17], [56.0, 56.2], [56.0, 56.27], [57.0, 57.23], [64.0, 66.55], [72.0, 72.69], [75.0, 76.27], [80.0, 80.16], [81.0, 82.22], [85.0, 84.96], [87.0, 87.29], [88.0, 91.96], [94.0, 94.34], [100.0, 102.49], [109.0, 110.22], [110.0, 114.84], [122.0, 126.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 68.41, 71.72, 58.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.76, 0.0, 74.6, 0.0, 56.86, 43.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 25.98], ["music", 25.73], ["piano", 8.4]]], "duration": [0.4, 0.8, 19.2, 6.63, 5.98, 0.03, 0.1, 0.13, 0.17, 0.2, 0.27, 0.23, 2.55, 0.69, 1.27, 0.16, 1.22, -0.04, 0.29, 3.96, 0.34, 2.49, 1.22, 4.84, 4.08]} \ No newline at end of file diff --git a/annotations_filtered/-fMCqLBMPPo_filtered.json b/annotations_filtered/-fMCqLBMPPo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2cff18a8ecf110be3404aca1a5375793c6263a28 --- /dev/null +++ b/annotations_filtered/-fMCqLBMPPo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 19.97], [26.0, 26.92], [28.0, 36.95], [40.0, 42.21], [43.0, 43.75], [44.0, 45.45], [52.0, 54.33], [64.0, 65.11], [74.0, 74.6], [79.0, 80.15], [86.0, 86.91], [89.0, 89.75], [99.0, 99.27], [101.0, 106.98], [112.0, 120.24]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.89, 0.0, 34.51, 35.3, 0.0, 0.0, 74.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.44, 36.09], "audiomae_on_audioset": [[["music", 65.93], ["speech", 12.67], ["beatboxing", 3.9]], null, [["music", 80.65], ["synthesizer", 2.54], ["musical instrument", 2.39]], [["music", 55.56], ["musical instrument", 6.53], ["synthesizer", 4.04]], null, null, null, null, null, null, null, null, null, [["music", 55.06], ["musical instrument", 10.14], ["guitar", 6.05]], [["music", 74.12], ["musical instrument", 10.24], ["didgeridoo", 4.2]]], "duration": [8.97, 0.92, 8.95, 2.21, 0.75, 1.45, 2.33, 1.11, 0.6, 1.15, 0.91, 0.75, 0.27, 5.98, 8.24]} \ No newline at end of file diff --git a/annotations_filtered/-fRY1b6WAx4_filtered.json b/annotations_filtered/-fRY1b6WAx4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1dbb29af5f0764cd7605cf41f4171a341af92fb6 --- /dev/null +++ b/annotations_filtered/-fRY1b6WAx4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.24], [5.0, 6.0], [9.0, 9.17], [17.0, 17.25], [18.0, 18.64], [21.0, 21.63], [22.0, 36.0], [38.0, 39.36], [40.0, 42.82], [45.0, 53.1], [59.0, 66.9], [68.0, 69.8], [70.0, 70.77], [72.0, 73.14], [76.0, 76.79], [78.0, 84.06], [85.0, 86.8], [88.0, 89.85], [91.0, 92.91], [94.0, 97.58], [99.0, 100.57], [101.0, 108.58], [109.0, 113.63], [124.0, 126.32], [128.0, 129.12], [132.0, 134.15], [135.0, 138.52], [139.0, 141.2], [151.0, 153.5], [154.0, 155.83], [161.0, 166.89], [168.0, 170.73], [172.0, 173.67], [174.0, 175.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.23, 0.0, 69.61, 75.88, 94.22, 0.0, 0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 0.0, 88.83, 0.0, 88.46, 54.76, 80.29, 0.0, 61.47, 88.46, 51.77, 73.97, 0.0, 49.78, 67.89, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.74], ["tick-tock", 5.64], ["tick", 4.07]], null, null, null], "duration": [1.24, 1.0, 0.17, 0.25, 0.64, 0.63, 14.0, 1.36, 2.82, 8.1, 7.9, 1.8, 0.77, 1.14, 0.79, 6.06, 1.8, 1.85, 1.91, 3.58, 1.57, 7.58, 4.63, 2.32, 1.12, 2.15, 3.52, 2.2, 2.5, 1.83, 5.89, 2.73, 1.67, 1.42]} \ No newline at end of file diff --git a/annotations_filtered/-ftyIj2_b8Y_filtered.json b/annotations_filtered/-ftyIj2_b8Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d6cbd965c140072bdf1bfe4252e1e546246ce4c --- /dev/null +++ b/annotations_filtered/-ftyIj2_b8Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 30.03], [32.0, 34.16], [35.0, 35.78], [40.0, 40.96], [43.0, 46.6], [49.0, 48.81], [50.0, 50.35], [51.0, 51.68], [52.0, 85.6], [87.0, 111.21], [114.0, 115.8], [117.0, 129.25]], "keep_status": [true, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [31.07, 39.31, 0.0, 0.0, 32.92, 0.0, 0.0, 0.0, 0.0, 31.69, 0.0, 35.28], "audiomae_on_audioset": [[["music", 16.68], ["fart", 14.07], ["sound effect", 10.58]], [["music", 28.1], ["speech", 14.39], ["tabla", 3.64]], null, null, [["music", 37.85], ["throbbing", 21.23], ["hum", 9.94]], null, null, null, null, [["music", 62.41], ["smash, crash", 5.64], ["breaking", 4.82]], null, [["music", 81.67], ["synthesizer", 5.96], ["drum machine", 2.6]]], "duration": [5.03, 2.16, 0.78, 0.96, 3.6, -0.19, 0.35, 0.68, 33.6, 24.21, 1.8, 12.25]} \ No newline at end of file diff --git a/annotations_filtered/-fvfHqNEmGU_filtered.json b/annotations_filtered/-fvfHqNEmGU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..410126157cd2c1e99a2e5b494a37cc75f1e3441b --- /dev/null +++ b/annotations_filtered/-fvfHqNEmGU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 15.89], [19.0, 22.15], [23.0, 27.14], [30.0, 35.6], [40.0, 107.1]], "keep_status": [false, true, true, true, false], "silence_prob": [29.47, 31.46, 31.84, 31.75, 0.0], "audiomae_on_audioset": [[["music", 58.32], ["speech", 15.61], ["animal", 3.81]], [["hum", 39.92], ["throbbing", 14.07], ["mains hum", 11.6]], [["hum", 27.98], ["music", 21.08], ["mains hum", 15.02]], [["hum", 24.13], ["music", 10.41], ["throbbing", 8.46]], null], "duration": [8.89, 3.15, 4.14, 5.6, 67.1]} \ No newline at end of file diff --git a/annotations_filtered/-gZPZLSUZZ0_filtered.json b/annotations_filtered/-gZPZLSUZZ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3afb89f53466f4c9da7f0a1e136295a584cbad3d --- /dev/null +++ b/annotations_filtered/-gZPZLSUZZ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.49], [25.0, 26.38], [27.0, 31.23], [33.0, 33.3], [39.0, 40.54], [46.0, 47.36], [51.0, 51.81], [54.0, 54.08], [54.0, 55.16], [56.0, 57.94], [60.0, 60.71], [63.0, 63.26], [66.0, 66.99], [68.0, 69.58], [71.0, 70.71], [71.0, 71.04], [73.0, 74.02], [75.0, 76.77], [78.0, 79.71], [80.0, 82.04], [84.0, 85.09], [87.0, 88.3], [89.0, 92.18], [94.0, 94.24], [96.0, 96.38], [97.0, 98.19], [100.0, 99.96], [100.0, 101.09], [102.0, 102.17], [104.0, 104.7], [107.0, 107.84], [109.0, 111.74], [113.0, 116.18], [117.0, 118.62], [120.0, 122.81], [124.0, 125.0], [126.0, 125.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 98.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 96.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.61, 97.64, 0.0, 99.93, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.49, 1.38, 4.23, 0.3, 1.54, 1.36, 0.81, 0.08, 1.16, 1.94, 0.71, 0.26, 0.99, 1.58, -0.29, 0.04, 1.02, 1.77, 1.71, 2.04, 1.09, 1.3, 3.18, 0.24, 0.38, 1.19, -0.04, 1.09, 0.17, 0.7, 0.84, 2.74, 3.18, 1.62, 2.81, 1.0, -0.15]} \ No newline at end of file diff --git a/annotations_filtered/-gkBCCbycmQ_filtered.json b/annotations_filtered/-gkBCCbycmQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0e9c7009cff9c7f71c661088d2cd744d421e8eb --- /dev/null +++ b/annotations_filtered/-gkBCCbycmQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.16], [4.0, 5.32], [6.0, 6.74], [8.0, 9.34], [10.0, 14.81], [15.0, 19.41], [23.0, 25.37], [27.0, 30.69], [32.0, 32.83], [33.0, 35.33], [36.0, 36.88], [37.0, 36.95], [38.0, 38.58], [40.0, 46.11], [47.0, 48.83], [49.0, 55.92], [57.0, 61.75], [63.0, 65.42], [66.0, 68.77], [72.0, 73.26], [74.0, 75.98], [76.0, 76.06], [76.0, 82.66], [84.0, 87.4], [90.0, 91.74], [92.0, 93.39], [100.0, 104.16], [105.0, 108.62], [110.0, 115.89], [117.0, 118.88], [121.0, 122.67], [124.0, 127.33], [129.0, 130.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.82, 99.98, 100.0, 100.0, 0.0, 93.45, 0.0, 0.0, 0.0, 99.84, 0.0, 90.95, 97.83, 100.0, 99.95, 0.0, 0.0, 0.0, 99.68, 100.0, 0.0, 0.0, 93.91, 100.0, 100.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 1.32, 0.74, 1.34, 4.81, 4.41, 2.37, 3.69, 0.83, 2.33, 0.88, -0.05, 0.58, 6.11, 1.83, 6.92, 4.75, 2.42, 2.77, 1.26, 1.98, 0.06, 6.66, 3.4, 1.74, 1.39, 4.16, 3.62, 5.89, 1.88, 1.67, 3.33, 1.62]} \ No newline at end of file diff --git a/annotations_filtered/-h62m4d4MmA_filtered.json b/annotations_filtered/-h62m4d4MmA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfc73db4988c974902db416e098101cdbb897491 --- /dev/null +++ b/annotations_filtered/-h62m4d4MmA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 9.96], [17.0, 17.22], [20.0, 35.23], [42.0, 41.99], [52.0, 53.47], [57.0, 57.5], [67.0, 67.53], [72.0, 72.84], [74.0, 78.8], [82.0, 90.64], [94.0, 99.4], [101.0, 101.24], [105.0, 104.73], [118.0, 119.58], [120.0, 120.56], [128.0, 128.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.21, 0.0, 33.67, 0.0, 0.0, 0.0, 0.0, 0.0, 33.6, 32.49, 30.66, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["crowd", 34.57], ["cheering", 21.28], ["speech", 18.97]], null, [["music", 78.57], ["didgeridoo", 3.85], ["musical instrument", 3.78]], null, null, null, null, null, [["didgeridoo", 58.94], ["music", 27.47], ["musical instrument", 4.23]], [["music", 63.17], ["didgeridoo", 13.09], ["musical instrument", 5.25]], [["music", 50.92], ["didgeridoo", 13.33], ["foghorn", 7.75]], null, null, null, null, null], "duration": [8.96, 0.22, 15.23, -0.01, 1.47, 0.5, 0.53, 0.84, 4.8, 8.64, 5.4, 0.24, -0.27, 1.58, 0.56, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/-heLeiCeD58_filtered.json b/annotations_filtered/-heLeiCeD58_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e17a42fe36a1bf6df28d3afe0dcd5a1f95588947 --- /dev/null +++ b/annotations_filtered/-heLeiCeD58_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.64], [4.0, 4.89], [8.0, 9.02], [10.0, 12.75], [13.0, 16.02], [17.0, 19.08], [20.0, 20.34], [22.0, 23.62], [25.0, 27.04], [30.0, 34.99], [38.0, 38.67], [41.0, 44.1], [44.0, 45.42], [48.0, 50.89], [57.0, 57.59], [59.0, 58.97], [62.0, 62.46], [65.0, 65.38], [70.0, 71.34], [73.0, 73.53], [88.0, 88.92], [94.0, 94.59], [98.0, 98.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 98.86, 74.6, 63.1, 0.0, 0.0, 70.44, 68.02, 0.0, 38.43, 0.0, 80.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["hum", 13.43], ["thunk", 8.42], ["mains hum", 7.1]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.64, 0.89, 1.02, 2.75, 3.02, 2.08, 0.34, 1.62, 2.04, 4.99, 0.67, 3.1, 1.42, 2.89, 0.59, -0.03, 0.46, 0.38, 1.34, 0.53, 0.92, 0.59, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/-hl0hUWyqoU_filtered.json b/annotations_filtered/-hl0hUWyqoU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00c99409a65074e79b32ba51fca0752e653d924c --- /dev/null +++ b/annotations_filtered/-hl0hUWyqoU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.4], [12.0, 15.36], [16.0, 16.46], [16.0, 23.52], [28.0, 28.17], [29.0, 44.61], [47.0, 73.09], [74.0, 77.89], [79.0, 79.95], [85.0, 86.12], [92.0, 95.35], [96.0, 99.62], [102.0, 102.66], [104.0, 105.02], [108.0, 109.17], [112.0, 112.19], [115.0, 115.52], [120.0, 121.8], [124.0, 124.46]], "keep_status": [true, true, false, false, false, false, true, true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [31.96, 32.84, 0.0, 33.24, 0.0, 33.3, 30.88, 39.8, 0.0, 0.0, 36.28, 33.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 32.08], ["foghorn", 15.45], ["theremin", 7.03]], [["music", 29.88], ["cello", 19.04], ["double bass", 17.88]], null, [["music", 67.3], ["cello", 3.95], ["theremin", 3.47]], null, [["music", 62.97], ["cello", 11.62], ["bowed string instrument", 5.57]], [["music", 34.57], ["cello", 23.27], ["theremin", 9.84]], [["music", 45.0], ["middle eastern music", 4.73], ["musical instrument", 2.93]], null, null, [["music", 63.03], ["theremin", 12.18], ["foghorn", 3.42]], [["music", 21.78], ["hum", 7.19], ["foghorn", 5.19]], null, null, null, null, null, null, null], "duration": [3.4, 3.36, 0.46, 7.52, 0.17, 15.61, 26.09, 3.89, 0.95, 1.12, 3.35, 3.62, 0.66, 1.02, 1.17, 0.19, 0.52, 1.8, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/-hqNz9Ve-Hs_filtered.json b/annotations_filtered/-hqNz9Ve-Hs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d91154874c1dbba6e51d22b424bec5df24762c2 --- /dev/null +++ b/annotations_filtered/-hqNz9Ve-Hs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.22], [7.0, 7.45], [8.0, 13.07], [21.0, 23.5], [25.0, 27.09], [27.0, 29.56], [31.0, 31.85], [33.0, 34.79], [37.0, 39.95], [43.0, 46.5], [49.0, 55.9]], "keep_status": [false, false, false, false, false, true, false, false, false, true, true], "silence_prob": [0.0, 0.0, 51.39, 43.71, 51.23, 39.18, 0.0, 0.0, 56.48, 46.97, 40.5], "audiomae_on_audioset": [null, null, null, [["music", 63.47], ["singing bowl", 5.65], ["speech", 2.6]], null, [["hum", 19.26], ["music", 17.72], ["mains hum", 14.69]], null, null, null, [["music", 21.23], ["speech", 15.97], ["hiccup", 6.67]], [["hum", 28.96], ["speech", 21.85], ["mains hum", 14.52]]], "duration": [0.22, 0.45, 5.07, 2.5, 2.09, 2.56, 0.85, 1.79, 2.95, 3.5, 6.9]} \ No newline at end of file diff --git a/annotations_filtered/-i6m1i3JLaM_filtered.json b/annotations_filtered/-i6m1i3JLaM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eef22f60c41df8ba45a264aeaeeb836f23bc892c --- /dev/null +++ b/annotations_filtered/-i6m1i3JLaM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.71], [24.0, 24.88], [26.0, 26.32], [31.0, 31.38], [39.0, 43.92], [45.0, 46.58], [47.0, 69.84], [74.0, 74.17], [75.0, 76.03], [77.0, 77.8], [78.0, 78.44], [79.0, 82.68], [84.0, 85.83], [90.0, 89.85], [91.0, 92.62], [93.0, 93.83], [95.0, 95.79], [96.0, 97.07], [98.0, 98.14], [100.0, 100.85], [102.0, 102.98], [104.0, 105.19], [108.0, 109.11], [112.0, 112.28], [113.0, 114.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 87.55, 0.0, 49.18, 0.0, 0.0, 0.0, 0.0, 65.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 56.93], ["hum", 13.07], ["mains hum", 11.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.71, 0.88, 0.32, 0.38, 4.92, 1.58, 22.84, 0.17, 1.03, 0.8, 0.44, 3.68, 1.83, -0.15, 1.62, 0.83, 0.79, 1.07, 0.14, 0.85, 0.98, 1.19, 1.11, 0.28, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/-i9Fv-znJx0_filtered.json b/annotations_filtered/-i9Fv-znJx0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2336998c1a563e47d4036629489660ae4abc2278 --- /dev/null +++ b/annotations_filtered/-i9Fv-znJx0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 18.84], [19.0, 19.45], [20.0, 21.39], [22.0, 29.67], [32.0, 35.43], [37.0, 37.44]], "keep_status": [true, false, false, true, true, false], "silence_prob": [36.32, 0.0, 0.0, 33.5, 32.02, 0.0], "audiomae_on_audioset": [[["speech", 22.68], ["music", 20.14], ["cattle, bovinae", 13.58]], null, null, [["music", 35.89], ["speech", 20.88], ["synthesizer", 3.26]], [["music", 37.85], ["speech", 25.64], ["sidetone", 2.52]], null], "duration": [5.84, 0.45, 1.39, 7.67, 3.43, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/-i9mrpATCms_filtered.json b/annotations_filtered/-i9mrpATCms_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2870ba8d0c0f454a6ab9c6273a15eb3a36c9de27 --- /dev/null +++ b/annotations_filtered/-i9mrpATCms_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.69], [10.0, 10.4], [13.0, 14.61], [18.0, 18.01], [21.0, 21.49], [28.0, 29.22], [30.0, 37.99], [60.0, 59.63], [60.0, 62.14], [64.0, 64.29], [69.0, 69.89], [71.0, 72.71], [73.0, 74.56], [75.0, 77.97], [79.0, 80.45], [81.0, 81.77], [85.0, 88.59], [90.0, 89.95], [90.0, 90.1], [90.0, 94.68], [96.0, 98.04], [98.0, 99.57], [101.0, 102.51], [104.0, 107.5], [108.0, 111.2], [113.0, 114.18], [120.0, 120.41], [127.0, 128.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [43.2, 0.0, 0.0, 0.0, 0.0, 0.0, 83.7, 0.0, 99.31, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0, 0.0, 100.0, 0.0, 0.0, 99.96, 92.8, 0.0, 0.0, 100.0, 92.15, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 38.07], ["sidetone", 31.4], ["noise", 10.23]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.69, 0.4, 1.61, 0.01, 0.49, 1.22, 7.99, -0.37, 2.14, 0.29, 0.89, 1.71, 1.56, 2.97, 1.45, 0.77, 3.59, -0.05, 0.1, 4.68, 2.04, 1.57, 1.51, 3.5, 3.2, 1.18, 0.41, 1.28]} \ No newline at end of file diff --git a/annotations_filtered/-it68CFJkNg_filtered.json b/annotations_filtered/-it68CFJkNg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..515ae31543a4828b6afebdeb896c249a50e8629c --- /dev/null +++ b/annotations_filtered/-it68CFJkNg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.54], [3.0, 3.94], [4.0, 4.53], [5.0, 6.76], [9.0, 14.44], [16.0, 17.71], [18.0, 24.24], [27.0, 36.85], [38.0, 38.89], [41.0, 44.95], [46.0, 46.75], [47.0, 51.9], [54.0, 54.87], [55.0, 55.0], [61.0, 62.34], [63.0, 67.95], [69.0, 69.42], [73.0, 87.32], [94.0, 93.92], [104.0, 104.08], [115.0, 115.16], [119.0, 119.74], [136.0, 136.24], [136.0, 136.75], [137.0, 137.02], [141.0, 143.48], [145.0, 151.16], [154.0, 154.8], [158.0, 159.41], [161.0, 163.46], [165.0, 168.69], [171.0, 172.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 96.66, 0.0, 96.54, 94.81, 0.0, 100.0, 0.0, 78.21, 0.0, 0.0, 0.0, 80.64, 0.0, 58.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.27, 69.47, 0.0, 0.0, 99.52, 39.55, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 38.93], ["bow-wow", 9.57], ["animal", 9.53]], null, null, null, null, [["speech", 41.91], ["music", 27.07], ["hum", 4.46]], null], "duration": [1.54, 0.94, 0.53, 1.76, 5.44, 1.71, 6.24, 9.85, 0.89, 3.95, 0.75, 4.9, 0.87, 0.0, 1.34, 4.95, 0.42, 14.32, -0.08, 0.08, 0.16, 0.74, 0.24, 0.75, 0.02, 2.48, 6.16, 0.8, 1.41, 2.46, 3.69, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/-iuSE7NVc8c_filtered.json b/annotations_filtered/-iuSE7NVc8c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad7d346751436708898d1a1d76377dd16c0ac135 --- /dev/null +++ b/annotations_filtered/-iuSE7NVc8c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 31.18], [36.0, 47.24], [49.0, 50.06], [58.0, 59.83], [63.0, 73.41], [76.0, 77.19], [79.0, 80.67], [82.0, 83.27], [83.0, 83.51], [84.0, 84.7], [94.0, 94.76], [95.0, 95.82], [101.0, 101.8], [106.0, 107.0], [108.0, 116.48], [117.0, 121.63], [124.0, 125.41], [127.0, 132.04], [133.0, 138.16], [143.0, 144.81], [146.0, 146.43], [150.0, 156.02]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [38.05, 37.25, 0.0, 0.0, 31.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.87, 69.74, 0.0, 54.9, 82.25, 0.0, 0.0, 84.43], "audiomae_on_audioset": [[["breaking", 22.83], ["hum", 16.24], ["music", 11.27]], [["rumble", 53.2], ["music", 19.79], ["throbbing", 2.4]], null, null, [["speech", 36.49], ["music", 28.7], ["gong", 6.0]], null, null, null, null, null, null, null, null, null, [["speech", 31.35], ["sonar", 10.83], ["music", 9.43]], null, null, null, null, null, null, null], "duration": [6.18, 11.24, 1.06, 1.83, 10.41, 1.19, 1.67, 1.27, 0.51, 0.7, 0.76, 0.82, 0.8, 1.0, 8.48, 4.63, 1.41, 5.04, 5.16, 1.81, 0.43, 6.02]} \ No newline at end of file diff --git a/annotations_filtered/-jg0_iXfTE4_filtered.json b/annotations_filtered/-jg0_iXfTE4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e28a869681e66bc31e0768d03f395cec4e7ec9e5 --- /dev/null +++ b/annotations_filtered/-jg0_iXfTE4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.03], [13.0, 12.97], [16.0, 16.87], [21.0, 22.91], [27.0, 27.08], [30.0, 29.88], [43.0, 43.65], [48.0, 49.2], [50.0, 52.59], [54.0, 56.3], [57.0, 62.02], [63.0, 65.75], [68.0, 68.61], [90.0, 94.9], [97.0, 99.33], [100.0, 99.54], [100.0, 100.03], [100.0, 100.4], [101.0, 125.9], [132.0, 132.39], [134.0, 145.81], [146.0, 149.72], [150.0, 152.93], [158.0, 159.44]], "keep_status": [false, false, false, false, false, false, false, false, true, true, true, true, false, false, true, false, false, false, true, false, true, true, true, false], "silence_prob": [30.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.72, 30.73, 35.01, 31.11, 0.0, 30.83, 30.31, 0.0, 0.0, 0.0, 30.37, 0.0, 30.58, 49.73, 34.2, 0.0], "audiomae_on_audioset": [[["crowd", 48.97], ["cheering", 29.59], ["speech", 4.71]], null, null, null, null, null, null, null, [["music", 55.7], ["theremin", 3.6], ["civil defense siren", 3.11]], [["speech", 14.86], ["sheep", 6.19], ["crowd", 5.93]], [["hum", 31.19], ["mains hum", 22.9], ["music", 15.38]], [["speech", 37.02], ["music", 12.1], ["sidetone", 4.74]], null, [["music", 35.14], ["didgeridoo", 26.67], ["sidetone", 12.25]], [["speech", 26.18], ["music", 19.43], ["boing", 14.47]], null, null, null, [["music", 64.48], ["throbbing", 2.95], ["livestock, farm animals, working animals", 2.16]], null, [["music", 40.87], ["speech", 10.05], ["cacophony", 5.82]], [["speech", 43.17], ["rumble", 10.32], ["music", 9.11]], [["speech", 31.96], ["music", 17.33], ["hum", 5.73]], null], "duration": [2.03, -0.03, 0.87, 1.91, 0.08, -0.12, 0.65, 1.2, 2.59, 2.3, 5.02, 2.75, 0.61, 4.9, 2.33, -0.46, 0.03, 0.4, 24.9, 0.39, 11.81, 3.72, 2.93, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/-jiQdqoe1cU_filtered.json b/annotations_filtered/-jiQdqoe1cU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1736c91f814dc3b2326f9d622c1cfc37ad6ab69 --- /dev/null +++ b/annotations_filtered/-jiQdqoe1cU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.35], [28.0, 28.07], [30.0, 41.34], [42.0, 42.7], [51.0, 51.93], [53.0, 56.47], [60.0, 60.71], [61.0, 62.68], [65.0, 64.94], [67.0, 66.88], [68.0, 69.01], [71.0, 71.64], [73.0, 73.84], [74.0, 79.34], [81.0, 81.9], [86.0, 86.97], [88.0, 87.81], [89.0, 91.34], [93.0, 94.22], [96.0, 96.99], [99.0, 99.54], [101.0, 101.58], [103.0, 103.27], [106.0, 107.79], [119.0, 119.91], [123.0, 123.96], [125.0, 125.36], [129.0, 131.63]], "keep_status": [false, false, true, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 33.75, 0.0, 0.0, 34.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.37, 0.0, 0.0, 0.0, 69.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.36], "audiomae_on_audioset": [null, null, [["speech", 31.58], ["music", 18.51], ["fart", 12.19]], null, null, [["noise", 11.0], ["radio", 8.3], ["boing", 7.3]], null, null, null, null, null, null, null, [["hum", 31.27], ["throbbing", 15.2], ["mains hum", 13.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 32.65], ["hum", 22.84], ["music", 11.89]]], "duration": [0.35, 0.07, 11.34, 0.7, 0.93, 3.47, 0.71, 1.68, -0.06, -0.12, 1.01, 0.64, 0.84, 5.34, 0.9, 0.97, -0.19, 2.34, 1.22, 0.99, 0.54, 0.58, 0.27, 1.79, 0.91, 0.96, 0.36, 2.63]} \ No newline at end of file diff --git a/annotations_filtered/-jpEsYBH3g4_filtered.json b/annotations_filtered/-jpEsYBH3g4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5c3b7742bc6f9d95096cb76a872d8685716c7df --- /dev/null +++ b/annotations_filtered/-jpEsYBH3g4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.6], [5.0, 5.0], [5.0, 5.44], [6.0, 6.81], [8.0, 8.43], [20.0, 21.46], [22.0, 23.11], [25.0, 26.2], [29.0, 28.78], [30.0, 29.98], [33.0, 41.15], [42.0, 44.96], [45.0, 46.41], [47.0, 47.38], [50.0, 50.25], [53.0, 56.39], [58.0, 62.38], [65.0, 76.06], [78.0, 78.53], [80.0, 81.09], [82.0, 83.52], [85.0, 86.59], [88.0, 89.02], [89.0, 91.66], [94.0, 109.98], [116.0, 116.73], [118.0, 118.44], [124.0, 129.15], [133.0, 134.45], [135.0, 135.67], [136.0, 136.71], [138.0, 137.76], [138.0, 139.21], [153.0, 160.37], [162.0, 162.04], [163.0, 166.06], [167.0, 166.75], [167.0, 168.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.53, 37.11, 0.0, 0.0, 0.0, 37.07, 96.66, 35.05, 0.0, 0.0, 0.0, 0.0, 0.0, 31.86, 29.7, 0.0, 0.0, 53.53, 0.0, 0.0, 0.0, 0.0, 0.0, 41.03, 0.0, 42.3, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 38.91], ["speech", 28.42], ["theremin", 6.51]], [["music", 22.96], ["cattle, bovinae", 13.09], ["livestock, farm animals, working animals", 9.74]], null, null, null, [["music", 41.77], ["theremin", 13.11], ["whale vocalization", 12.07]], null, [["music", 43.08], ["speech", 26.07], ["hum", 4.06]], null, null, null, null, null, [["music", 49.04], ["speech", 25.76], ["didgeridoo", 7.44]], [["livestock, farm animals, working animals", 26.33], ["cattle, bovinae", 11.87], ["music", 11.6]], null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 46.69], ["cattle, bovinae", 21.39], ["moo", 13.68]], null, [["music", 19.52], ["speech", 12.9], ["foghorn", 5.68]], null, null], "duration": [1.6, 0.0, 0.44, 0.81, 0.43, 1.46, 1.11, 1.2, -0.22, -0.02, 8.15, 2.96, 1.41, 0.38, 0.25, 3.39, 4.38, 11.06, 0.53, 1.09, 1.52, 1.59, 1.02, 2.66, 15.98, 0.73, 0.44, 5.15, 1.45, 0.67, 0.71, -0.24, 1.21, 7.37, 0.04, 3.06, -0.25, 1.3]} \ No newline at end of file diff --git a/annotations_filtered/-jtzzs0_bM4_filtered.json b/annotations_filtered/-jtzzs0_bM4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6db02ebfedf227036339547e42e2278dc1a785a3 --- /dev/null +++ b/annotations_filtered/-jtzzs0_bM4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 27.18], [32.0, 47.48], [49.0, 51.36], [53.0, 53.76], [56.0, 60.62], [64.0, 64.81], [68.0, 70.82], [72.0, 78.04], [78.0, 78.07], [78.0, 78.11], [80.0, 114.94], [117.0, 165.3]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.52, 46.36, 0.0, 37.16, 0.0, 64.41, 29.94, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 37.19], ["music", 29.79], ["hum", 13.01]], [["hum", 37.55], ["mains hum", 24.84], ["music", 18.87]], null, [["music", 33.38], ["electronic music", 11.88], ["rumble", 11.65]], null, null, [["music", 56.24], ["hum", 14.57], ["throbbing", 14.2]], null, null, null, null], "duration": [1.18, 15.48, 2.36, 0.76, 4.62, 0.81, 2.82, 6.04, 0.07, 0.11, 34.94, 48.3]} \ No newline at end of file diff --git a/annotations_filtered/-kFJKQvCrkY_filtered.json b/annotations_filtered/-kFJKQvCrkY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5f9b954ec7333f97f2da098b32435c7e0e546f5 --- /dev/null +++ b/annotations_filtered/-kFJKQvCrkY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.97], [7.0, 7.37], [8.0, 9.9], [10.0, 21.59], [23.0, 24.06], [24.0, 27.67], [30.0, 37.47], [40.0, 40.29], [42.0, 42.74], [43.0, 43.75], [46.0, 46.18], [47.0, 47.28], [50.0, 52.79], [54.0, 57.45], [60.0, 60.91], [62.0, 62.82], [64.0, 64.81], [68.0, 68.93], [69.0, 79.84], [83.0, 83.37], [85.0, 85.82], [86.0, 96.08], [100.0, 100.43], [102.0, 103.15], [105.0, 106.35], [107.0, 108.06], [109.0, 109.32], [112.0, 114.07], [114.0, 115.86], [117.0, 118.35], [121.0, 121.54], [122.0, 123.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 88.1, 0.0, 94.81, 85.9, 0.0, 0.0, 0.0, 0.0, 0.0, 89.9, 94.66, 0.0, 0.0, 0.0, 0.0, 92.97, 0.0, 0.0, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 63.21, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.97, 0.37, 1.9, 11.59, 1.06, 3.67, 7.47, 0.29, 0.74, 0.75, 0.18, 0.28, 2.79, 3.45, 0.91, 0.82, 0.81, 0.93, 10.84, 0.37, 0.82, 10.08, 0.43, 1.15, 1.35, 1.06, 0.32, 2.07, 1.86, 1.35, 0.54, 1.77]} \ No newline at end of file diff --git a/annotations_filtered/-kHMOXNsE2k_filtered.json b/annotations_filtered/-kHMOXNsE2k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..464f698755645b2d342a8f5685b83ea1ea5f2f6d --- /dev/null +++ b/annotations_filtered/-kHMOXNsE2k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.08], [5.0, 5.48], [8.0, 8.78], [10.0, 10.91], [12.0, 12.18], [14.0, 16.85], [18.0, 18.05], [20.0, 20.71], [21.0, 21.54], [26.0, 28.05], [32.0, 31.87], [34.0, 35.21], [36.0, 43.39], [44.0, 46.53], [59.0, 59.0], [62.0, 62.31], [64.0, 64.59], [65.0, 66.66], [89.0, 89.75], [93.0, 95.17], [96.0, 96.16], [97.0, 98.51], [101.0, 100.99], [105.0, 105.8], [109.0, 111.23], [113.0, 113.14], [115.0, 115.7]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 84.98, 0.0, 0.0, 0.0, 38.22, 0.0, 0.0, 37.01, 40.64, 0.0, 0.0, 0.0, 0.0, 0.0, 79.94, 0.0, 0.0, 0.0, 0.0, 37.06, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 48.9], ["hiccup", 13.19], ["hum", 4.75]], null, null, [["clang", 18.0], ["music", 15.54], ["ding", 5.69]], [["speech", 49.62], ["crackle", 9.74], ["sidetone", 7.17]], null, null, null, null, null, null, null, null, null, null, [["music", 55.96], ["animal", 6.53], ["sneeze", 3.47]], null, null], "duration": [0.08, 0.48, 0.78, 0.91, 0.18, 2.85, 0.05, 0.71, 0.54, 2.05, -0.13, 1.21, 7.39, 2.53, 0.0, 0.31, 0.59, 1.66, 0.75, 2.17, 0.16, 1.51, -0.01, 0.8, 2.23, 0.14, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/-kKqgjrbb6I_filtered.json b/annotations_filtered/-kKqgjrbb6I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cbab9e57f5154bb5842eb3f9d95a8a841e1d9739 --- /dev/null +++ b/annotations_filtered/-kKqgjrbb6I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.05], [9.0, 12.6], [15.0, 16.77], [20.0, 42.48], [43.0, 44.98], [45.0, 48.34], [51.0, 53.27], [54.0, 59.48], [63.0, 63.48]], "keep_status": [true, true, false, false, false, true, false, false, false], "silence_prob": [30.57, 29.35, 0.0, 30.3, 0.0, 30.02, 44.26, 30.46, 0.0], "audiomae_on_audioset": [[["speech", 43.86], ["music", 6.87], ["sound effect", 3.91]], [["music", 19.88], ["speech", 13.71], ["boing", 10.51]], null, [["music", 59.99], ["speech", 21.97], ["throbbing", 2.18]], null, [["speech", 30.53], ["music", 21.81], ["hum", 16.51]], [["speech", 31.55], ["theremin", 22.62], ["music", 17.7]], [["speech", 51.79], ["music", 28.98], ["musical instrument", 1.15]], null], "duration": [2.05, 3.6, 1.77, 22.48, 1.98, 3.34, 2.27, 5.48, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/-kYzHmPDZwo_filtered.json b/annotations_filtered/-kYzHmPDZwo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d9c614da1a01ac91ff2b63dbcd189f5546d7847 --- /dev/null +++ b/annotations_filtered/-kYzHmPDZwo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.25], [5.0, 26.35], [28.0, 30.86], [31.0, 31.29], [41.0, 69.25], [86.0, 87.05], [95.0, 98.02], [99.0, 104.57], [111.0, 113.16], [117.0, 121.85], [135.0, 136.11], [147.0, 147.38], [159.0, 159.27], [160.0, 160.81], [166.0, 165.94]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.26, 92.8, 0.0, 44.2, 0.0, 77.36, 48.48, 86.45, 97.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 58.85], ["speech", 18.51], ["synthesizer", 4.84]], null, null, [["music", 33.46], ["speech", 14.93], ["fly, housefly", 7.96]], null, null, [["music", 49.01], ["bleat", 11.72], ["speech", 11.47]], null, null, null, null, null, null, null], "duration": [1.25, 21.35, 2.86, 0.29, 28.25, 1.05, 3.02, 5.57, 2.16, 4.85, 1.11, 0.38, 0.27, 0.81, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/-kkP1Pvzvgs_filtered.json b/annotations_filtered/-kkP1Pvzvgs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f9815b85ae9002bbdfb18ca762f44d31a509638 --- /dev/null +++ b/annotations_filtered/-kkP1Pvzvgs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 29.98], [30.0, 88.32], [94.0, 98.36], [100.0, 107.08]], "keep_status": [false, false, false, true], "silence_prob": [99.82, 0.0, 35.75, 34.52], "audiomae_on_audioset": [null, null, [["whale vocalization", 59.8], ["noise", 27.17], ["music", 2.82]], [["whale vocalization", 24.71], ["sidetone", 15.24], ["noise", 8.28]]], "duration": [4.98, 58.32, 4.36, 7.08]} \ No newline at end of file diff --git a/annotations_filtered/-lAXOMpPqYM_filtered.json b/annotations_filtered/-lAXOMpPqYM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa42fc5ed18800671665ac98485cbfb9b05b5c11 --- /dev/null +++ b/annotations_filtered/-lAXOMpPqYM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 67.78], [68.0, 67.81], [70.0, 70.51], [73.0, 73.09], [81.0, 80.74], [82.0, 82.93], [84.0, 85.14], [86.0, 86.7], [87.0, 90.68], [92.0, 93.04], [94.0, 94.36], [109.0, 109.29], [111.0, 119.43]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.96, 0.0, 0.0, 0.0, 33.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 32.76], ["insect", 19.62], ["fly, housefly", 5.43]], null, null, null, [["buzz", 27.71], ["insect", 21.36], ["hum", 18.82]]], "duration": [67.78, -0.19, 0.51, 0.09, -0.26, 0.93, 1.14, 0.7, 3.68, 1.04, 0.36, 0.29, 8.43]} \ No newline at end of file diff --git a/annotations_filtered/-lX6P0PFKy4_filtered.json b/annotations_filtered/-lX6P0PFKy4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed85b07d9f82bf1a87846a5507c3e464e1089a5d --- /dev/null +++ b/annotations_filtered/-lX6P0PFKy4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.28], [9.0, 10.37], [14.0, 18.57], [20.0, 21.24], [22.0, 96.45]], "keep_status": [false, false, true, false, false], "silence_prob": [0.0, 0.0, 34.57, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 18.38], ["breaking", 17.29], ["glass", 7.75]], null, null], "duration": [1.28, 1.37, 4.57, 1.24, 74.45]} \ No newline at end of file diff --git a/annotations_filtered/-mHhr-aaLnI_filtered.json b/annotations_filtered/-mHhr-aaLnI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d01bf541aa0446d742fbc9454e6870aa65b5879 --- /dev/null +++ b/annotations_filtered/-mHhr-aaLnI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.97], [29.0, 34.32], [43.0, 43.55], [48.0, 47.71], [50.0, 51.78], [56.0, 56.64], [57.0, 58.16], [60.0, 60.89], [62.0, 62.87], [66.0, 66.72], [71.0, 71.19], [72.0, 74.83], [77.0, 77.62], [79.0, 79.37], [82.0, 81.9], [83.0, 83.35], [84.0, 84.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [58.13, 60.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.64, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.97, 5.32, 0.55, -0.29, 1.78, 0.64, 1.16, 0.89, 0.87, 0.72, 0.19, 2.83, 0.62, 0.37, -0.1, 0.35, 0.86]} \ No newline at end of file diff --git a/annotations_filtered/-mXoZz1dqMQ_filtered.json b/annotations_filtered/-mXoZz1dqMQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e3bc18341096c73c4be59c606642c84d531702a --- /dev/null +++ b/annotations_filtered/-mXoZz1dqMQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 26.77], [29.0, 29.89], [32.0, 33.03], [51.0, 52.73], [66.0, 66.07], [68.0, 68.32], [69.0, 69.2], [74.0, 78.04], [83.0, 84.69], [87.0, 89.36], [90.0, 90.42], [94.0, 95.25], [98.0, 98.49], [104.0, 106.05], [110.0, 111.96], [112.0, 113.43], [114.0, 116.34], [119.0, 128.31]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [35.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.25, 0.0, 69.07, 0.0, 0.0, 0.0, 91.81, 0.0, 0.0, 70.72, 47.05], "audiomae_on_audioset": [[["music", 20.11], ["speech", 15.1], ["crowd", 11.59]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.81], ["hum", 16.45], ["mains hum", 5.0]]], "duration": [7.77, 0.89, 1.03, 1.73, 0.07, 0.32, 0.2, 4.04, 1.69, 2.36, 0.42, 1.25, 0.49, 2.05, 1.96, 1.43, 2.34, 9.31]} \ No newline at end of file diff --git a/annotations_filtered/-meMCDrOmpo_filtered.json b/annotations_filtered/-meMCDrOmpo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2d082eee0989b56683e4bca09354c4c7dcef2f7 --- /dev/null +++ b/annotations_filtered/-meMCDrOmpo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.29], [6.0, 7.2], [8.0, 9.36], [23.0, 23.08], [25.0, 26.06], [28.0, 27.89], [34.0, 36.19], [39.0, 41.32], [42.0, 42.9], [48.0, 51.14], [52.0, 52.44], [58.0, 58.21], [59.0, 58.85], [60.0, 59.93], [62.0, 61.8], [70.0, 70.16], [72.0, 72.27], [78.0, 79.24], [85.0, 88.82], [91.0, 99.05], [100.0, 100.68], [101.0, 102.12], [105.0, 110.34], [112.0, 116.46], [116.0, 116.5], [117.0, 117.39], [118.0, 118.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.45, 98.86, 0.0, 90.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.52, 39.14, 0.0, 0.0, 40.59, 45.33, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 57.44], ["hum", 5.26], ["music", 4.62]], [["speech", 44.2], ["music", 22.02], ["fart", 4.26]], null, null, [["speech", 34.73], ["music", 27.15], ["sidetone", 2.57]], [["speech", 47.51], ["music", 26.15], ["sidetone", 3.34]], null, null, null], "duration": [1.29, 1.2, 1.36, 0.08, 1.06, -0.11, 2.19, 2.32, 0.9, 3.14, 0.44, 0.21, -0.15, -0.07, -0.2, 0.16, 0.27, 1.24, 3.82, 8.05, 0.68, 1.12, 5.34, 4.46, 0.5, 0.39, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/-mexzYsMSro_filtered.json b/annotations_filtered/-mexzYsMSro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31fb1b9538cede61279b3d925483f0f002152a3e --- /dev/null +++ b/annotations_filtered/-mexzYsMSro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 19.65], [21.0, 23.38], [26.0, 26.1], [27.0, 28.53], [30.0, 41.2], [42.0, 43.82], [45.0, 46.23], [48.0, 48.36], [49.0, 52.39], [53.0, 64.67], [68.0, 70.65], [71.0, 73.26], [75.0, 78.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.52, 96.42, 0.0, 0.0, 85.17, 0.0, 0.0, 0.0, 98.19, 69.47, 78.89, 65.32, 89.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.65, 2.38, 0.1, 1.53, 11.2, 1.82, 1.23, 0.36, 3.39, 11.67, 2.65, 2.26, 3.68]} \ No newline at end of file diff --git a/annotations_filtered/-mjnbKL7fHQ_filtered.json b/annotations_filtered/-mjnbKL7fHQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed4670cd02404795567f837d6f426c6310aa5319 --- /dev/null +++ b/annotations_filtered/-mjnbKL7fHQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.88], [22.0, 30.25], [32.0, 34.5], [37.0, 38.35], [43.0, 44.47], [46.0, 55.73], [56.0, 56.94], [64.0, 84.62], [87.0, 91.15], [92.0, 92.85], [94.0, 95.27], [96.0, 97.31], [99.0, 102.25], [104.0, 114.07], [115.0, 116.19]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 55.96, 95.23, 0.0, 0.0, 45.65, 0.0, 41.81, 96.04, 0.0, 0.0, 0.0, 100.0, 73.21, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["boing", 34.41], ["music", 29.77], ["speech", 4.75]], null, [["music", 58.87], ["synthesizer", 11.16], ["throbbing", 3.8]], null, null, null, null, null, null, null], "duration": [0.88, 8.25, 2.5, 1.35, 1.47, 9.73, 0.94, 20.62, 4.15, 0.85, 1.27, 1.31, 3.25, 10.07, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/-mlfefNP8cw_filtered.json b/annotations_filtered/-mlfefNP8cw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33d6de553379664fa529d5788ee2fb5a566a9974 --- /dev/null +++ b/annotations_filtered/-mlfefNP8cw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.72], [5.0, 5.21], [25.0, 25.12], [33.0, 46.65], [47.0, 48.24], [50.0, 51.78], [57.0, 57.65], [59.0, 62.45], [67.0, 74.09], [83.0, 85.09], [87.0, 88.47], [91.0, 91.17], [92.0, 91.94], [92.0, 93.24], [127.0, 127.5], [128.0, 127.58], [133.0, 133.22], [136.0, 135.73], [136.0, 142.45], [149.0, 149.69], [151.0, 151.97]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.89, 0.0, 0.0, 0.0, 35.6, 36.86, 95.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.29, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 78.47], ["theremin", 2.65], ["musical instrument", 2.64]], null, null, null, [["music", 62.41], ["guitar", 5.82], ["bass guitar", 5.45]], [["music", 61.53], ["guitar", 4.97], ["effects unit", 3.02]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.28, 0.21, 0.12, 13.65, 1.24, 1.78, 0.65, 3.45, 7.09, 2.09, 1.47, 0.17, -0.06, 1.24, 0.5, -0.42, 0.22, -0.27, 6.45, 0.69, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/-n3qpOM31Pc_filtered.json b/annotations_filtered/-n3qpOM31Pc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..addda2069b9a47a83f7e0b25920e6df481cb2442 --- /dev/null +++ b/annotations_filtered/-n3qpOM31Pc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.51], [4.0, 4.9], [6.0, 6.07], [6.0, 8.51], [10.0, 10.71], [13.0, 16.48], [22.0, 22.37], [27.0, 27.57], [32.0, 33.29], [36.0, 36.71], [41.0, 42.21], [48.0, 48.41], [50.0, 50.97], [54.0, 53.84], [55.0, 56.12], [67.0, 67.41], [84.0, 84.25], [91.0, 91.64], [93.0, 92.7], [97.0, 97.55], [99.0, 100.23]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [43.18, 0.0, 0.0, 43.25, 0.0, 43.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["whale vocalization", 39.5], ["water", 16.98], ["liquid", 10.26]], null, null, [["mains hum", 58.06], ["hum", 38.61], ["throbbing", 0.65]], null, [["music", 21.55], ["thunk", 11.16], ["dial tone", 10.05]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.51, 0.9, 0.07, 2.51, 0.71, 3.48, 0.37, 0.57, 1.29, 0.71, 1.21, 0.41, 0.97, -0.16, 1.12, 0.41, 0.25, 0.64, -0.3, 0.55, 1.23]} \ No newline at end of file diff --git a/annotations_filtered/-nIwFGmgYMs_filtered.json b/annotations_filtered/-nIwFGmgYMs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4bd67be412673383c6c34528397d6e70e0e7687a --- /dev/null +++ b/annotations_filtered/-nIwFGmgYMs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 13.15], [15.0, 22.38], [25.0, 27.18], [31.0, 55.95], [59.0, 58.97], [59.0, 59.0], [59.0, 59.04], [59.0, 59.07], [59.0, 59.1], [59.0, 59.14], [59.0, 59.17], [59.0, 59.21], [59.0, 59.24], [59.0, 59.48], [59.0, 59.51], [61.0, 70.95], [71.0, 74.49]], "keep_status": [true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [41.64, 29.77, 99.99, 29.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.85, 92.31], "audiomae_on_audioset": [[["music", 36.5], ["telephone dialing, dtmf", 12.19], ["synthesizer", 11.64]], [["throbbing", 20.92], ["hum", 19.86], ["speech", 19.18]], null, [["speech", 47.71], ["hum", 9.68], ["music", 8.25]], null, null, null, null, null, null, null, null, null, null, null, [["music", 26.34], ["cacophony", 21.56], ["hum", 11.37]], null], "duration": [11.15, 7.38, 2.18, 24.95, -0.03, 0.0, 0.04, 0.07, 0.1, 0.14, 0.17, 0.21, 0.24, 0.48, 0.51, 9.95, 3.49]} \ No newline at end of file diff --git a/annotations_filtered/-nX_jQxWFN4_filtered.json b/annotations_filtered/-nX_jQxWFN4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31b6392dfce51361daa4567fcad04a45caf0bc77 --- /dev/null +++ b/annotations_filtered/-nX_jQxWFN4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.1], [9.0, 10.23], [12.0, 13.61], [18.0, 21.9], [23.0, 22.94], [23.0, 25.41], [29.0, 29.46], [36.0, 36.71], [38.0, 39.26], [60.0, 60.39], [62.0, 63.0], [72.0, 73.82], [75.0, 75.74], [76.0, 76.54], [78.0, 78.78], [82.0, 82.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [80.64, 0.0, 0.0, 74.92, 0.0, 83.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.1, 1.23, 1.61, 3.9, -0.06, 2.41, 0.46, 0.71, 1.26, 0.39, 1.0, 1.82, 0.74, 0.54, 0.78, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/-nboVp_nTkg_filtered.json b/annotations_filtered/-nboVp_nTkg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c6d762e7b63ee8a52ba39ce0766dfa1db1cd794 --- /dev/null +++ b/annotations_filtered/-nboVp_nTkg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.97], [10.0, 65.2], [66.0, 66.7], [69.0, 70.75], [71.0, 71.71], [73.0, 75.27], [77.0, 77.38]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [-0.03, 55.2, 0.7, 1.75, 0.71, 2.27, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/-ncFDuKdgNE_filtered.json b/annotations_filtered/-ncFDuKdgNE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edaac412309898ac43d3b755ab0571b02faebee8 --- /dev/null +++ b/annotations_filtered/-ncFDuKdgNE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.04], [14.0, 14.35], [18.0, 21.51], [22.0, 23.55], [24.0, 23.99], [24.0, 24.95], [27.0, 27.82], [28.0, 31.78], [36.0, 37.44], [41.0, 43.58], [49.0, 50.68], [61.0, 85.33], [94.0, 94.8], [100.0, 105.31], [106.0, 107.23], [116.0, 118.79]], "keep_status": [false, false, true, false, false, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 39.66, 0.0, 0.0, 0.0, 0.0, 36.86, 0.0, 34.25, 0.0, 31.16, 0.0, 34.12, 0.0, 34.79], "audiomae_on_audioset": [null, null, [["speech", 50.52], ["splash, splatter", 13.51], ["boing", 2.71]], null, null, null, null, [["animal", 14.27], ["music", 11.04], ["boing", 5.22]], null, [["synthesizer", 20.73], ["music", 12.57], ["noise", 8.0]], null, [["music", 62.89], ["speech", 7.3], ["musical instrument", 2.8]], null, [["music", 76.34], ["quack", 2.45], ["funny music", 1.88]], null, [["music", 44.89], ["speech", 21.35], ["quack", 5.0]]], "duration": [0.04, 0.35, 3.51, 1.55, -0.01, 0.95, 0.82, 3.78, 1.44, 2.58, 1.68, 24.33, 0.8, 5.31, 1.23, 2.79]} \ No newline at end of file diff --git a/annotations_filtered/-nh3g6F63qM_filtered.json b/annotations_filtered/-nh3g6F63qM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9462a429990e3cefadf8eb2be8b3bb8a92af960c --- /dev/null +++ b/annotations_filtered/-nh3g6F63qM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.69], [5.0, 6.52], [10.0, 10.57], [11.0, 11.96], [15.0, 15.74], [17.0, 18.37], [20.0, 20.61], [22.0, 21.81], [26.0, 27.99], [29.0, 33.29], [34.0, 34.96], [38.0, 39.61], [50.0, 50.53], [53.0, 53.52], [56.0, 56.2], [58.0, 59.07], [60.0, 61.13], [65.0, 67.44], [69.0, 69.79], [71.0, 71.86], [75.0, 75.66], [77.0, 77.38], [78.0, 79.74], [80.0, 81.26], [83.0, 83.83], [86.0, 89.13], [90.0, 96.6], [98.0, 98.04], [98.0, 101.21], [103.0, 103.28], [106.0, 106.56], [108.0, 112.29], [113.0, 115.43], [120.0, 120.29], [121.0, 121.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.78, 87.19, 0.0, 45.14, 0.0, 0.0, 73.51, 50.36, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 29.45], ["whale vocalization", 23.72], ["sidetone", 5.19]], null, null, [["speech", 24.39], ["hum", 7.7], ["burping, eructation", 6.1]], null, null, null, null, null, null], "duration": [0.69, 1.52, 0.57, 0.96, 0.74, 1.37, 0.61, -0.19, 1.99, 4.29, 0.96, 1.61, 0.53, 0.52, 0.2, 1.07, 1.13, 2.44, 0.79, 0.86, 0.66, 0.38, 1.74, 1.26, 0.83, 3.13, 6.6, 0.04, 3.21, 0.28, 0.56, 4.29, 2.43, 0.29, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/-nk6Gs6Z_Bo_filtered.json b/annotations_filtered/-nk6Gs6Z_Bo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5826d21fed8a20770ab94e41aa7bd68e838aeb22 --- /dev/null +++ b/annotations_filtered/-nk6Gs6Z_Bo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.17], [11.0, 12.43], [13.0, 18.67], [45.0, 46.58], [49.0, 52.25], [63.0, 63.05], [63.0, 65.43], [74.0, 76.33], [83.0, 92.28], [93.0, 99.96], [101.0, 101.33], [102.0, 102.09], [103.0, 116.31], [117.0, 143.83], [144.0, 151.07]], "keep_status": [false, false, true, false, true, false, true, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 38.93, 0.0, 33.8, 0.0, 41.76, 56.33, 33.05, 37.19, 0.0, 0.0, 34.52, 34.32, 31.65], "audiomae_on_audioset": [null, null, [["thunk", 26.47], ["music", 19.13], ["speech", 12.03]], null, [["speech", 31.16], ["music", 19.87], ["fart", 6.86]], null, [["music", 35.67], ["speech", 24.05], ["didgeridoo", 2.79]], null, [["cattle, bovinae", 39.67], ["livestock, farm animals, working animals", 33.92], ["moo", 24.9]], [["music", 76.46], ["musical instrument", 3.1], ["synthesizer", 2.77]], null, null, [["fly, housefly", 61.23], ["insect", 10.26], ["music", 7.2]], [["music", 23.03], ["fly, housefly", 19.71], ["mosquito", 16.03]], [["music", 47.81], ["didgeridoo", 7.96], ["grunt", 5.63]]], "duration": [1.17, 1.43, 5.67, 1.58, 3.25, 0.05, 2.43, 2.33, 9.28, 6.96, 0.33, 0.09, 13.31, 26.83, 7.07]} \ No newline at end of file diff --git a/annotations_filtered/-nkqrSaJf1g_filtered.json b/annotations_filtered/-nkqrSaJf1g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f01e875f9bae8f6fe223e121945a867b6a27cf90 --- /dev/null +++ b/annotations_filtered/-nkqrSaJf1g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 26.77], [29.0, 33.76], [39.0, 48.41], [49.0, 61.62], [63.0, 64.49], [66.0, 66.61], [68.0, 70.93], [72.0, 74.33], [75.0, 75.51], [81.0, 99.39], [101.0, 102.57], [104.0, 105.81]], "keep_status": [false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [84.98, 97.43, 99.05, 43.4, 0.0, 0.0, 98.19, 35.76, 0.0, 37.49, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 20.16], ["radio", 9.69], ["noise", 7.91]], null, null, null, [["speech", 55.37], ["narration, monologue", 16.68], ["hum", 7.4]], null, [["echo", 24.43], ["hum", 22.21], ["throbbing", 8.55]], null, null], "duration": [5.77, 4.76, 9.41, 12.62, 1.49, 0.61, 2.93, 2.33, 0.51, 18.39, 1.57, 1.81]} \ No newline at end of file diff --git a/annotations_filtered/-npMZStX7dU_filtered.json b/annotations_filtered/-npMZStX7dU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f8dcf0ae8e3bee5958f60149bcfa55dd52a8d1c --- /dev/null +++ b/annotations_filtered/-npMZStX7dU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.83], [27.0, 43.34], [57.0, 57.45], [66.0, 68.39], [74.0, 88.5], [90.0, 97.92]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 34.78, 0.0, 32.93, 28.72, 28.99], "audiomae_on_audioset": [null, [["hum", 50.27], ["music", 17.5], ["mains hum", 12.81]], null, [["speech", 64.61], ["radio", 2.9], ["male speech, man speaking", 1.92]], [["music", 48.63], ["smash, crash", 22.59], ["whack, thwack", 5.34]], [["cattle, bovinae", 37.37], ["livestock, farm animals, working animals", 24.86], ["moo", 18.65]]], "duration": [1.83, 16.34, 0.45, 2.39, 14.5, 7.92]} \ No newline at end of file diff --git a/annotations_filtered/-nswXtzrfQU_filtered.json b/annotations_filtered/-nswXtzrfQU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b4752bfc59fdb0f820b050912230bdc13733dac --- /dev/null +++ b/annotations_filtered/-nswXtzrfQU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.06], [5.0, 8.83], [20.0, 23.08], [23.0, 24.17], [43.0, 46.23], [49.0, 49.84], [54.0, 54.87], [57.0, 57.33], [65.0, 65.82], [72.0, 72.55], [81.0, 80.86], [81.0, 83.44], [88.0, 87.99], [89.0, 91.05], [99.0, 99.98], [101.0, 101.29], [102.0, 102.64], [107.0, 107.54]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.26, 42.48, 0.0, 67.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.46, 0.0, 62.07, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 34.71], ["speech", 14.82], ["arrow", 7.84]], [["speech", 44.59], ["hum", 13.76], ["music", 9.93]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.06, 3.83, 3.08, 1.17, 3.23, 0.84, 0.87, 0.33, 0.82, 0.55, -0.14, 2.44, -0.01, 2.05, 0.98, 0.29, 0.64, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/-o-C21COWIQ_filtered.json b/annotations_filtered/-o-C21COWIQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0cc6b0ca1be3fe9f9e3e5bb3f962fc744867ec45 --- /dev/null +++ b/annotations_filtered/-o-C21COWIQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.51], [10.0, 9.81], [11.0, 11.2], [16.0, 16.16], [18.0, 18.25], [20.0, 20.6], [24.0, 24.7], [27.0, 27.48], [28.0, 30.08], [37.0, 36.98], [47.0, 48.12], [49.0, 50.28], [54.0, 56.81], [58.0, 58.82], [74.0, 74.41], [75.0, 76.79], [84.0, 85.65], [87.0, 87.13], [89.0, 90.9], [94.0, 94.26], [114.0, 117.76], [118.0, 118.62], [126.0, 126.89], [130.0, 129.83], [133.0, 135.51], [141.0, 144.49], [150.0, 151.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.39, 0.0, 0.0, 0.0, 67.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.77, 0.0, 0.0, 0.0, 70.02, 74.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.51, -0.19, 0.2, 0.16, 0.25, 0.6, 0.7, 0.48, 2.08, -0.02, 1.12, 1.28, 2.81, 0.82, 0.41, 1.79, 1.65, 0.13, 1.9, 0.26, 3.76, 0.62, 0.89, -0.17, 2.51, 3.49, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/-o1N2unFkSs_filtered.json b/annotations_filtered/-o1N2unFkSs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a887b1a458b8f8e210290fe24b5edc4258c7a21a --- /dev/null +++ b/annotations_filtered/-o1N2unFkSs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.64], [7.0, 7.6], [11.0, 12.07], [16.0, 17.96], [19.0, 19.16], [25.0, 26.81], [35.0, 35.99], [37.0, 37.79], [43.0, 43.87]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.64, 0.6, 1.07, 1.96, 0.16, 1.81, 0.99, 0.79, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/-o8b7tsVH64_filtered.json b/annotations_filtered/-o8b7tsVH64_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b9de6a1b5ba3d02336c5e6ddb5c32cf189e1d47 --- /dev/null +++ b/annotations_filtered/-o8b7tsVH64_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[91.0, 109.73], [111.0, 122.62]], "keep_status": [true, true], "silence_prob": [41.98, 41.93], "audiomae_on_audioset": [[["music", 39.7], ["gong", 10.03], ["hum", 7.92]], [["music", 50.39], ["hum", 10.21], ["synthesizer", 8.97]]], "duration": [18.73, 11.62]} \ No newline at end of file diff --git a/annotations_filtered/-oL4NpO7eAw_filtered.json b/annotations_filtered/-oL4NpO7eAw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c24954907df1b3393089e10910e4e9ead66ffc0c --- /dev/null +++ b/annotations_filtered/-oL4NpO7eAw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 23.84], [28.0, 29.74], [33.0, 32.73], [35.0, 35.75], [41.0, 43.83], [46.0, 46.18], [52.0, 52.88], [55.0, 57.72], [63.0, 63.15], [65.0, 72.67], [77.0, 78.7], [80.0, 80.82], [83.0, 83.32], [90.0, 90.39], [101.0, 101.46], [105.0, 105.83], [109.0, 110.76], [124.0, 125.39]], "keep_status": [true, false, false, false, true, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [31.5, 0.0, 0.0, 0.0, 34.98, 0.0, 0.0, 32.18, 0.0, 31.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 55.16], ["boing", 9.03], ["musical instrument", 5.52]], null, null, null, [["music", 50.6], ["speech", 7.29], ["musical instrument", 2.85]], null, null, [["music", 50.28], ["boing", 3.59], ["music of latin america", 3.55]], null, [["music", 29.86], ["speech", 10.92], ["mosquito", 8.83]], null, null, null, null, null, null, null, null], "duration": [15.84, 1.74, -0.27, 0.75, 2.83, 0.18, 0.88, 2.72, 0.15, 7.67, 1.7, 0.82, 0.32, 0.39, 0.46, 0.83, 1.76, 1.39]} \ No newline at end of file diff --git a/annotations_filtered/-oPHsR72Lfo_filtered.json b/annotations_filtered/-oPHsR72Lfo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd0a446a9aac6611e0b09ce4fc69c3cc99b3b2ac --- /dev/null +++ b/annotations_filtered/-oPHsR72Lfo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.0], [3.0, 4.09], [9.0, 12.56], [41.0, 41.37], [92.0, 92.42], [97.0, 97.8], [113.0, 113.78], [115.0, 115.74], [119.0, 119.18], [124.0, 124.73], [127.0, 128.46], [129.0, 130.0], [131.0, 131.58], [141.0, 142.08]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 32.28], ["synthesizer", 11.62], ["throbbing", 8.78]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.0, 1.09, 3.56, 0.37, 0.42, 0.8, 0.78, 0.74, 0.18, 0.73, 1.46, 1.0, 0.58, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/-oRm-YxsEH8_filtered.json b/annotations_filtered/-oRm-YxsEH8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..818cef5f5c59d18def89785f6af7e355a25bb51d --- /dev/null +++ b/annotations_filtered/-oRm-YxsEH8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 69.9], [72.0, 78.44], [80.0, 84.86], [87.0, 86.9], [88.0, 88.32], [95.0, 101.63], [104.0, 122.32], [124.0, 126.17], [127.0, 130.45]], "keep_status": [false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 55.6, 99.78, 0.0, 0.0, 95.37, 31.95, 96.54, 99.26], "audiomae_on_audioset": [null, null, null, null, null, null, [["explosion", 17.63], ["hum", 9.85], ["gunshot, gunfire", 5.61]], null, null], "duration": [43.9, 6.44, 4.86, -0.1, 0.32, 6.63, 18.32, 2.17, 3.45]} \ No newline at end of file diff --git a/annotations_filtered/-oeFJvhvMik_filtered.json b/annotations_filtered/-oeFJvhvMik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a63f5be7f9d03fe9b2e362b50a571fc377d0c3f --- /dev/null +++ b/annotations_filtered/-oeFJvhvMik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.18], [16.0, 15.87], [16.0, 15.9], [16.0, 17.42], [19.0, 19.94], [23.0, 24.07], [26.0, 27.16], [28.0, 29.29], [30.0, 32.76], [34.0, 34.48], [35.0, 37.42], [46.0, 47.8], [49.0, 49.92], [51.0, 53.18], [55.0, 55.43], [58.0, 63.32], [64.0, 64.5], [65.0, 65.65], [68.0, 69.25], [71.0, 72.71], [73.0, 74.26], [76.0, 77.53], [79.0, 79.54], [80.0, 80.49], [82.0, 82.48], [83.0, 83.51], [85.0, 85.53], [87.0, 91.37], [94.0, 94.26], [95.0, 95.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 100.0, 0.0, 0.0, 99.98, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.18, -0.13, -0.1, 1.42, 0.94, 1.07, 1.16, 1.29, 2.76, 0.48, 2.42, 1.8, 0.92, 2.18, 0.43, 5.32, 0.5, 0.65, 1.25, 1.71, 1.26, 1.53, 0.54, 0.49, 0.48, 0.51, 0.53, 4.37, 0.26, 0.93]} \ No newline at end of file diff --git a/annotations_filtered/-opqUSOUDQY_filtered.json b/annotations_filtered/-opqUSOUDQY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c672e7ee3d096d98c53a5aceee64617d56d6edf7 --- /dev/null +++ b/annotations_filtered/-opqUSOUDQY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.12], [13.0, 13.42], [15.0, 14.99], [16.0, 16.8], [20.0, 25.79], [27.0, 26.65], [27.0, 26.76], [30.0, 29.93], [31.0, 34.21], [35.0, 37.98], [42.0, 42.99], [44.0, 44.69], [46.0, 49.87], [50.0, 51.31], [53.0, 53.87], [55.0, 57.01], [59.0, 64.02], [66.0, 66.48], [68.0, 68.18], [72.0, 75.41], [80.0, 81.01], [83.0, 82.73], [84.0, 85.13], [86.0, 86.97], [88.0, 90.22], [95.0, 98.36], [100.0, 100.53], [102.0, 102.2], [104.0, 106.81], [107.0, 109.76], [111.0, 112.63], [116.0, 116.14], [116.0, 116.67], [118.0, 118.57], [120.0, 120.34], [121.0, 122.74], [126.0, 126.15], [136.0, 136.75], [138.0, 139.02], [146.0, 151.68], [155.0, 155.76], [158.0, 158.19], [164.0, 165.35], [166.0, 166.9], [169.0, 169.65], [171.0, 171.49], [172.0, 173.08], [175.0, 184.0], [185.0, 185.5], [192.0, 197.02], [202.0, 202.63], [204.0, 204.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 93.13, 0.0, 0.0, 97.92, 82.25, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 0.0, 69.61, 54.5, 0.0, 0.0, 61.97, 42.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.24, 0.0, 34.39, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 44.84], ["burping, eructation", 10.7], ["busy signal", 9.25]], null, null, null, null, null, null, null, null, null, [["throbbing", 45.38], ["speech", 17.87], ["music", 14.08]], null, null, null, null, null, null, null, [["speech", 47.63], ["music", 17.9], ["whack, thwack", 7.31]], null, [["quack", 42.19], ["music", 12.15], ["duck", 12.09]], null, null], "duration": [2.12, 0.42, -0.01, 0.8, 5.79, -0.35, -0.24, -0.07, 3.21, 2.98, 0.99, 0.69, 3.87, 1.31, 0.87, 2.01, 5.02, 0.48, 0.18, 3.41, 1.01, -0.27, 1.13, 0.97, 2.22, 3.36, 0.53, 0.2, 2.81, 2.76, 1.63, 0.14, 0.67, 0.57, 0.34, 1.74, 0.15, 0.75, 1.02, 5.68, 0.76, 0.19, 1.35, 0.9, 0.65, 0.49, 1.08, 9.0, 0.5, 5.02, 0.63, 0.55]} \ No newline at end of file diff --git a/annotations_filtered/-p4TkuB20bs_filtered.json b/annotations_filtered/-p4TkuB20bs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..019c7018b72f8aa75a739e6a18f0df31fdfe528f --- /dev/null +++ b/annotations_filtered/-p4TkuB20bs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 14.25], [16.0, 16.23], [18.0, 24.85], [33.0, 36.48], [43.0, 44.22], [44.0, 56.44], [66.0, 69.11]], "keep_status": [true, false, false, true, false, true, false], "silence_prob": [35.87, 0.0, 75.39, 36.97, 0.0, 29.99, 32.77], "audiomae_on_audioset": [[["speech", 36.11], ["music", 20.41], ["hum", 6.98]], null, null, [["speech", 30.55], ["hum", 26.34], ["rumble", 7.89]], null, [["throbbing", 29.68], ["hum", 19.35], ["music", 13.8]], [["music", 40.65], ["hum", 24.19], ["throbbing", 14.38]]], "duration": [9.25, 0.23, 6.85, 3.48, 1.22, 12.44, 3.11]} \ No newline at end of file diff --git a/annotations_filtered/-pEKUJ9MADs_filtered.json b/annotations_filtered/-pEKUJ9MADs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b175c9331f72ca9d12d43f419c274012ef8ba19b --- /dev/null +++ b/annotations_filtered/-pEKUJ9MADs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.88], [3.0, 4.67], [8.0, 23.09], [24.0, 25.05], [28.0, 30.25], [32.0, 32.49], [35.0, 35.7], [38.0, 37.86], [41.0, 41.81], [43.0, 43.01], [52.0, 52.69], [60.0, 60.34], [75.0, 76.13], [99.0, 99.3], [101.0, 101.88], [107.0, 106.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 99.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.88, 1.67, 15.09, 1.05, 2.25, 0.49, 0.7, -0.14, 0.81, 0.01, 0.69, 0.34, 1.13, 0.3, 0.88, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/-pKrpqoPu1o_filtered.json b/annotations_filtered/-pKrpqoPu1o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5433da0d80954e9304a5727e2e27ca70c9f860c --- /dev/null +++ b/annotations_filtered/-pKrpqoPu1o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 29.03], [40.0, 44.95], [47.0, 61.45], [66.0, 121.1]], "keep_status": [false, false, false, false], "silence_prob": [32.75, 37.77, 33.17, 0.0], "audiomae_on_audioset": [[["music", 54.98], ["throbbing", 12.11], ["hum", 8.72]], [["music", 66.88], ["throbbing", 4.95], ["musical instrument", 2.95]], [["music", 54.3], ["hum", 10.59], ["rumble", 8.22]], null], "duration": [24.03, 4.95, 14.45, 55.1]} \ No newline at end of file diff --git a/annotations_filtered/-pXlicO85dk_filtered.json b/annotations_filtered/-pXlicO85dk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5398d1743ab0de23af8e2f6ad5694733909db53 --- /dev/null +++ b/annotations_filtered/-pXlicO85dk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.24], [12.0, 15.16], [17.0, 19.41], [21.0, 21.98], [24.0, 28.02], [34.0, 35.4], [40.0, 42.6], [44.0, 49.82], [51.0, 56.29], [57.0, 58.78], [61.0, 62.58], [63.0, 69.69], [72.0, 73.04], [77.0, 80.45], [83.0, 89.23], [91.0, 92.82], [95.0, 97.02], [98.0, 99.13], [101.0, 101.66], [102.0, 112.14], [113.0, 121.98]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 90.78, 43.53, 0.0, 98.44, 0.0, 61.57, 33.83, 41.44, 0.0, 0.0, 38.15, 0.0, 93.13, 45.49, 0.0, 65.67, 0.0, 0.0, 38.22, 44.69], "audiomae_on_audioset": [null, null, [["speech", 59.91], ["sidetone", 5.42], ["hum", 4.71]], null, null, null, null, [["music", 39.43], ["speech", 23.02], ["ambient music", 6.75]], [["music", 33.62], ["theremin", 26.12], ["speech", 8.68]], null, null, [["music", 53.32], ["speech", 17.8], ["speech synthesizer", 7.59]], null, null, [["music", 40.18], ["singing bowl", 16.38], ["speech", 14.78]], null, null, null, null, [["music", 61.01], ["speech", 10.51], ["hum", 3.63]], [["music", 69.93], ["gong", 6.48], ["synthesizer", 3.09]]], "duration": [0.24, 3.16, 2.41, 0.98, 4.02, 1.4, 2.6, 5.82, 5.29, 1.78, 1.58, 6.69, 1.04, 3.45, 6.23, 1.82, 2.02, 1.13, 0.66, 10.14, 8.98]} \ No newline at end of file diff --git a/annotations_filtered/-pix6UL8ONk_filtered.json b/annotations_filtered/-pix6UL8ONk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42325b5cb5ec1948a78683d12e5c1c8719b3b27d --- /dev/null +++ b/annotations_filtered/-pix6UL8ONk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.88], [7.0, 7.47], [16.0, 19.23], [20.0, 19.77], [35.0, 35.19], [40.0, 40.81], [64.0, 66.5], [69.0, 68.79], [70.0, 71.54], [73.0, 75.95], [78.0, 79.08], [82.0, 84.64], [86.0, 97.24], [97.0, 100.77], [104.0, 103.92], [111.0, 111.47], [115.0, 131.55]], "keep_status": [false, false, true, false, false, false, true, false, false, true, false, true, true, true, false, false, true], "silence_prob": [0.0, 0.0, 40.09, 0.0, 0.0, 0.0, 41.56, 0.0, 0.0, 49.09, 0.0, 35.24, 41.58, 33.79, 0.0, 0.0, 30.26], "audiomae_on_audioset": [null, null, [["speech", 9.81], ["crying, sobbing", 7.2], ["baby cry, infant cry", 5.4]], null, null, null, [["speech", 12.57], ["rowboat, canoe, kayak", 12.32], ["horse", 10.92]], null, null, [["speech", 32.37], ["boat, water vehicle", 20.33], ["vehicle", 6.1]], null, [["speech", 29.53], ["hum", 12.96], ["eruption", 5.68]], [["music", 32.15], ["hum", 26.02], ["throbbing", 9.07]], [["music", 45.03], ["hum", 12.62], ["mains hum", 8.28]], null, null, [["music", 52.81], ["speech", 6.15], ["synthesizer", 5.21]]], "duration": [1.88, 0.47, 3.23, -0.23, 0.19, 0.81, 2.5, -0.21, 1.54, 2.95, 1.08, 2.64, 11.24, 3.77, -0.08, 0.47, 16.55]} \ No newline at end of file diff --git a/annotations_filtered/-pq4FpNnvcg_filtered.json b/annotations_filtered/-pq4FpNnvcg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25017a6c5fd3033e722ed17b756a7876db112533 --- /dev/null +++ b/annotations_filtered/-pq4FpNnvcg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 23.68], [24.0, 35.04], [36.0, 36.15], [41.0, 42.15], [43.0, 43.23], [58.0, 60.96], [65.0, 65.94], [69.0, 70.01], [70.0, 74.33], [75.0, 75.88], [77.0, 80.13], [83.0, 84.87], [91.0, 92.8], [94.0, 95.94], [98.0, 99.39], [100.0, 101.65], [105.0, 107.54], [109.0, 113.54], [118.0, 122.99], [124.0, 125.37], [126.0, 129.73], [131.0, 132.75], [136.0, 136.71], [138.0, 138.69], [140.0, 141.18], [145.0, 151.82], [153.0, 154.3], [155.0, 156.42], [158.0, 159.48], [166.0, 167.63], [169.0, 168.84], [169.0, 170.14], [172.0, 172.56], [175.0, 176.99], [178.0, 179.31]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [45.49, 44.43, 0.0, 0.0, 0.0, 84.62, 0.0, 0.0, 76.04, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 98.51, 84.62, 64.07, 0.0, 81.53, 0.0, 0.0, 0.0, 0.0, 66.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 51.51], ["sonar", 13.25], ["hum", 4.76]], [["mains hum", 21.47], ["fly, housefly", 10.83], ["insect", 10.54]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [10.68, 11.04, 0.15, 1.15, 0.23, 2.96, 0.94, 1.01, 4.33, 0.88, 3.13, 1.87, 1.8, 1.94, 1.39, 1.65, 2.54, 4.54, 4.99, 1.37, 3.73, 1.75, 0.71, 0.69, 1.18, 6.82, 1.3, 1.42, 1.48, 1.63, -0.16, 1.14, 0.56, 1.99, 1.31]} \ No newline at end of file diff --git a/annotations_filtered/-qG1Hke8w_8_filtered.json b/annotations_filtered/-qG1Hke8w_8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7cc816498ef19c7a2dcaf81e52a7a128dc826d1 --- /dev/null +++ b/annotations_filtered/-qG1Hke8w_8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.38], [5.0, 4.89], [9.0, 9.96], [10.0, 21.0], [24.0, 26.52], [28.0, 28.53], [29.0, 32.04], [33.0, 38.01], [40.0, 45.35], [47.0, 47.66]], "keep_status": [true, false, false, true, true, false, true, false, false, false], "silence_prob": [37.8, 0.0, 0.0, 38.4, 35.82, 0.0, 40.06, 36.38, 41.2, 0.0], "audiomae_on_audioset": [[["music", 30.06], ["speech", 23.38], ["sidetone", 7.24]], null, null, [["music", 40.75], ["fly, housefly", 20.07], ["insect", 8.51]], [["music", 54.56], ["rattle (instrument)", 4.07], ["speech", 3.8]], null, [["mosquito", 14.52], ["music", 7.96], ["fly, housefly", 6.21]], [["music", 75.77], ["musical instrument", 3.34], ["hum", 2.19]], [["music", 64.95], ["throbbing", 5.96], ["hum", 4.35]], null], "duration": [2.38, -0.11, 0.96, 11.0, 2.52, 0.53, 3.04, 5.01, 5.35, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/-qGU1hiiJfU_filtered.json b/annotations_filtered/-qGU1hiiJfU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..195994a65dd66ad5a7a010eb3275f5a4f71f3a58 --- /dev/null +++ b/annotations_filtered/-qGU1hiiJfU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.36], [7.0, 8.34], [10.0, 10.4], [12.0, 12.51], [24.0, 26.91], [30.0, 31.94], [45.0, 46.82], [58.0, 57.97], [58.0, 58.8], [61.0, 62.41], [63.0, 63.96], [71.0, 73.52], [76.0, 76.44], [80.0, 83.25], [85.0, 86.04], [111.0, 111.74], [113.0, 114.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 57.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.99, 0.0, 82.61, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 38.33], ["moo", 32.03], ["livestock, farm animals, working animals", 23.09]], null, null, null, null, null], "duration": [0.36, 1.34, 0.4, 0.51, 2.91, 1.94, 1.82, -0.03, 0.8, 1.41, 0.96, 2.52, 0.44, 3.25, 1.04, 0.74, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/-qK58CZslAs_filtered.json b/annotations_filtered/-qK58CZslAs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80acac622b5c788769408701034907e5566c24d5 --- /dev/null +++ b/annotations_filtered/-qK58CZslAs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.72], [5.0, 7.5], [8.0, 11.62], [12.0, 13.69], [14.0, 21.19], [22.0, 23.08], [24.0, 24.7], [26.0, 26.59], [28.0, 31.26], [34.0, 34.72], [36.0, 36.75], [37.0, 37.91], [39.0, 42.18], [44.0, 45.37], [49.0, 49.23], [50.0, 51.29], [52.0, 54.38], [55.0, 55.7], [57.0, 57.47], [58.0, 60.27], [61.0, 62.46]], "keep_status": [false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.7, 34.14, 38.38, 0.0, 36.52, 0.0, 0.0, 0.0, 73.97, 0.0, 0.0, 0.0, 31.64, 0.0, 0.0, 0.0, 37.24, 0.0, 0.0, 80.64, 0.0], "audiomae_on_audioset": [[["speech", 88.4], ["fart", 2.21], ["ping", 0.9]], [["ping", 13.89], ["music", 7.48], ["effects unit", 6.84]], [["ping", 26.84], ["speech", 21.26], ["inside, small room", 6.4]], null, [["noise", 30.24], ["speech", 21.63], ["fart", 5.72]], null, null, null, null, null, null, null, [["speech", 84.55], ["radio", 6.95], ["fart", 2.74]], null, null, null, [["speech", 40.84], ["noise", 21.47], ["radio", 15.87]], null, null, null, null], "duration": [3.72, 2.5, 3.62, 1.69, 7.19, 1.08, 0.7, 0.59, 3.26, 0.72, 0.75, 0.91, 3.18, 1.37, 0.23, 1.29, 2.38, 0.7, 0.47, 2.27, 1.46]} \ No newline at end of file diff --git a/annotations_filtered/-qSADHn4nqw_filtered.json b/annotations_filtered/-qSADHn4nqw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0780a002451a01ff80675e358188f3b4ffffc85 --- /dev/null +++ b/annotations_filtered/-qSADHn4nqw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.34], [10.0, 10.76], [13.0, 14.2], [14.0, 16.19], [17.0, 18.01], [24.0, 26.06], [28.0, 28.53], [30.0, 30.81], [32.0, 33.03], [33.0, 34.11], [36.0, 50.84], [52.0, 53.43], [54.0, 54.63], [55.0, 58.95], [60.0, 64.89], [68.0, 72.55], [73.0, 73.47], [77.0, 80.62], [81.0, 90.19], [93.0, 104.35], [106.0, 119.1], [140.0, 140.02], [143.0, 144.21], [162.0, 163.16], [164.0, 164.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 52.51, 0.0, 40.26, 0.0, 0.0, 0.0, 0.0, 37.27, 0.0, 0.0, 53.22, 40.66, 34.02, 0.0, 37.51, 33.15, 35.24, 35.66, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 62.78], ["musical instrument", 8.9], ["guitar", 7.0]], null, null, null, null, [["music", 58.61], ["speech", 11.5], ["livestock, farm animals, working animals", 3.29]], null, null, null, [["theremin", 46.44], ["music", 39.58], ["musical instrument", 2.42]], [["music", 69.52], ["synthesizer", 4.09], ["throbbing", 3.12]], null, [["music", 46.72], ["didgeridoo", 9.59], ["speech", 8.08]], [["music", 45.15], ["speech", 30.06], ["didgeridoo", 3.36]], [["music", 37.35], ["speech", 27.38], ["tabla", 9.95]], [["foghorn", 32.71], ["music", 20.62], ["speech", 13.06]], null, null, null, null], "duration": [1.34, 0.76, 1.2, 2.19, 1.01, 2.06, 0.53, 0.81, 1.03, 1.11, 14.84, 1.43, 0.63, 3.95, 4.89, 4.55, 0.47, 3.62, 9.19, 11.35, 13.1, 0.02, 1.21, 1.16, 0.22]} \ No newline at end of file diff --git a/annotations_filtered/-qdHE9-8spU_filtered.json b/annotations_filtered/-qdHE9-8spU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6270708b84d60b37c5ceeec6a5a7cfc0de536e2c --- /dev/null +++ b/annotations_filtered/-qdHE9-8spU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.57], [13.0, 17.15], [18.0, 20.66], [21.0, 26.03], [29.0, 30.64], [31.0, 32.26], [34.0, 40.68], [41.0, 43.75], [50.0, 51.16], [54.0, 54.97], [56.0, 57.06], [67.0, 68.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.78, 99.56, 98.73, 99.44, 0.0, 0.0, 99.84, 98.93, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.57, 4.15, 2.66, 5.03, 1.64, 1.26, 6.68, 2.75, 1.16, 0.97, 1.06, 1.86]} \ No newline at end of file diff --git a/annotations_filtered/-qijwXk_bnk_filtered.json b/annotations_filtered/-qijwXk_bnk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74f711393f5085ce03233c98bbaf65eb168b9bbb --- /dev/null +++ b/annotations_filtered/-qijwXk_bnk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 47.16], [50.0, 54.11], [55.0, 97.75], [99.0, 100.09], [101.0, 102.22], [103.0, 103.03], [104.0, 105.53], [107.0, 107.91], [109.0, 111.0]], "keep_status": [false, true, false, false, false, false, false, false, false], "silence_prob": [36.26, 44.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.53], "audiomae_on_audioset": [[["music", 80.4], ["soundtrack music", 4.66], ["hum", 3.16]], [["music", 56.14], ["scary music", 5.75], ["harmonic", 2.32]], null, null, null, null, null, null, null], "duration": [9.16, 4.11, 42.75, 1.09, 1.22, 0.03, 1.53, 0.91, 2.0]} \ No newline at end of file diff --git a/annotations_filtered/-qmkhAXmBNc_filtered.json b/annotations_filtered/-qmkhAXmBNc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54480387dd1b91fdde702b0c891b88409722c2f3 --- /dev/null +++ b/annotations_filtered/-qmkhAXmBNc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.23], [22.0, 23.16], [31.0, 33.15], [48.0, 48.52], [61.0, 64.56], [66.0, 67.53], [71.0, 72.57]], "keep_status": [false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 44.23, 0.0, 45.27, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 43.24], ["sidetone", 18.95], ["whale vocalization", 10.48]], null, [["quack", 15.37], ["caw", 8.51], ["crow", 7.29]], null, null], "duration": [0.23, 1.16, 2.15, 0.52, 3.56, 1.53, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/-r_-EnupRXo_filtered.json b/annotations_filtered/-r_-EnupRXo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/-r_-EnupRXo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/-r_jjQ_idz8_filtered.json b/annotations_filtered/-r_jjQ_idz8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..112b52fae3c17f6c2437bfa6590b43770bbfbbe6 --- /dev/null +++ b/annotations_filtered/-r_jjQ_idz8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.45], [7.0, 8.06], [9.0, 10.07], [12.0, 12.78], [15.0, 16.24], [17.0, 17.91], [19.0, 19.28], [20.0, 20.58], [21.0, 22.17], [22.0, 22.98], [24.0, 24.7], [29.0, 29.59], [31.0, 32.22], [34.0, 35.28], [36.0, 37.15], [39.0, 39.19], [40.0, 41.44], [42.0, 43.23], [46.0, 46.25], [47.0, 47.85], [49.0, 49.87], [51.0, 52.05], [53.0, 53.97], [55.0, 56.47], [57.0, 60.91], [62.0, 64.22], [73.0, 81.5], [82.0, 86.98], [87.0, 88.43], [91.0, 91.83], [93.0, 93.21], [96.0, 99.93], [101.0, 101.49], [103.0, 103.06], [104.0, 104.84], [105.0, 114.0], [114.0, 114.94], [116.0, 117.05], [117.0, 119.91], [122.0, 123.85], [125.0, 129.93], [131.0, 132.58], [133.0, 134.62], [137.0, 138.32], [139.0, 140.83], [142.0, 146.99], [148.0, 150.94]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, true, false, false, true, false, false, false, false, false, false, true, true], "silence_prob": [32.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.56, 32.2, 30.68, 34.65, 0.0, 0.0, 0.0, 36.93, 0.0, 0.0, 0.0, 32.46, 0.0, 0.0, 36.42, 0.0, 44.66, 0.0, 0.0, 0.0, 0.0, 40.36, 37.43], "audiomae_on_audioset": [[["mains hum", 31.28], ["hum", 23.0], ["speech", 13.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 25.45], ["hum", 19.35], ["fly, housefly", 16.28]], [["music", 72.9], ["trombone", 3.34], ["musical instrument", 3.0]], [["theremin", 54.71], ["music", 31.3], ["musical instrument", 4.68]], [["theremin", 41.98], ["music", 35.85], ["hum", 3.99]], null, null, null, [["music", 42.56], ["gong", 8.72], ["musical instrument", 6.2]], null, null, null, [["music", 35.98], ["hum", 21.75], ["didgeridoo", 10.44]], null, null, [["music", 36.1], ["musical instrument", 12.55], ["speech", 7.01]], null, [["didgeridoo", 58.71], ["music", 19.53], ["hum", 4.79]], null, null, null, null, [["music", 28.47], ["hum", 19.45], ["theremin", 14.16]], [["music", 20.47], ["theremin", 14.15], ["hum", 13.87]]], "duration": [3.45, 1.06, 1.07, 0.78, 1.24, 0.91, 0.28, 0.58, 1.17, 0.98, 0.7, 0.59, 1.22, 1.28, 1.15, 0.19, 1.44, 1.23, 0.25, 0.85, 0.87, 1.05, 0.97, 1.47, 3.91, 2.22, 8.5, 4.98, 1.43, 0.83, 0.21, 3.93, 0.49, 0.06, 0.84, 9.0, 0.94, 1.05, 2.91, 1.85, 4.93, 1.58, 1.62, 1.32, 1.83, 4.99, 2.94]} \ No newline at end of file diff --git a/annotations_filtered/-rebHHoZJSM_filtered.json b/annotations_filtered/-rebHHoZJSM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4983902f14715fe7c29c13687b2d93292bfc2284 --- /dev/null +++ b/annotations_filtered/-rebHHoZJSM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.86], [15.0, 15.18], [17.0, 17.34], [18.0, 18.55], [20.0, 20.78], [23.0, 23.28], [24.0, 24.54], [43.0, 43.75], [48.0, 48.57], [56.0, 56.0], [57.0, 57.23], [58.0, 58.72], [61.0, 61.74], [65.0, 65.35], [68.0, 68.55], [70.0, 70.68], [78.0, 78.44], [92.0, 93.68], [100.0, 100.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [79.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.86, 0.18, 0.34, 0.55, 0.78, 0.28, 0.54, 0.75, 0.57, 0.0, 0.23, 0.72, 0.74, 0.35, 0.55, 0.68, 0.44, 1.68, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/-rkhqMzCUnA_filtered.json b/annotations_filtered/-rkhqMzCUnA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d0b066052279cd9cadb243588d37b018d267ed7 --- /dev/null +++ b/annotations_filtered/-rkhqMzCUnA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.34], [5.0, 5.43], [19.0, 20.41], [24.0, 24.48], [26.0, 26.94], [30.0, 30.54], [43.0, 43.43], [45.0, 45.81], [50.0, 49.96], [76.0, 76.33], [90.0, 90.29], [95.0, 99.01], [102.0, 103.22], [104.0, 104.5], [106.0, 107.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.24, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["fart", 14.23], ["sidetone", 10.64], ["noise", 9.66]], null, null, null], "duration": [0.34, 0.43, 1.41, 0.48, 0.94, 0.54, 0.43, 0.81, -0.04, 0.33, 0.29, 4.01, 1.22, 0.5, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/-rmALJkEprY_filtered.json b/annotations_filtered/-rmALJkEprY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44671ac1819bd4d287bbe7715e6c41d1db7ab7d7 --- /dev/null +++ b/annotations_filtered/-rmALJkEprY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.33], [5.0, 9.44], [15.0, 26.6], [30.0, 37.0], [48.0, 49.05], [50.0, 51.75], [54.0, 54.9], [57.0, 112.62], [114.0, 116.4], [117.0, 119.42]], "keep_status": [false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 59.59, 35.2, 33.44, 0.0, 0.0, 0.0, 0.0, 37.77, 36.89], "audiomae_on_audioset": [null, null, [["music", 43.52], ["theremin", 39.13], ["musical instrument", 3.93]], [["music", 70.1], ["musical instrument", 3.95], ["theremin", 3.89]], null, null, null, null, [["music", 31.77], ["hum", 4.03], ["cowbell", 3.9]], [["music", 19.46], ["speech", 6.42], ["vehicle", 4.35]]], "duration": [1.33, 4.44, 11.6, 7.0, 1.05, 1.75, 0.9, 55.62, 2.4, 2.42]} \ No newline at end of file diff --git a/annotations_filtered/-rq6IBVPcBU_filtered.json b/annotations_filtered/-rq6IBVPcBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f8656a95e05db5401caab1bc77e73d4112bef3f --- /dev/null +++ b/annotations_filtered/-rq6IBVPcBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.03], [21.0, 21.25], [27.0, 29.2], [30.0, 32.02], [33.0, 34.03], [35.0, 38.55], [39.0, 39.8], [44.0, 45.08], [51.0, 66.45], [68.0, 73.94], [74.0, 108.03], [109.0, 116.02], [119.0, 124.85], [127.0, 128.38]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 83.34, 77.36, 0.0, 43.61, 0.0, 0.0, 37.8, 30.31, 0.0, 32.37, 32.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["fly, housefly", 12.56], ["mosquito", 10.22], ["speech", 8.61]], null, null, [["speech", 69.04], ["radio", 14.7], ["noise", 6.11]], [["music", 62.96], ["speech", 21.19], ["boing", 7.0]], null, [["music", 57.96], ["speech", 15.05], ["synthesizer", 5.22]], [["music", 43.03], ["speech", 18.48], ["throbbing", 4.38]], null], "duration": [0.03, 0.25, 2.2, 2.02, 1.03, 3.55, 0.8, 1.08, 15.45, 5.94, 34.03, 7.02, 5.85, 1.38]} \ No newline at end of file diff --git a/annotations_filtered/-rsImQShehk_filtered.json b/annotations_filtered/-rsImQShehk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46b11c51cfa59e230fb248107e28c98c7ee2148e --- /dev/null +++ b/annotations_filtered/-rsImQShehk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.7], [4.0, 31.78], [33.0, 36.85], [37.0, 36.88], [37.0, 37.44], [37.0, 37.5], [38.0, 38.08], [41.0, 40.86], [42.0, 42.45], [43.0, 47.97], [48.0, 97.09], [101.0, 108.01]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 30.78, 54.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.43, 0.0, 30.51], "audiomae_on_audioset": [null, [["sheep", 19.58], ["livestock, farm animals, working animals", 17.46], ["cattle, bovinae", 16.0]], null, null, null, null, null, null, null, [["speech", 35.28], ["hum", 19.58], ["music", 9.9]], null, [["throbbing", 37.56], ["hum", 27.33], ["music", 14.82]]], "duration": [0.7, 27.78, 3.85, -0.12, 0.44, 0.5, 0.08, -0.14, 0.45, 4.97, 49.09, 7.01]} \ No newline at end of file diff --git a/annotations_filtered/-sD2jY0KMA8_filtered.json b/annotations_filtered/-sD2jY0KMA8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62bc1200a72264af786ad118a1127fe02182c49f --- /dev/null +++ b/annotations_filtered/-sD2jY0KMA8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.81], [17.0, 24.04], [26.0, 27.46], [39.0, 39.14], [43.0, 53.23], [57.0, 57.3], [59.0, 59.53], [62.0, 63.61], [64.0, 67.24], [70.0, 71.46], [80.0, 80.69], [83.0, 88.97], [91.0, 100.45], [105.0, 105.88], [112.0, 112.62]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, true, false, false, false], "silence_prob": [36.2, 32.0, 0.0, 0.0, 30.2, 0.0, 0.0, 0.0, 31.01, 0.0, 0.0, 33.01, 30.17, 0.0, 0.0], "audiomae_on_audioset": [[["music", 29.96], ["throbbing", 17.24], ["hum", 16.9]], [["music", 62.1], ["throbbing", 10.26], ["hum", 10.04]], null, null, [["music", 44.72], ["didgeridoo", 16.05], ["throbbing", 6.48]], null, null, null, [["didgeridoo", 46.37], ["music", 31.04], ["quack", 2.26]], null, null, [["speech", 36.66], ["throbbing", 14.81], ["music", 10.5]], [["music", 52.55], ["speech", 38.81], ["boing", 4.76]], null, null], "duration": [3.81, 7.04, 1.46, 0.14, 10.23, 0.3, 0.53, 1.61, 3.24, 1.46, 0.69, 5.97, 9.45, 0.88, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/-sJezi3j7O8_filtered.json b/annotations_filtered/-sJezi3j7O8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ddbcd7a19f9c921aeff81ed50e82b6fddaf2c62 --- /dev/null +++ b/annotations_filtered/-sJezi3j7O8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.33], [13.0, 13.95], [16.0, 17.88], [29.0, 29.39], [33.0, 35.33], [36.0, 37.13], [41.0, 41.49], [43.0, 44.52], [66.0, 67.66], [69.0, 73.53], [76.0, 76.69], [77.0, 87.39], [91.0, 110.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 67.76, 0.0, 0.0, 0.0, 0.0, 78.04, 0.0, 34.04, 41.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 47.45], ["didgeridoo", 24.45], ["speech", 9.39]], [["music", 54.97], ["speech", 8.22], ["synthesizer", 6.54]]], "duration": [0.33, 0.95, 1.88, 0.39, 2.33, 1.13, 0.49, 1.52, 1.66, 4.53, 0.69, 10.39, 19.76]} \ No newline at end of file diff --git a/annotations_filtered/-sYKI4A3uhc_filtered.json b/annotations_filtered/-sYKI4A3uhc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d01c5f102cb1711ca3432c29f84f5938599cf08 --- /dev/null +++ b/annotations_filtered/-sYKI4A3uhc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.46], [5.0, 6.84], [14.0, 17.61], [21.0, 34.64], [36.0, 47.44], [50.0, 53.13], [56.0, 71.44], [71.0, 85.94], [89.0, 88.57], [89.0, 88.6], [89.0, 98.93], [109.0, 114.17], [122.0, 159.63], [160.0, 160.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 42.15, 33.13, 31.3, 31.84, 31.66, 31.26, 0.0, 0.0, 30.39, 30.56, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 51.28], ["speech", 14.48], ["musical instrument", 6.42]], [["music", 81.71], ["soul music", 2.19], ["independent music", 1.15]], [["music", 86.44], ["singing", 1.1], ["country", 0.95]], [["music", 66.87], ["guitar", 7.5], ["musical instrument", 6.78]], [["music", 78.2], ["synthesizer", 1.9], ["singing", 1.34]], [["music", 79.49], ["singing", 1.19], ["song", 1.05]], null, null, [["music", 73.79], ["singing", 3.6], ["musical instrument", 1.63]], [["music", 54.2], ["funk", 3.07], ["soul music", 2.17]], null, null], "duration": [0.46, 1.84, 3.61, 13.64, 11.44, 3.13, 15.44, 14.94, -0.43, -0.4, 9.93, 5.17, 37.63, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/-sv5DJfslVM_filtered.json b/annotations_filtered/-sv5DJfslVM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6645b1f154d892ada6ae35006ed700eafbe8131b --- /dev/null +++ b/annotations_filtered/-sv5DJfslVM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.39], [13.0, 14.99], [18.0, 20.58], [21.0, 24.63], [27.0, 29.15], [31.0, 33.76], [35.0, 35.48], [40.0, 41.01], [43.0, 46.72], [48.0, 49.87], [52.0, 52.98], [55.0, 59.64], [61.0, 61.45], [62.0, 67.41], [69.0, 73.23], [75.0, 77.26], [79.0, 79.91], [80.0, 85.68], [87.0, 95.32], [97.0, 101.61], [103.0, 103.72], [108.0, 117.54], [118.0, 121.8]], "keep_status": [true, false, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.5, 0.0, 44.84, 44.84, 39.55, 44.49, 0.0, 0.0, 98.44, 0.0, 0.0, 61.08, 0.0, 95.09, 98.86, 99.4, 0.0, 69.61, 56.1, 64.86, 0.0, 97.22, 43.85], "audiomae_on_audioset": [[["music", 35.08], ["theremin", 22.74], ["fly, housefly", 7.08]], null, [["music", 49.39], ["musical instrument", 5.5], ["singing bowl", 4.22]], [["music", 56.93], ["ambient music", 4.22], ["synthesizer", 3.69]], [["speech", 26.62], ["hum", 8.18], ["music", 7.88]], [["speech", 32.46], ["sidetone", 11.26], ["tuning fork", 9.61]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 64.33], ["tuning fork", 8.19], ["chirp tone", 2.88]]], "duration": [4.39, 1.99, 2.58, 3.63, 2.15, 2.76, 0.48, 1.01, 3.72, 1.87, 0.98, 4.64, 0.45, 5.41, 4.23, 2.26, 0.91, 5.68, 8.32, 4.61, 0.72, 9.54, 3.8]} \ No newline at end of file diff --git a/annotations_filtered/-swpG7VRhpQ_filtered.json b/annotations_filtered/-swpG7VRhpQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32c4409e990d906f40082ec8ae267c54b2a21696 --- /dev/null +++ b/annotations_filtered/-swpG7VRhpQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.77], [4.0, 4.56], [28.0, 29.24], [31.0, 31.5], [33.0, 35.73], [47.0, 47.14], [60.0, 65.64], [67.0, 67.66], [73.0, 73.77], [75.0, 79.54], [80.0, 81.75], [84.0, 86.61], [88.0, 90.05], [90.0, 91.3], [93.0, 94.61], [96.0, 97.55], [99.0, 101.73], [116.0, 116.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 60.42, 0.0, 52.05, 0.0, 0.0, 74.29, 0.0, 56.78, 47.43, 0.0, 0.0, 0.0, 35.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 22.3], ["music", 14.65], ["radio", 9.88]], null, null, null, [["music", 20.17], ["throbbing", 19.2], ["hum", 16.37]], null], "duration": [1.77, 0.56, 1.24, 0.5, 2.73, 0.14, 5.64, 0.66, 0.77, 4.54, 1.75, 2.61, 2.05, 1.3, 1.61, 1.55, 2.73, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/-szJznl-3UE_filtered.json b/annotations_filtered/-szJznl-3UE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b8158f5d9971f3fa21cce10135ae9fb29482ba3 --- /dev/null +++ b/annotations_filtered/-szJznl-3UE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.23], [22.0, 22.84], [25.0, 25.95], [29.0, 28.93], [38.0, 38.37], [43.0, 43.56], [57.0, 56.79], [63.0, 63.76], [65.0, 64.98], [68.0, 69.4], [75.0, 75.76], [79.0, 78.81], [79.0, 80.69], [87.0, 88.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.23, 0.84, 0.95, -0.07, 0.37, 0.56, -0.21, 0.76, -0.02, 1.4, 0.76, -0.19, 1.69, 1.37]} \ No newline at end of file diff --git a/annotations_filtered/-t06SZje8O0_filtered.json b/annotations_filtered/-t06SZje8O0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f534ac2a46aa6371ffdd3be23694d5f4e73e821a --- /dev/null +++ b/annotations_filtered/-t06SZje8O0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 41.22], [43.0, 47.71], [49.0, 49.0], [49.0, 49.59], [51.0, 72.35]], "keep_status": [true, true, false, false, true], "silence_prob": [30.68, 30.19, 0.0, 0.0, 29.6], "audiomae_on_audioset": [[["music", 57.58], ["thunk", 6.6], ["hum", 5.1]], [["speech", 21.52], ["music", 19.94], ["rumble", 6.61]], null, null, [["speech", 39.86], ["music", 11.03], ["explosion", 5.14]]], "duration": [17.22, 4.71, 0.0, 0.59, 21.35]} \ No newline at end of file diff --git a/annotations_filtered/-tXr3ask1fo_filtered.json b/annotations_filtered/-tXr3ask1fo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..882408398e2718c799cccc73df573b061f4a87a8 --- /dev/null +++ b/annotations_filtered/-tXr3ask1fo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.07], [8.0, 23.03], [24.0, 25.32], [26.0, 25.81], [30.0, 30.42], [34.0, 63.73], [64.0, 75.1], [75.0, 75.96], [77.0, 82.11], [82.0, 107.54]], "keep_status": [false, true, false, false, false, false, false, false, false, false], "silence_prob": [59.59, 40.81, 0.0, 0.0, 0.0, 40.5, 60.98, 0.0, 63.96, 37.2], "audiomae_on_audioset": [null, [["music", 56.31], ["musical instrument", 7.09], ["brass instrument", 5.09]], null, null, null, [["music", 56.31], ["brass instrument", 11.51], ["musical instrument", 7.91]], null, null, null, [["speech", 57.73], ["thunk", 9.14], ["music", 9.03]]], "duration": [4.07, 15.03, 1.32, -0.19, 0.42, 29.73, 11.1, 0.96, 5.11, 25.54]} \ No newline at end of file diff --git a/annotations_filtered/-tuNR-uD_mE_filtered.json b/annotations_filtered/-tuNR-uD_mE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e60203531f0cad45103f8f4386996a36792862f9 --- /dev/null +++ b/annotations_filtered/-tuNR-uD_mE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[52.0, 52.32], [53.0, 73.28], [77.0, 98.81], [101.0, 121.81]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 40.19, 32.43, 33.13], "audiomae_on_audioset": [null, [["music", 77.19], ["effects unit", 4.34], ["guitar", 2.79]], [["music", 50.71], ["theremin", 29.75], ["musical instrument", 1.94]], [["music", 83.14], ["theremin", 3.36], ["didgeridoo", 2.7]]], "duration": [0.32, 20.28, 21.81, 20.81]} \ No newline at end of file diff --git a/annotations_filtered/-u1uwI5qJ74_filtered.json b/annotations_filtered/-u1uwI5qJ74_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..370c09ea768e9c581a33f4bac114df0ee3f6625e --- /dev/null +++ b/annotations_filtered/-u1uwI5qJ74_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.03], [15.0, 20.06], [20.0, 21.74], [25.0, 28.71], [32.0, 40.0], [44.0, 52.2], [53.0, 56.64], [74.0, 76.6], [81.0, 82.22], [98.0, 113.51], [118.0, 122.27], [126.0, 133.98], [147.0, 152.02], [152.0, 154.7]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false, true, false], "silence_prob": [46.79, 35.58, 0.0, 36.31, 33.48, 37.61, 36.2, 32.31, 0.0, 31.81, 32.36, 30.94, 31.87, 54.1], "audiomae_on_audioset": [[["speech", 76.95], ["burping, eructation", 4.68], ["male speech, man speaking", 3.51]], [["speech", 42.5], ["music", 29.1], ["thunk", 3.95]], null, [["music", 67.88], ["synthesizer", 3.22], ["whack, thwack", 2.51]], [["music", 62.57], ["speech", 16.83], ["groan", 5.21]], [["music", 46.6], ["speech", 18.77], ["boing", 11.21]], [["music", 18.98], ["fly, housefly", 8.67], ["speech", 6.46]], [["whack, thwack", 41.58], ["music", 20.14], ["thunk", 11.42]], null, [["music", 43.54], ["speech", 38.88], ["boing", 8.91]], [["music", 11.73], ["theremin", 11.64], ["speech", 10.43]], [["cattle, bovinae", 40.75], ["livestock, farm animals, working animals", 34.61], ["moo", 24.15]], [["music", 28.75], ["mosquito", 17.18], ["shofar", 4.72]], null], "duration": [3.03, 5.06, 1.74, 3.71, 8.0, 8.2, 3.64, 2.6, 1.22, 15.51, 4.27, 7.98, 5.02, 2.7]} \ No newline at end of file diff --git a/annotations_filtered/-uAEWFPmAwU_filtered.json b/annotations_filtered/-uAEWFPmAwU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8dbf7fb5b1529de7d4e536d589dec0ef2d4ddb7 --- /dev/null +++ b/annotations_filtered/-uAEWFPmAwU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.29], [3.0, 3.16], [4.0, 4.11], [5.0, 6.83], [7.0, 8.77], [10.0, 10.1], [15.0, 15.67], [17.0, 18.64], [22.0, 25.54], [28.0, 28.11], [30.0, 30.3], [35.0, 36.46], [38.0, 40.59], [50.0, 50.58], [56.0, 57.16], [65.0, 65.92], [69.0, 68.88], [71.0, 71.29], [73.0, 73.31], [79.0, 80.18], [95.0, 95.23], [96.0, 96.26], [112.0, 113.29], [114.0, 114.56], [115.0, 125.34], [128.0, 129.74], [140.0, 141.71], [145.0, 144.95], [145.0, 163.92], [181.0, 195.61], [200.0, 204.23], [205.0, 208.55], [211.0, 210.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.25, 0.0, 0.0, 0.0, 87.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.6, 0.0, 0.0, 0.0, 31.91, 32.91, 53.1, 78.38, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 58.24], ["mains hum", 8.51], ["throbbing", 4.76]], null, null, null, [["music", 75.51], ["didgeridoo", 6.36], ["theremin", 4.59]], [["music", 82.0], ["theremin", 1.38], ["musical instrument", 1.37]], null, null, null], "duration": [0.29, 0.16, 0.11, 1.83, 1.77, 0.1, 0.67, 1.64, 3.54, 0.11, 0.3, 1.46, 2.59, 0.58, 1.16, 0.92, -0.12, 0.29, 0.31, 1.18, 0.23, 0.26, 1.29, 0.56, 10.34, 1.74, 1.71, -0.05, 18.92, 14.61, 4.23, 3.55, -0.04]} \ No newline at end of file diff --git a/annotations_filtered/-uPSVWxV6d8_filtered.json b/annotations_filtered/-uPSVWxV6d8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da03046e692908f111b6b45ecc97756624245a2f --- /dev/null +++ b/annotations_filtered/-uPSVWxV6d8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.99], [7.0, 7.11], [10.0, 10.69], [12.0, 12.73], [14.0, 14.93], [17.0, 17.79], [21.0, 21.76], [22.0, 22.55], [23.0, 23.9], [42.0, 41.89], [42.0, 47.97], [50.0, 53.0], [54.0, 55.81], [57.0, 59.54], [67.0, 68.13], [70.0, 72.45], [79.0, 80.76], [88.0, 89.31], [93.0, 95.96], [99.0, 100.28], [104.0, 104.6], [111.0, 110.94], [120.0, 127.01], [135.0, 136.24], [137.0, 137.69], [139.0, 139.38], [141.0, 141.3], [144.0, 149.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.97, 95.51, 0.0, 63.21, 0.0, 30.54, 0.0, 0.0, 36.73, 0.0, 0.0, 0.0, 39.89, 0.0, 0.0, 0.0, 0.0, 36.52], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 26.36], ["animal", 21.56], ["dog", 16.16]], null, null, [["music", 65.08], ["musical instrument", 2.12], ["didgeridoo", 1.73]], null, null, null, [["music", 39.29], ["speech", 9.45], ["cattle, bovinae", 3.79]], null, null, null, null, [["music", 72.51], ["speech", 11.24], ["fart", 1.7]]], "duration": [1.99, 0.11, 0.69, 0.73, 0.93, 0.79, 0.76, 0.55, 0.9, -0.11, 5.97, 3.0, 1.81, 2.54, 1.13, 2.45, 1.76, 1.31, 2.96, 1.28, 0.6, -0.06, 7.01, 1.24, 0.69, 0.38, 0.3, 5.4]} \ No newline at end of file diff --git a/annotations_filtered/-uhpev-dp2M_filtered.json b/annotations_filtered/-uhpev-dp2M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8f2608e3bf1856a2b1a9e09c4f905221cae58f5 --- /dev/null +++ b/annotations_filtered/-uhpev-dp2M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.3], [27.0, 27.68], [32.0, 33.0], [34.0, 36.83], [38.0, 39.82], [40.0, 41.66], [45.0, 45.71], [52.0, 52.37], [54.0, 54.63], [57.0, 57.89], [60.0, 60.25], [62.0, 62.87], [68.0, 69.25], [71.0, 74.07], [75.0, 80.94], [82.0, 85.08], [87.0, 88.26], [91.0, 95.45], [98.0, 100.11], [101.0, 102.84], [106.0, 110.66], [113.0, 114.39], [117.0, 118.17], [121.0, 121.15], [123.0, 124.77], [126.0, 127.13], [128.0, 129.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 55.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.33, 62.58, 58.47, 0.0, 53.65, 51.55, 0.0, 57.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.3, 0.68, 1.0, 2.83, 1.82, 1.66, 0.71, 0.37, 0.63, 0.89, 0.25, 0.87, 1.25, 3.07, 5.94, 3.08, 1.26, 4.45, 2.11, 1.84, 4.66, 1.39, 1.17, 0.15, 1.77, 1.13, 1.78]} \ No newline at end of file diff --git a/annotations_filtered/-ui9TwNrNEw_filtered.json b/annotations_filtered/-ui9TwNrNEw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..011a70d1b25650ded0501d7b826aef9572869a98 --- /dev/null +++ b/annotations_filtered/-ui9TwNrNEw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[53.0, 124.44], [126.0, 136.53]], "keep_status": [false, true], "silence_prob": [0.0, 29.52], "audiomae_on_audioset": [null, [["cacophony", 21.86], ["music", 19.57], ["synthesizer", 10.65]]], "duration": [71.44, 10.53]} \ No newline at end of file diff --git a/annotations_filtered/-utei4CzIzc_filtered.json b/annotations_filtered/-utei4CzIzc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53046e84553195bfd03cdd199a50cf8e4f7a6651 --- /dev/null +++ b/annotations_filtered/-utei4CzIzc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.01], [7.0, 7.96], [8.0, 8.75], [11.0, 10.98], [12.0, 12.23], [13.0, 13.68], [15.0, 15.28], [18.0, 18.3], [19.0, 21.0], [22.0, 22.52], [24.0, 24.56], [28.0, 30.32], [53.0, 54.23], [55.0, 55.81], [63.0, 64.35], [70.0, 70.6], [73.0, 74.55], [76.0, 76.91], [78.0, 78.7], [80.0, 80.67], [82.0, 82.46], [84.0, 84.7], [85.0, 85.23], [86.0, 86.27], [88.0, 88.35], [90.0, 90.78], [92.0, 92.53], [95.0, 95.2], [97.0, 97.61], [100.0, 100.41], [102.0, 102.96], [105.0, 105.58], [107.0, 107.22], [110.0, 115.01], [117.0, 123.15], [124.0, 129.52], [133.0, 154.95], [156.0, 162.26], [165.0, 169.08], [181.0, 182.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.09, 0.0, 0.0, 95.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.56, 34.21, 36.2, 53.65, 34.29, 46.05, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.78], ["wind instrument, woodwind instrument", 24.06], ["clarinet", 6.95]], [["music", 52.97], ["wind instrument, woodwind instrument", 20.28], ["musical instrument", 9.73]], [["wind instrument, woodwind instrument", 40.07], ["clarinet", 28.53], ["music", 20.29]], null, [["wind instrument, woodwind instrument", 47.33], ["music", 28.02], ["flute", 5.82]], [["speech", 24.03], ["fart", 4.86], ["crying, sobbing", 4.75]], null], "duration": [2.01, 0.96, 0.75, -0.02, 0.23, 0.68, 0.28, 0.3, 2.0, 0.52, 0.56, 2.32, 1.23, 0.81, 1.35, 0.6, 1.55, 0.91, 0.7, 0.67, 0.46, 0.7, 0.23, 0.27, 0.35, 0.78, 0.53, 0.2, 0.61, 0.41, 0.96, 0.58, 0.22, 5.01, 6.15, 5.52, 21.95, 6.26, 4.08, 1.61]} \ No newline at end of file diff --git a/annotations_filtered/-v-KiIuYkCo_filtered.json b/annotations_filtered/-v-KiIuYkCo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce062225a2f57f0e3efb11488b9eaf758957fd50 --- /dev/null +++ b/annotations_filtered/-v-KiIuYkCo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 17.04], [19.0, 20.75], [22.0, 24.97], [26.0, 27.06], [28.0, 29.44], [32.0, 32.02], [34.0, 36.24], [39.0, 39.73], [42.0, 43.58], [45.0, 50.13], [51.0, 51.58], [52.0, 65.58], [66.0, 68.82]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, true, true], "silence_prob": [34.15, 0.0, 35.63, 0.0, 0.0, 0.0, 42.17, 0.0, 0.0, 30.96, 0.0, 31.87, 34.85], "audiomae_on_audioset": [[["fly, housefly", 51.01], ["insect", 31.69], ["bee, wasp, etc.", 7.13]], null, [["speech", 18.01], ["fly, housefly", 12.72], ["insect", 7.94]], null, null, null, [["rain", 13.64], ["rain on surface", 10.88], ["speech", 9.77]], null, null, [["insect", 42.52], ["fly, housefly", 33.37], ["speech", 7.8]], null, [["speech", 23.23], ["livestock, farm animals, working animals", 22.15], ["animal", 12.9]], [["speech", 36.98], ["music", 8.94], ["burping, eructation", 7.46]]], "duration": [10.04, 1.75, 2.97, 1.06, 1.44, 0.02, 2.24, 0.73, 1.58, 5.13, 0.58, 13.58, 2.82]} \ No newline at end of file diff --git a/annotations_filtered/-v8l6cCrf0w_filtered.json b/annotations_filtered/-v8l6cCrf0w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa3b761e410d497390fbd37a07c1b7130f4aab08 --- /dev/null +++ b/annotations_filtered/-v8l6cCrf0w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 57.48], [58.0, 59.44], [62.0, 63.0], [67.0, 68.66], [69.0, 69.6], [73.0, 84.38]], "keep_status": [false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 28.78], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 32.38], ["buzz", 16.52], ["vehicle", 16.14]]], "duration": [41.48, 1.44, 1.0, 1.66, 0.6, 11.38]} \ No newline at end of file diff --git a/annotations_filtered/-v93NKIFBBw_filtered.json b/annotations_filtered/-v93NKIFBBw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8525386bfb0f5e1bb94a1f0cf781ae41e42c3b0c --- /dev/null +++ b/annotations_filtered/-v93NKIFBBw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 38.7], [44.0, 50.87], [54.0, 64.34]], "keep_status": [true, false, false], "silence_prob": [39.54, 37.95, 36.52], "audiomae_on_audioset": [[["fly, housefly", 19.93], ["insect", 11.29], ["bee, wasp, etc.", 10.02]], [["music", 61.73], ["hum", 8.75], ["musical instrument", 4.55]], [["music", 68.29], ["didgeridoo", 14.69], ["musical instrument", 2.12]]], "duration": [3.7, 6.87, 10.34]} \ No newline at end of file diff --git a/annotations_filtered/-vCVptWV5UE_filtered.json b/annotations_filtered/-vCVptWV5UE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..121fc70e519a5c13b035d56a3d812e0de2fd75c3 --- /dev/null +++ b/annotations_filtered/-vCVptWV5UE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.02], [15.0, 15.45], [19.0, 19.47], [20.0, 21.73], [25.0, 26.92], [29.0, 29.44], [31.0, 31.94], [39.0, 39.66], [43.0, 46.8], [48.0, 48.91], [51.0, 52.62], [54.0, 67.02], [69.0, 69.5], [71.0, 71.63], [73.0, 75.46], [78.0, 80.33], [82.0, 82.76], [85.0, 85.16], [86.0, 86.1], [86.0, 86.24], [86.0, 88.75], [89.0, 89.01], [91.0, 91.76], [95.0, 96.57], [106.0, 106.96], [108.0, 109.49], [112.0, 113.04], [120.0, 119.92], [128.0, 128.43]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.55, 0.0, 0.0, 51.28, 0.0, 0.0, 70.72, 64.97, 0.0, 0.0, 0.0, 0.0, 38.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 37.99], ["theremin", 4.98], ["echo", 4.6]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 69.75], ["radio", 4.15], ["horse", 2.89]], null, null, null, null, null, null, null, null], "duration": [0.02, 0.45, 0.47, 1.73, 1.92, 0.44, 0.94, 0.66, 3.8, 0.91, 1.62, 13.02, 0.5, 0.63, 2.46, 2.33, 0.76, 0.16, 0.1, 0.24, 2.75, 0.01, 0.76, 1.57, 0.96, 1.49, 1.04, -0.08, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/-vT2ztIXioo_filtered.json b/annotations_filtered/-vT2ztIXioo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79feee1c5d56ee51a769e05b3db0001a0ebbe952 --- /dev/null +++ b/annotations_filtered/-vT2ztIXioo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.07], [9.0, 19.43], [20.0, 20.6], [21.0, 21.19], [22.0, 29.27], [30.0, 98.56]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 30.23, 0.0, 0.0, 31.21, 0.0], "audiomae_on_audioset": [null, [["music", 67.68], ["boing", 11.38], ["didgeridoo", 6.31]], null, null, [["fly, housefly", 37.75], ["insect", 32.1], ["mosquito", 14.81]], null], "duration": [0.07, 10.43, 0.6, 0.19, 7.27, 68.56]} \ No newline at end of file diff --git a/annotations_filtered/-v_2hFPseDg_filtered.json b/annotations_filtered/-v_2hFPseDg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc12dd00e3e9ba68e5cebf06dbaf66476d378148 --- /dev/null +++ b/annotations_filtered/-v_2hFPseDg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.55], [18.0, 18.98], [20.0, 34.1], [40.0, 44.09], [46.0, 56.08], [57.0, 57.89], [59.0, 59.12], [62.0, 69.43], [70.0, 80.96], [82.0, 86.86], [90.0, 93.16], [96.0, 96.53], [97.0, 124.23], [125.0, 130.84], [131.0, 130.94]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 31.88, 28.89, 34.08, 0.0, 0.0, 33.17, 30.2, 28.66, 29.17, 0.0, 28.79, 28.76, 0.0], "audiomae_on_audioset": [null, null, [["speech", 47.47], ["music", 16.04], ["mains hum", 6.52]], [["explosion", 17.51], ["breaking", 16.71], ["bang", 13.64]], [["hum", 37.04], ["mains hum", 35.23], ["speech", 12.31]], null, null, [["hum", 30.68], ["throbbing", 22.07], ["music", 18.0]], [["music", 42.12], ["speech", 15.43], ["throbbing", 7.51]], [["music", 44.72], ["speech", 30.04], ["hum", 3.05]], [["music", 57.6], ["throbbing", 7.58], ["hum", 4.92]], null, [["speech", 29.98], ["music", 19.26], ["explosion", 10.89]], [["music", 39.87], ["hum", 10.26], ["throbbing", 7.56]], null], "duration": [1.55, 0.98, 14.1, 4.09, 10.08, 0.89, 0.12, 7.43, 10.96, 4.86, 3.16, 0.53, 27.23, 5.84, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/-vvxRiJkXAs_filtered.json b/annotations_filtered/-vvxRiJkXAs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae7b6167bf6ca56ca107ccfdc8ed7d004ac8647f --- /dev/null +++ b/annotations_filtered/-vvxRiJkXAs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.21], [18.0, 18.1], [19.0, 22.08], [23.0, 23.62], [25.0, 28.59], [32.0, 32.64], [35.0, 39.14], [39.0, 40.34], [44.0, 46.62], [49.0, 54.45], [57.0, 56.89], [61.0, 60.94], [63.0, 67.1], [71.0, 71.42], [82.0, 87.37], [89.0, 92.92], [93.0, 108.67], [112.0, 123.62], [124.0, 128.21], [133.0, 134.08], [135.0, 135.21], [137.0, 139.4], [140.0, 141.15], [142.0, 144.34], [146.0, 146.08], [148.0, 148.69], [153.0, 155.53]], "keep_status": [true, false, true, false, false, false, false, false, true, true, false, false, false, false, true, true, true, true, false, false, false, false, false, false, false, false, true], "silence_prob": [42.58, 0.0, 39.94, 0.0, 34.55, 0.0, 40.82, 0.0, 29.62, 31.12, 0.0, 0.0, 33.31, 0.0, 29.18, 30.0, 29.65, 29.57, 28.74, 0.0, 0.0, 44.26, 0.0, 65.55, 0.0, 0.0, 29.48], "audiomae_on_audioset": [[["whale vocalization", 25.1], ["music", 19.63], ["hum", 10.81]], null, [["music", 39.36], ["didgeridoo", 16.38], ["whale vocalization", 7.12]], null, [["music", 56.6], ["theremin", 18.74], ["musical instrument", 5.37]], null, [["music", 53.88], ["synthesizer", 11.89], ["speech", 9.95]], null, [["music", 17.26], ["mosquito", 15.05], ["fly, housefly", 13.02]], [["didgeridoo", 22.68], ["music", 13.56], ["hum", 10.85]], null, null, [["hum", 39.93], ["mains hum", 23.43], ["music", 11.12]], null, [["music", 52.74], ["theremin", 5.49], ["musical instrument", 3.97]], [["didgeridoo", 35.39], ["music", 18.81], ["whip", 10.28]], [["music", 22.41], ["hum", 9.27], ["throbbing", 6.27]], [["music", 24.25], ["hum", 17.12], ["throbbing", 7.91]], [["speech", 51.52], ["music", 31.0], ["sound effect", 1.8]], null, null, [["music", 46.48], ["brass instrument", 19.27], ["trombone", 13.3]], null, null, null, null, [["music", 48.58], ["theremin", 13.6], ["foghorn", 5.09]]], "duration": [2.21, 0.1, 3.08, 0.62, 3.59, 0.64, 4.14, 1.34, 2.62, 5.45, -0.11, -0.06, 4.1, 0.42, 5.37, 3.92, 15.67, 11.62, 4.21, 1.08, 0.21, 2.4, 1.15, 2.34, 0.08, 0.69, 2.53]} \ No newline at end of file diff --git a/annotations_filtered/-w0WPkB3XJ4_filtered.json b/annotations_filtered/-w0WPkB3XJ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60ca3f2b795be695e45b1d16bc672cea99f1a81c --- /dev/null +++ b/annotations_filtered/-w0WPkB3XJ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 20.16], [23.0, 105.11]], "keep_status": [false, false], "silence_prob": [30.87, 0.0], "audiomae_on_audioset": [[["music", 74.81], ["singing", 3.23], ["reggae", 1.38]], null], "duration": [16.16, 82.11]} \ No newline at end of file diff --git a/annotations_filtered/-w9kof4SQp4_filtered.json b/annotations_filtered/-w9kof4SQp4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ccd8ae39eb1fce1f818816c470ac65644dfee0b --- /dev/null +++ b/annotations_filtered/-w9kof4SQp4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.56], [16.0, 25.05], [26.0, 26.84], [33.0, 33.18], [38.0, 37.94], [39.0, 39.68], [44.0, 43.73], [45.0, 47.66], [48.0, 49.6], [50.0, 51.95], [52.0, 54.75], [58.0, 68.42], [69.0, 69.36], [71.0, 71.69], [77.0, 78.38], [89.0, 94.68], [95.0, 95.27], [96.0, 98.73], [101.0, 101.34], [105.0, 105.24], [108.0, 113.68], [125.0, 125.64], [139.0, 139.75], [141.0, 140.97], [142.0, 142.35], [169.0, 169.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 34.95, 0.0, 0.0, 0.0, 0.0, 0.0, 45.95, 0.0, 0.0, 40.9, 32.99, 0.0, 0.0, 0.0, 55.25, 0.0, 88.46, 0.0, 0.0, 43.66, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 67.91], ["didgeridoo", 8.55], ["speech", 5.67]], null, null, null, null, null, [["music", 74.48], ["throbbing", 5.84], ["musical instrument", 3.54]], null, null, [["speech", 36.14], ["music", 19.58], ["mains hum", 4.3]], [["speech", 61.82], ["music", 20.1], ["electric shaver, electric razor", 1.74]], null, null, null, null, null, null, null, null, [["music", 18.74], ["boing", 17.05], ["speech", 10.96]], null, null, null, null, null], "duration": [0.56, 9.05, 0.84, 0.18, -0.06, 0.68, -0.27, 2.66, 1.6, 1.95, 2.75, 10.42, 0.36, 0.69, 1.38, 5.68, 0.27, 2.73, 0.34, 0.24, 5.68, 0.64, 0.75, -0.03, 0.35, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/-wI4jJq98tU_filtered.json b/annotations_filtered/-wI4jJq98tU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d706236c266d478c6e0dfbafaa65f05e56fb6e58 --- /dev/null +++ b/annotations_filtered/-wI4jJq98tU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.2], [19.0, 19.77], [21.0, 25.93], [28.0, 31.77], [33.0, 34.11], [35.0, 36.22], [37.0, 37.72], [39.0, 41.81], [42.0, 43.36], [44.0, 44.91], [46.0, 57.77], [78.0, 78.56], [81.0, 81.23], [84.0, 83.89], [89.0, 89.02], [121.0, 124.24]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 46.33, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 30.53, 0.0, 0.0, 0.0, 0.0, 29.57], "audiomae_on_audioset": [null, null, [["hum", 8.63], ["synthesizer", 8.58], ["mains hum", 8.1]], null, null, null, null, null, null, null, [["music", 40.39], ["theremin", 14.54], ["brass instrument", 4.68]], null, null, null, null, [["fly, housefly", 28.25], ["insect", 20.68], ["mosquito", 9.39]]], "duration": [1.2, 0.77, 4.93, 3.77, 1.11, 1.22, 0.72, 2.81, 1.36, 0.91, 11.77, 0.56, 0.23, -0.11, 0.02, 3.24]} \ No newline at end of file diff --git a/annotations_filtered/-wSYsQS2-NU_filtered.json b/annotations_filtered/-wSYsQS2-NU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..374f4a17349c21269564ca691744c85b7b5717bc --- /dev/null +++ b/annotations_filtered/-wSYsQS2-NU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.43], [9.0, 10.5], [14.0, 14.81], [17.0, 18.15], [19.0, 20.07], [20.0, 21.14], [23.0, 22.98], [24.0, 24.71], [27.0, 31.62], [32.0, 33.47]], "keep_status": [false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.74, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["animal", 45.14], ["dog", 11.39], ["domestic animals, pets", 8.8]], null], "duration": [0.43, 1.5, 0.81, 1.15, 1.07, 1.14, -0.02, 0.71, 4.62, 1.47]} \ No newline at end of file diff --git a/annotations_filtered/-wSqiksvdD8_filtered.json b/annotations_filtered/-wSqiksvdD8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab87efbc3301c5031078aca5c1d6df5cdff1a68f --- /dev/null +++ b/annotations_filtered/-wSqiksvdD8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.48], [2.0, 3.89], [7.0, 11.33], [12.0, 17.47], [18.0, 18.57], [19.0, 19.45], [20.0, 20.44], [23.0, 27.24], [28.0, 28.46], [29.0, 29.57], [31.0, 32.66], [35.0, 35.8], [37.0, 38.48], [39.0, 42.08], [46.0, 47.56], [49.0, 63.0], [66.0, 66.48], [68.0, 69.69], [72.0, 89.31], [90.0, 93.33], [95.0, 108.89], [110.0, 110.86], [111.0, 117.9], [118.0, 119.79], [120.0, 126.87], [128.0, 127.75], [128.0, 128.07], [129.0, 130.79], [133.0, 135.65]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.25, 35.39, 0.0, 0.0, 0.0, 29.37, 0.0, 0.0, 0.0, 0.0, 0.0, 45.85, 0.0, 38.45, 0.0, 0.0, 50.86, 65.32, 55.53, 0.0, 49.73, 0.0, 38.93, 0.0, 0.0, 0.0, 70.16], "audiomae_on_audioset": [null, null, [["music", 42.26], ["hum", 20.21], ["mains hum", 8.28]], [["music", 26.21], ["animal", 15.35], ["didgeridoo", 11.52]], null, null, null, [["groan", 10.56], ["livestock, farm animals, working animals", 5.88], ["grunt", 5.42]], null, null, null, null, null, [["whale vocalization", 36.66], ["music", 10.48], ["speech", 7.62]], null, [["speech", 35.81], ["throbbing", 20.34], ["hum", 19.48]], null, null, null, null, null, null, [["hum", 38.96], ["mains hum", 26.78], ["speech", 21.8]], null, [["hum", 42.38], ["mains hum", 35.5], ["speech", 7.21]], null, null, null, null], "duration": [0.48, 1.89, 4.33, 5.47, 0.57, 0.45, 0.44, 4.24, 0.46, 0.57, 1.66, 0.8, 1.48, 3.08, 1.56, 14.0, 0.48, 1.69, 17.31, 3.33, 13.89, 0.86, 6.9, 1.79, 6.87, -0.25, 0.07, 1.79, 2.65]} \ No newline at end of file diff --git a/annotations_filtered/-wX6_qCCnPc_filtered.json b/annotations_filtered/-wX6_qCCnPc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1296401ccfe2d30a8fd425360e0e80773fa869e0 --- /dev/null +++ b/annotations_filtered/-wX6_qCCnPc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 10.93], [17.0, 18.37], [19.0, 20.66], [32.0, 34.03], [36.0, 37.2], [38.0, 38.65], [41.0, 45.72], [47.0, 47.83], [48.0, 49.6], [52.0, 60.84], [63.0, 65.01], [71.0, 83.91], [84.0, 87.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [95.09, 0.0, 0.0, 99.97, 0.0, 0.0, 74.13, 0.0, 0.0, 39.83, 57.25, 36.61, 35.16], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 35.07], ["theremin", 33.65], ["wind instrument, woodwind instrument", 4.87]], null, [["music", 80.81], ["theremin", 1.77], ["throbbing", 1.6]], [["music", 14.77], ["didgeridoo", 13.86], ["speech", 9.58]]], "duration": [9.93, 1.37, 1.66, 2.03, 1.2, 0.65, 4.72, 0.83, 1.6, 8.84, 2.01, 12.91, 3.2]} \ No newline at end of file diff --git a/annotations_filtered/-wc5S8xwxJk_filtered.json b/annotations_filtered/-wc5S8xwxJk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c34f6b11ebbe1460d8da7f77369817780a70fc2e --- /dev/null +++ b/annotations_filtered/-wc5S8xwxJk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.27], [21.0, 20.82], [22.0, 22.01], [33.0, 33.35], [39.0, 38.64], [42.0, 44.93], [47.0, 47.76]], "keep_status": [false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 34.28, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 56.1], ["musical instrument", 7.26], ["guitar", 6.62]], null], "duration": [0.27, -0.18, 0.01, 0.35, -0.36, 2.93, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/-wci2oycOQA_filtered.json b/annotations_filtered/-wci2oycOQA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..feb7b59c8ba05a7044a67d7a2c7a6024491b8cbe --- /dev/null +++ b/annotations_filtered/-wci2oycOQA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.43], [2.0, 6.71], [9.0, 10.03], [12.0, 47.09], [49.0, 50.11], [51.0, 51.38], [62.0, 77.09]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [0.0, 60.7, 0.0, 0.0, 0.0, 0.0, 30.13], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 45.51], ["car", 8.27], ["skidding", 7.09]]], "duration": [0.43, 4.71, 1.03, 35.09, 1.11, 0.38, 15.09]} \ No newline at end of file diff --git a/annotations_filtered/-whQdRI7wUQ_filtered.json b/annotations_filtered/-whQdRI7wUQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5fe13776c82a00f0601e9a605b27c6e30e49a40 --- /dev/null +++ b/annotations_filtered/-whQdRI7wUQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 12.68], [14.0, 15.35], [19.0, 20.56], [21.0, 23.28], [24.0, 30.15], [31.0, 36.58], [38.0, 64.5], [65.0, 65.64], [67.0, 68.2], [71.0, 75.83], [84.0, 91.89], [92.0, 93.5], [97.0, 98.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [69.74, 0.0, 0.0, 92.48, 59.24, 72.9, 71.14, 0.0, 0.0, 53.47, 32.8, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 35.36], ["speech", 14.98], ["boing", 6.81]], null, null], "duration": [8.68, 1.35, 1.56, 2.28, 6.15, 5.58, 26.5, 0.64, 1.2, 4.83, 7.89, 1.5, 1.56]} \ No newline at end of file diff --git a/annotations_filtered/-wqnmuzG51c_filtered.json b/annotations_filtered/-wqnmuzG51c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fdceca134ca72aab0e3127d626df527efffaa1f --- /dev/null +++ b/annotations_filtered/-wqnmuzG51c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.13], [8.0, 9.12], [10.0, 10.45], [11.0, 17.44], [19.0, 35.55], [40.0, 40.88], [47.0, 48.54], [49.0, 71.12], [72.0, 74.97], [76.0, 78.19], [84.0, 86.37], [88.0, 96.28], [101.0, 102.49], [104.0, 104.94], [108.0, 108.46], [109.0, 111.59], [123.0, 130.03], [132.0, 135.7]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 46.19, 39.89, 0.0, 0.0, 66.27, 100.0, 100.0, 97.64, 98.66, 0.0, 0.0, 0.0, 80.82, 52.56, 48.06], "audiomae_on_audioset": [null, null, null, [["music", 48.35], ["speech", 21.86], ["didgeridoo", 4.49]], [["hum", 19.43], ["speech", 18.76], ["music", 12.89]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 26.83], ["music", 16.56], ["mosquito", 6.34]]], "duration": [1.13, 1.12, 0.45, 6.44, 16.55, 0.88, 1.54, 22.12, 2.97, 2.19, 2.37, 8.28, 1.49, 0.94, 0.46, 2.59, 7.03, 3.7]} \ No newline at end of file diff --git a/annotations_filtered/-x6njs-cGUE_filtered.json b/annotations_filtered/-x6njs-cGUE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28a4e818583539282d73383c81a3ac103c38aa7b --- /dev/null +++ b/annotations_filtered/-x6njs-cGUE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.89], [8.0, 10.03], [11.0, 13.51], [15.0, 14.94], [16.0, 19.77], [22.0, 23.82], [27.0, 34.86], [36.0, 36.58], [42.0, 44.29], [45.0, 48.49], [51.0, 52.54], [53.0, 53.91], [55.0, 55.8], [57.0, 57.59], [58.0, 62.06], [63.0, 63.8], [65.0, 66.29], [69.0, 69.63], [73.0, 77.23], [80.0, 80.16], [81.0, 83.51], [85.0, 86.0], [86.0, 89.85], [92.0, 99.37], [100.0, 102.54], [105.0, 105.93], [109.0, 109.86], [112.0, 114.3], [118.0, 124.68], [127.0, 128.49], [130.0, 130.71], [131.0, 133.57], [134.0, 136.8], [138.0, 138.99], [142.0, 143.06], [144.0, 145.42], [146.0, 146.38], [147.0, 152.73], [154.0, 154.8], [159.0, 159.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 77.53, 0.0, 100.0, 0.0, 100.0, 0.0, 100.0, 41.16, 0.0, 0.0, 0.0, 0.0, 75.55, 0.0, 0.0, 0.0, 42.0, 0.0, 35.2, 0.0, 44.66, 81.53, 54.76, 0.0, 0.0, 98.66, 99.93, 0.0, 0.0, 84.25, 46.5, 0.0, 0.0, 0.0, 0.0, 71.29, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 64.11], ["telephone", 7.29], ["dial tone", 5.83]], null, null, null, null, null, null, null, null, [["sidetone", 48.66], ["speech", 24.83], ["telephone", 5.4]], null, [["speech", 52.16], ["sidetone", 33.5], ["white noise", 2.82]], null, [["effects unit", 18.83], ["chirp tone", 11.29], ["distortion", 10.28]], null, null, null, null, null, null, null, null, null, [["sidetone", 64.13], ["speech", 3.68], ["whale vocalization", 3.27]], null, null, null, null, null, null, null], "duration": [1.89, 2.03, 2.51, -0.06, 3.77, 1.82, 7.86, 0.58, 2.29, 3.49, 1.54, 0.91, 0.8, 0.59, 4.06, 0.8, 1.29, 0.63, 4.23, 0.16, 2.51, 1.0, 3.85, 7.37, 2.54, 0.93, 0.86, 2.3, 6.68, 1.49, 0.71, 2.57, 2.8, 0.99, 1.06, 1.42, 0.38, 5.73, 0.8, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/-xCS0zZPAoA_filtered.json b/annotations_filtered/-xCS0zZPAoA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..791e1944d0ccbe3b7e8d0526512d74d0ad05c591 --- /dev/null +++ b/annotations_filtered/-xCS0zZPAoA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 34.91], [39.0, 48.51], [54.0, 62.31], [64.0, 67.59], [96.0, 100.06]], "keep_status": [false, true, false, false, false], "silence_prob": [0.0, 42.04, 78.21, 82.79, 98.93], "audiomae_on_audioset": [null, [["whale vocalization", 16.08], ["insect", 11.89], ["mosquito", 9.86]], null, null, null], "duration": [-0.09, 9.51, 8.31, 3.59, 4.06]} \ No newline at end of file diff --git a/annotations_filtered/-xQ5nH_-yyQ_filtered.json b/annotations_filtered/-xQ5nH_-yyQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20ef0a4d96f37d4839ebf399440636d2041d95b6 --- /dev/null +++ b/annotations_filtered/-xQ5nH_-yyQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.9], [5.0, 6.62], [7.0, 8.31], [9.0, 11.85], [12.0, 13.91], [14.0, 17.32], [18.0, 18.67], [19.0, 20.58], [22.0, 23.55], [27.0, 28.51], [30.0, 34.28], [41.0, 43.11], [47.0, 48.47], [63.0, 65.85], [66.0, 68.42], [69.0, 71.98], [74.0, 77.45], [78.0, 79.27], [82.0, 87.91], [89.0, 91.42], [95.0, 97.71], [99.0, 102.12], [103.0, 105.07], [106.0, 108.14], [110.0, 110.54], [111.0, 111.87], [116.0, 121.17], [124.0, 125.22], [129.0, 128.65], [130.0, 130.22], [131.0, 131.45], [132.0, 133.93], [135.0, 136.0], [137.0, 139.4], [141.0, 144.49], [146.0, 147.48], [151.0, 152.79], [157.0, 160.39], [161.0, 162.43], [164.0, 175.34], [177.0, 178.46]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, false, false, false, true, true, false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [93.29, 0.0, 0.0, 60.05, 0.0, 35.38, 0.0, 0.0, 0.0, 0.0, 41.7, 69.2, 0.0, 99.88, 36.72, 32.94, 34.21, 0.0, 85.35, 47.01, 84.98, 41.6, 98.51, 99.98, 0.0, 0.0, 36.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.0, 97.33, 0.0, 0.0, 39.72, 0.0, 37.22, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["sidetone", 20.22], ["speech", 19.0], ["electric shaver, electric razor", 8.45]], null, null, null, null, [["hum", 13.72], ["burping, eructation", 8.23], ["busy signal", 7.8]], null, null, null, [["speech", 36.43], ["groan", 19.37], ["echo", 5.69]], [["speech", 45.65], ["thunk", 16.2], ["inside, small room", 4.63]], [["speech", 62.94], ["speech synthesizer", 11.65], ["dishes, pots, and pans", 3.43]], null, null, [["speech", 32.45], ["sidetone", 24.37], ["chirp tone", 11.68]], null, [["sidetone", 22.85], ["speech", 22.57], ["chirp tone", 21.57]], null, null, null, null, [["sidetone", 47.7], ["whack, thwack", 5.31], ["hum", 4.55]], null, null, null, null, null, null, null, null, null, null, [["music", 39.87], ["hum", 13.95], ["mains hum", 8.69]], null, [["music", 52.79], ["speech", 12.54], ["ambient music", 4.61]], null], "duration": [3.9, 1.62, 1.31, 2.85, 1.91, 3.32, 0.67, 1.58, 1.55, 1.51, 4.28, 2.11, 1.47, 2.85, 2.42, 2.98, 3.45, 1.27, 5.91, 2.42, 2.71, 3.12, 2.07, 2.14, 0.54, 0.87, 5.17, 1.22, -0.35, 0.22, 0.45, 1.93, 1.0, 2.4, 3.49, 1.48, 1.79, 3.39, 1.43, 11.34, 1.46]} \ No newline at end of file diff --git a/annotations_filtered/-xSV3MoacUw_filtered.json b/annotations_filtered/-xSV3MoacUw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7c597488a9633470026d4ebc013be84b3c9a15d --- /dev/null +++ b/annotations_filtered/-xSV3MoacUw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 31.58], [33.0, 34.03], [37.0, 39.77], [41.0, 41.27], [41.0, 42.65], [43.0, 45.44], [46.0, 48.47], [49.0, 50.25], [56.0, 57.32], [58.0, 60.25], [64.0, 64.62], [67.0, 69.01], [71.0, 71.42], [72.0, 75.3]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [32.49, 0.0, 71.0, 0.0, 0.0, 56.63, 40.41, 0.0, 0.0, 43.98, 0.0, 51.66, 0.0, 34.83], "audiomae_on_audioset": [[["music", 61.55], ["synthesizer", 6.26], ["theremin", 4.34]], null, null, null, null, null, [["speech", 18.36], ["music", 16.27], ["fly, housefly", 13.92]], null, null, [["music", 50.13], ["foghorn", 22.43], ["musical instrument", 8.38]], null, null, null, [["music", 24.19], ["mains hum", 14.74], ["hum", 12.09]]], "duration": [22.58, 1.03, 2.77, 0.27, 1.65, 2.44, 2.47, 1.25, 1.32, 2.25, 0.62, 2.01, 0.42, 3.3]} \ No newline at end of file diff --git a/annotations_filtered/-xTty5scUwM_filtered.json b/annotations_filtered/-xTty5scUwM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49b94e30da37573d32805a64af4fa2094a1612e8 --- /dev/null +++ b/annotations_filtered/-xTty5scUwM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.88], [4.0, 4.92], [6.0, 5.97], [21.0, 21.66], [25.0, 29.07], [34.0, 34.8], [39.0, 41.45], [42.0, 43.78], [46.0, 46.01], [46.0, 46.8], [52.0, 53.42], [56.0, 56.3], [59.0, 60.56], [77.0, 77.7], [89.0, 89.58], [104.0, 104.35], [106.0, 109.97], [110.0, 113.14], [114.0, 114.61], [115.0, 115.84], [127.0, 126.86], [127.0, 127.85], [129.0, 129.83], [130.0, 130.28], [131.0, 132.51]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.38, 0.0, 36.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.67, 37.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 24.18], ["music", 20.87], ["hum", 11.47]], null, [["didgeridoo", 31.38], ["speech", 19.26], ["music", 9.99]], null, null, null, null, null, null, null, null, null, [["music", 31.72], ["speech", 15.48], ["hum", 7.76]], [["music", 28.19], ["hum", 21.5], ["mains hum", 16.8]], null, null, null, null, null, null, null], "duration": [0.88, 0.92, -0.03, 0.66, 4.07, 0.8, 2.45, 1.78, 0.01, 0.8, 1.42, 0.3, 1.56, 0.7, 0.58, 0.35, 3.97, 3.14, 0.61, 0.84, -0.14, 0.85, 0.83, 0.28, 1.51]} \ No newline at end of file diff --git a/annotations_filtered/-xZKHX91z9I_filtered.json b/annotations_filtered/-xZKHX91z9I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1b71c36484cbad99e407a43142380e65cc66eef --- /dev/null +++ b/annotations_filtered/-xZKHX91z9I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.44], [16.0, 68.22], [69.0, 70.01], [75.0, 76.17], [82.0, 82.46], [88.0, 90.36], [91.0, 101.04], [102.0, 126.6], [131.0, 136.63]], "keep_status": [false, false, false, false, false, false, true, false, false], "silence_prob": [99.99, 0.0, 0.0, 0.0, 0.0, 100.0, 34.17, 88.64, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["explosion", 15.49], ["gunshot, gunfire", 9.11], ["burst, pop", 8.01]], null, null], "duration": [4.44, 52.22, 1.01, 1.17, 0.46, 2.36, 10.04, 24.6, 5.63]} \ No newline at end of file diff --git a/annotations_filtered/-y6RPL5v1bU_filtered.json b/annotations_filtered/-y6RPL5v1bU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..002e6ad3616734ed0499ae1fcef73d8e7a859abd --- /dev/null +++ b/annotations_filtered/-y6RPL5v1bU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 22.64], [24.0, 24.63], [25.0, 26.4], [29.0, 29.91], [34.0, 34.06], [37.0, 38.48], [39.0, 40.04], [42.0, 44.46], [46.0, 47.22], [56.0, 56.46], [58.0, 58.72], [60.0, 60.15], [65.0, 66.12], [67.0, 67.1], [75.0, 75.93], [76.0, 76.62], [80.0, 79.73], [84.0, 84.4], [85.0, 85.7], [86.0, 86.34], [87.0, 87.69], [88.0, 88.5], [89.0, 91.25], [92.0, 92.01], [94.0, 95.07], [95.0, 98.15], [100.0, 100.03], [106.0, 114.2], [117.0, 117.29], [121.0, 121.61], [122.0, 122.84], [128.0, 128.01], [131.0, 131.6], [133.0, 135.57], [144.0, 144.27], [147.0, 146.64], [151.0, 150.82], [162.0, 161.74], [163.0, 166.83], [174.0, 174.9], [187.0, 186.73], [190.0, 190.04], [195.0, 195.27]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [41.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.62, 0.0, 0.0, 64.29, 0.0, 41.93, 0.0, 0.0, 0.0, 0.0, 0.0, 78.72, 0.0, 0.0, 0.0, 0.0, 87.92, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 35.37], ["chop", 27.16], ["fly, housefly", 6.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 40.62], ["speech", 22.82], ["throbbing", 6.48]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.64, 0.63, 1.4, 0.91, 0.06, 1.48, 1.04, 2.46, 1.22, 0.46, 0.72, 0.15, 1.12, 0.1, 0.93, 0.62, -0.27, 0.4, 0.7, 0.34, 0.69, 0.5, 2.25, 0.01, 1.07, 3.15, 0.03, 8.2, 0.29, 0.61, 0.84, 0.01, 0.6, 2.57, 0.27, -0.36, -0.18, -0.26, 3.83, 0.9, -0.27, 0.04, 0.27]} \ No newline at end of file diff --git a/annotations_filtered/-yEE_toKFxc_filtered.json b/annotations_filtered/-yEE_toKFxc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..346ed4b69ed4b1542cc397250a257b14bcb359d1 --- /dev/null +++ b/annotations_filtered/-yEE_toKFxc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 15.6], [24.0, 36.78], [39.0, 39.95], [43.0, 43.8], [46.0, 56.94], [59.0, 59.71], [63.0, 63.1], [67.0, 68.47], [70.0, 69.92], [72.0, 73.04], [74.0, 75.41], [78.0, 78.44], [80.0, 79.78], [82.0, 83.0], [86.0, 86.71], [97.0, 96.84], [100.0, 101.61], [102.0, 103.45], [105.0, 106.39], [108.0, 109.22], [110.0, 110.83], [112.0, 112.67], [115.0, 115.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.0, 78.89, 0.0, 0.0, 41.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["echo", 51.16], ["music", 21.71], ["effects unit", 4.01]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.6, 12.78, 0.95, 0.8, 10.94, 0.71, 0.1, 1.47, -0.08, 1.04, 1.41, 0.44, -0.22, 1.0, 0.71, -0.16, 1.61, 1.45, 1.39, 1.22, 0.83, 0.67, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/-yG7Wp5-8EI_filtered.json b/annotations_filtered/-yG7Wp5-8EI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c7abd168377d7ccc5082b59394caa7b2f540b9c --- /dev/null +++ b/annotations_filtered/-yG7Wp5-8EI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 127.53]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [101.53]} \ No newline at end of file diff --git a/annotations_filtered/-yPwW5V4mhI_filtered.json b/annotations_filtered/-yPwW5V4mhI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..931cb341f92ed95ad6c74a2fe6dfb6ab7b28da67 --- /dev/null +++ b/annotations_filtered/-yPwW5V4mhI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.15], [5.0, 7.3], [10.0, 10.34], [15.0, 17.39], [21.0, 22.98], [27.0, 27.41], [40.0, 41.64], [44.0, 49.15], [52.0, 51.93], [53.0, 53.35], [54.0, 54.78], [56.0, 57.67], [60.0, 62.34], [63.0, 63.85], [66.0, 66.68], [67.0, 66.73], [67.0, 67.64], [68.0, 69.77], [77.0, 77.45], [81.0, 82.39], [91.0, 91.99], [96.0, 102.27], [103.0, 103.92], [106.0, 106.66], [109.0, 109.04], [111.0, 113.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.71, 0.0, 100.0, 0.0, 0.0, 0.0, 96.77, 0.0, 0.0, 0.0, 0.0, 92.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.15, 2.3, 0.34, 2.39, 1.98, 0.41, 1.64, 5.15, -0.07, 0.35, 0.78, 1.67, 2.34, 0.85, 0.68, -0.27, 0.64, 1.77, 0.45, 1.39, 0.99, 6.27, 0.92, 0.66, 0.04, 2.32]} \ No newline at end of file diff --git a/annotations_filtered/-yZVme3ToO8_filtered.json b/annotations_filtered/-yZVme3ToO8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b06453cfca74fbc206a65650c75d20b6036d9051 --- /dev/null +++ b/annotations_filtered/-yZVme3ToO8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.26], [22.0, 37.05], [40.0, 63.56]], "keep_status": [false, false, false], "silence_prob": [0.0, 31.12, 31.26], "audiomae_on_audioset": [null, [["music", 47.24], ["speech", 22.91], ["clapping", 11.58]], [["music", 88.31], ["didgeridoo", 1.3], ["musical instrument", 1.13]]], "duration": [0.26, 15.05, 23.56]} \ No newline at end of file diff --git a/annotations_filtered/-yvnWPZy1FQ_filtered.json b/annotations_filtered/-yvnWPZy1FQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d9ca97f4fba32c145da27731325aab4b41a42ab --- /dev/null +++ b/annotations_filtered/-yvnWPZy1FQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.53], [6.0, 7.13], [8.0, 12.51], [15.0, 42.92], [46.0, 46.38], [51.0, 51.36], [52.0, 52.35], [54.0, 54.11], [55.0, 55.49], [56.0, 56.62], [58.0, 69.58], [70.0, 71.15], [73.0, 74.75], [75.0, 78.76], [80.0, 81.94], [83.0, 84.69], [86.0, 88.62], [90.0, 90.15], [92.0, 92.43], [94.0, 94.32], [97.0, 96.85], [98.0, 99.98]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.44, 0.0, 91.3, 40.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.89, 0.0, 0.0, 57.64, 0.0, 0.0, 95.91, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 34.84], ["music", 17.62], ["hum", 15.62]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.53, 1.13, 4.51, 27.92, 0.38, 0.36, 0.35, 0.11, 0.49, 0.62, 11.58, 1.15, 1.75, 3.76, 1.94, 1.69, 2.62, 0.15, 0.43, 0.32, -0.15, 1.98]} \ No newline at end of file diff --git a/annotations_filtered/-yyoLJuNIJU_filtered.json b/annotations_filtered/-yyoLJuNIJU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e16ab9050e3876cce66915ce37f69391e4cc0b6 --- /dev/null +++ b/annotations_filtered/-yyoLJuNIJU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.59], [13.0, 13.66], [14.0, 13.9], [14.0, 13.98], [15.0, 15.75], [18.0, 21.95], [26.0, 34.94], [37.0, 41.96], [43.0, 43.77], [47.0, 72.64], [75.0, 93.55], [94.0, 94.47], [97.0, 98.44], [103.0, 111.3], [117.0, 117.61], [118.0, 119.16], [122.0, 133.14], [135.0, 139.62], [140.0, 148.63], [155.0, 157.74], [158.0, 161.2], [163.0, 175.74]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, false, false, true, false, false, true, true, false, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 28.46, 28.59, 29.09, 0.0, 28.53, 28.45, 0.0, 0.0, 28.56, 0.0, 0.0, 28.75, 28.77, 28.55, 28.32, 29.25, 28.5], "audiomae_on_audioset": [null, null, null, null, null, [["music", 35.7], ["foghorn", 9.43], ["speech", 4.88]], [["music", 44.44], ["speech", 28.07], ["whack, thwack", 4.65]], [["music", 69.71], ["breaking", 7.55], ["throbbing", 5.28]], null, [["speech", 60.76], ["vehicle", 10.58], ["music", 6.53]], [["speech", 24.11], ["vehicle", 22.62], ["car", 13.55]], null, null, [["vehicle", 30.25], ["skidding", 21.62], ["car", 17.3]], null, null, [["speech", 25.76], ["music", 23.33], ["vehicle", 16.46]], [["music", 38.34], ["hum", 12.42], ["throbbing", 10.87]], [["vehicle", 46.86], ["car", 22.01], ["speech", 9.6]], [["skidding", 26.75], ["music", 22.25], ["vehicle", 14.44]], [["music", 25.53], ["vehicle", 9.71], ["speech", 7.92]], [["music", 18.89], ["livestock, farm animals, working animals", 18.41], ["cattle, bovinae", 9.71]]], "duration": [0.59, 0.66, -0.1, -0.02, 0.75, 3.95, 8.94, 4.96, 0.77, 25.64, 18.55, 0.47, 1.44, 8.3, 0.61, 1.16, 11.14, 4.62, 8.63, 2.74, 3.2, 12.74]} \ No newline at end of file diff --git a/annotations_filtered/-zAp8NOpVKU_filtered.json b/annotations_filtered/-zAp8NOpVKU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..546db2bc4382de8b87d57f8f054961c2e0f47c88 --- /dev/null +++ b/annotations_filtered/-zAp8NOpVKU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.49], [10.0, 14.08], [28.0, 30.13], [33.0, 37.07], [43.0, 43.58], [51.0, 56.52], [63.0, 63.37], [71.0, 73.35], [75.0, 75.15], [89.0, 90.15], [108.0, 108.78], [110.0, 114.25]], "keep_status": [false, true, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 48.56, 31.55, 31.34, 0.0, 31.73, 0.0, 33.06, 0.0, 0.0, 0.0, 36.24], "audiomae_on_audioset": [null, [["music", 32.57], ["brass instrument", 24.76], ["clarinet", 7.89]], [["animal", 14.48], ["wild animals", 10.49], ["roaring cats (lions, tigers)", 9.09]], [["music", 72.2], ["electronic music", 5.77], ["techno", 1.58]], null, [["music", 50.07], ["throbbing", 16.52], ["hum", 11.18]], null, [["thunk", 27.45], ["speech", 25.7], ["music", 6.56]], null, null, null, [["music", 56.47], ["speech", 15.2], ["guitar", 5.24]]], "duration": [0.49, 4.08, 2.13, 4.07, 0.58, 5.52, 0.37, 2.35, 0.15, 1.15, 0.78, 4.25]} \ No newline at end of file diff --git a/annotations_filtered/-zIzLRgwdxA_filtered.json b/annotations_filtered/-zIzLRgwdxA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..03d8e5376e701b0821f46787e11d87f3208ecc39 --- /dev/null +++ b/annotations_filtered/-zIzLRgwdxA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 21.46], [23.0, 23.57], [24.0, 24.92], [27.0, 27.95], [29.0, 30.67], [34.0, 34.26], [39.0, 40.69], [42.0, 42.33], [45.0, 49.5], [52.0, 52.95], [54.0, 55.36], [56.0, 80.67], [82.0, 83.57]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [35.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.63, 0.0, 0.0, 34.61, 0.0], "audiomae_on_audioset": [[["music", 31.62], ["throbbing", 23.37], ["hum", 13.13]], null, null, null, null, null, null, null, [["speech", 30.85], ["sidetone", 15.1], ["music", 10.98]], null, null, [["speech", 32.37], ["music", 30.0], ["synthesizer", 6.25]], null], "duration": [18.46, 0.57, 0.92, 0.95, 1.67, 0.26, 1.69, 0.33, 4.5, 0.95, 1.36, 24.67, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/-zNnJiwo_5Y_filtered.json b/annotations_filtered/-zNnJiwo_5Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09d5d03bf4b451dc069f61f96301cb86c533590e --- /dev/null +++ b/annotations_filtered/-zNnJiwo_5Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 36.22], [38.0, 39.12], [44.0, 66.19], [68.0, 69.82], [72.0, 72.82], [79.0, 106.56], [109.0, 109.88], [112.0, 113.85]], "keep_status": [true, false, false, false, false, false, false, false], "silence_prob": [30.11, 0.0, 30.18, 0.0, 0.0, 30.43, 0.0, 0.0], "audiomae_on_audioset": [[["music", 36.13], ["didgeridoo", 9.52], ["wind instrument, woodwind instrument", 7.95]], null, [["music", 82.77], ["speech", 4.08], ["sampler", 1.59]], null, null, [["music", 74.49], ["psychedelic rock", 3.4], ["musical instrument", 2.66]], null, null], "duration": [2.22, 1.12, 22.19, 1.82, 0.82, 27.56, 0.88, 1.85]} \ No newline at end of file diff --git a/annotations_filtered/-zXmGloh-P8_filtered.json b/annotations_filtered/-zXmGloh-P8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c0ccd51dab1b409ba6ee928a7cf2024e69c6e7f7 --- /dev/null +++ b/annotations_filtered/-zXmGloh-P8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[66.0, 67.26], [69.0, 69.97], [72.0, 72.49], [75.0, 75.15], [78.0, 84.43], [84.0, 84.48], [86.0, 85.97], [88.0, 88.59], [95.0, 97.97], [99.0, 100.04], [102.0, 128.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.36, 0.0, 0.0, 0.0, 98.66, 0.0, 88.83], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.26, 0.97, 0.49, 0.15, 6.43, 0.48, -0.03, 0.59, 2.97, 1.04, 26.22]} \ No newline at end of file diff --git a/annotations_filtered/-zoOpeF5Yzc_filtered.json b/annotations_filtered/-zoOpeF5Yzc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a155382cd7c4c83aa553fc736f989c094c763bb1 --- /dev/null +++ b/annotations_filtered/-zoOpeF5Yzc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 33.15], [36.0, 36.31], [39.0, 42.15], [47.0, 48.84], [51.0, 54.9], [57.0, 57.23], [58.0, 59.58], [73.0, 75.41], [77.0, 77.55], [79.0, 79.51], [81.0, 81.14], [81.0, 82.09], [83.0, 84.08], [95.0, 99.03], [100.0, 105.11], [107.0, 109.11], [111.0, 111.52]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [47.39, 0.0, 52.92, 0.0, 50.86, 0.0, 0.0, 99.56, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 99.68, 100.0, 0.0], "audiomae_on_audioset": [[["music", 38.22], ["theremin", 12.79], ["quack", 5.71]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [17.15, 0.31, 3.15, 1.84, 3.9, 0.23, 1.58, 2.41, 0.55, 0.51, 0.14, 1.09, 1.08, 4.03, 5.11, 2.11, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/-zxyN9-P9_c_filtered.json b/annotations_filtered/-zxyN9-P9_c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4eaa59fb0678da3a293effb047c0d78be28f7910 --- /dev/null +++ b/annotations_filtered/-zxyN9-P9_c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.0], [4.0, 4.01], [6.0, 6.3], [13.0, 14.07], [17.0, 25.76], [27.0, 31.87], [35.0, 37.88], [42.0, 42.23], [42.0, 45.18], [45.0, 46.87], [48.0, 52.44], [52.0, 52.71], [53.0, 52.95], [55.0, 57.35], [59.0, 59.64], [60.0, 62.01], [64.0, 64.62], [67.0, 67.42]], "keep_status": [false, false, false, false, false, true, true, false, true, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 57.81, 36.19, 31.78, 0.0, 31.87, 0.0, 33.44, 0.0, 0.0, 52.05, 0.0, 31.58, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["mains hum", 18.62], ["hum", 17.28], ["music", 11.81]], [["music", 12.7], ["hum", 12.45], ["speech", 6.38]], null, [["speech", 52.9], ["animal", 6.25], ["mains hum", 3.64]], null, [["speech", 67.99], ["sidetone", 10.47], ["hum", 7.35]], null, null, null, null, [["speech", 29.31], ["sidetone", 19.96], ["livestock, farm animals, working animals", 7.11]], null, null], "duration": [0.0, 0.01, 0.3, 1.07, 8.76, 4.87, 2.88, 0.23, 3.18, 1.87, 4.44, 0.71, -0.05, 2.35, 0.64, 2.01, 0.62, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/-zya4vJ-kQE_filtered.json b/annotations_filtered/-zya4vJ-kQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83b91865dbd0b91b112be0aca42e20f6c1c41ff9 --- /dev/null +++ b/annotations_filtered/-zya4vJ-kQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.29], [4.0, 4.48], [5.0, 5.07], [36.0, 38.06], [39.0, 39.12], [49.0, 51.78], [62.0, 63.26], [67.0, 68.03], [68.0, 72.28], [74.0, 75.05], [85.0, 85.5], [101.0, 102.98], [116.0, 117.14], [121.0, 122.22], [124.0, 125.46], [129.0, 130.17], [131.0, 132.46], [132.0, 132.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.54, 0.0, 0.0, 93.13, 0.0, 99.44, 0.0, 0.0, 97.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.29, 0.48, 0.07, 2.06, 0.12, 2.78, 1.26, 1.03, 4.28, 1.05, 0.5, 1.98, 1.14, 1.22, 1.46, 1.17, 1.46, 0.66]} \ No newline at end of file