diff --git a/annotations_filtered/h-Ss_FvzZcs_filtered.json b/annotations_filtered/h-Ss_FvzZcs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c95659d2a7153441a08b6da23933476e6fd2da80 --- /dev/null +++ b/annotations_filtered/h-Ss_FvzZcs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.1], [15.0, 28.04], [32.0, 46.94], [48.0, 67.27], [68.0, 74.14], [86.0, 102.95], [105.0, 124.92], [128.0, 133.89], [137.0, 144.56], [145.0, 150.8], [154.0, 155.21], [159.0, 159.24], [170.0, 171.31]], "keep_status": [false, false, true, false, true, false, false, true, false, false, false, false, false], "silence_prob": [35.42, 29.9, 30.24, 30.33, 30.32, 30.28, 30.09, 31.38, 33.35, 33.63, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 42.25], ["music", 35.44], ["quack", 7.12]], [["music", 76.63], ["synthetic singing", 1.57], ["funny music", 1.07]], [["livestock, farm animals, working animals", 36.16], ["music", 17.28], ["speech", 10.9]], [["moo", 31.23], ["cattle, bovinae", 20.38], ["music", 19.61]], [["speech", 22.65], ["music", 22.19], ["cattle, bovinae", 10.22]], [["music", 79.47], ["speech", 7.75], ["boing", 2.26]], [["cattle, bovinae", 52.03], ["moo", 34.41], ["livestock, farm animals, working animals", 11.98]], [["mosquito", 19.12], ["speech", 13.22], ["music", 11.87]], [["music", 31.5], ["speech", 30.62], ["fly, housefly", 10.57]], [["music", 59.16], ["carnatic music", 14.59], ["theremin", 3.22]], null, null, null], "duration": [4.1, 13.04, 14.94, 19.27, 6.14, 16.95, 19.92, 5.89, 7.56, 5.8, 1.21, 0.24, 1.31]} \ No newline at end of file diff --git a/annotations_filtered/h-UqMU-MIig_filtered.json b/annotations_filtered/h-UqMU-MIig_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1d3b78e51d7a5548357302ce4de07774bf9e98e --- /dev/null +++ b/annotations_filtered/h-UqMU-MIig_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.46], [3.0, 3.94], [5.0, 7.8], [10.0, 11.28], [13.0, 14.54], [17.0, 78.66], [85.0, 95.08], [99.0, 100.11], [100.0, 108.9], [110.0, 111.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 60.89, 0.0, 0.0, 0.0, 66.15, 0.0, 37.07, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 66.74], ["explosion", 7.79], ["echo", 3.13]], null], "duration": [0.46, 0.94, 2.8, 1.28, 1.54, 61.66, 10.08, 1.11, 8.9, 1.74]} \ No newline at end of file diff --git a/annotations_filtered/h0i2KfT2SB0_filtered.json b/annotations_filtered/h0i2KfT2SB0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bd4a39f5ccc0476f95affacf73d4db388a728dc --- /dev/null +++ b/annotations_filtered/h0i2KfT2SB0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.9], [16.0, 16.39], [16.0, 21.0], [24.0, 25.3], [27.0, 28.07], [30.0, 31.18], [32.0, 34.1], [42.0, 43.5], [45.0, 45.37], [48.0, 51.04], [54.0, 56.91], [58.0, 61.16], [61.0, 72.93], [76.0, 76.44], [77.0, 94.15], [95.0, 109.54], [110.0, 109.58], [110.0, 109.61], [113.0, 129.66]], "keep_status": [false, false, false, false, false, false, true, false, false, true, true, false, false, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 52.16, 0.0, 0.0, 0.0, 41.85, 0.0, 0.0, 47.62, 41.52, 50.26, 42.72, 0.0, 33.14, 32.33, 0.0, 0.0, 32.15], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 24.04], ["music", 23.09], ["throbbing", 10.22]], null, null, [["music", 15.65], ["hum", 11.85], ["speech", 11.17]], [["music", 38.01], ["electronic music", 11.39], ["hum", 11.1]], null, [["hum", 47.09], ["mains hum", 15.08], ["music", 15.05]], null, [["music", 27.1], ["speech", 17.89], ["didgeridoo", 7.98]], [["music", 22.3], ["throbbing", 19.26], ["whack, thwack", 17.18]], null, null, [["music", 58.59], ["didgeridoo", 4.55], ["speech", 3.73]]], "duration": [1.9, 0.39, 5.0, 1.3, 1.07, 1.18, 2.1, 1.5, 0.37, 3.04, 2.91, 3.16, 11.93, 0.44, 17.15, 14.54, -0.42, -0.39, 16.66]} \ No newline at end of file diff --git a/annotations_filtered/h0qWin97VyI_filtered.json b/annotations_filtered/h0qWin97VyI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e4a0017c1ae6e3e41ceb3ca415df2c056021410 --- /dev/null +++ b/annotations_filtered/h0qWin97VyI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.66], [15.0, 17.58], [18.0, 18.84], [20.0, 21.32], [26.0, 26.43], [35.0, 34.92], [36.0, 39.83], [41.0, 42.33], [44.0, 45.37], [46.0, 48.39], [50.0, 58.45], [59.0, 61.01], [62.0, 65.3], [66.0, 68.82], [69.0, 72.77], [74.0, 78.92], [80.0, 80.84], [81.0, 81.26], [97.0, 97.58], [98.0, 103.18], [106.0, 106.34], [112.0, 113.75], [114.0, 117.34], [118.0, 120.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 95.91, 0.0, 0.0, 0.0, 0.0, 91.98, 0.0, 0.0, 99.68, 79.41, 96.17, 94.37, 97.22, 94.81, 98.86, 0.0, 0.0, 0.0, 80.11, 0.0, 0.0, 70.44, 99.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.66, 2.58, 0.84, 1.32, 0.43, -0.08, 3.83, 1.33, 1.37, 2.39, 8.45, 2.01, 3.3, 2.82, 3.77, 4.92, 0.84, 0.26, 0.58, 5.18, 0.34, 1.75, 3.34, 2.23]} \ No newline at end of file diff --git a/annotations_filtered/h0qniQTX3r8_filtered.json b/annotations_filtered/h0qniQTX3r8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55bba2a99b9a194fe851dbfc9c880ab86b359995 --- /dev/null +++ b/annotations_filtered/h0qniQTX3r8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 45.45], [46.0, 45.99], [47.0, 73.04], [73.0, 78.19], [81.0, 80.65], [82.0, 86.59], [88.0, 91.18], [93.0, 96.01], [98.0, 98.76], [102.0, 104.57], [105.0, 108.08], [109.0, 123.26], [127.0, 128.83], [130.0, 134.96], [137.0, 142.65], [145.0, 148.88]], "keep_status": [false, false, true, true, false, true, false, false, false, true, false, true, false, true, true, false], "silence_prob": [0.0, 0.0, 35.25, 34.54, 0.0, 38.74, 42.11, 54.56, 0.0, 47.16, 92.31, 40.59, 0.0, 47.98, 33.88, 35.38], "audiomae_on_audioset": [null, null, [["hum", 22.25], ["buzz", 14.08], ["music", 12.33]], [["music", 12.52], ["mains hum", 12.33], ["hum", 9.4]], null, [["grunt", 32.61], ["music", 17.54], ["throbbing", 8.97]], [["livestock, farm animals, working animals", 39.8], ["moo", 19.39], ["cattle, bovinae", 18.7]], null, null, [["mains hum", 17.22], ["hum", 12.92], ["bow-wow", 10.71]], null, [["speech", 33.11], ["music", 32.6], ["didgeridoo", 4.01]], null, [["music", 31.24], ["didgeridoo", 12.39], ["speech", 7.23]], [["music", 25.94], ["hum", 19.4], ["mains hum", 11.57]], [["throbbing", 46.64], ["music", 24.96], ["hum", 14.1]]], "duration": [0.45, -0.01, 26.04, 5.19, -0.35, 4.59, 3.18, 3.01, 0.76, 2.57, 3.08, 14.26, 1.83, 4.96, 5.65, 3.88]} \ No newline at end of file diff --git a/annotations_filtered/h0z4HetQWME_filtered.json b/annotations_filtered/h0z4HetQWME_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0faf569a53cb55341259f8818320e5e955189ecb --- /dev/null +++ b/annotations_filtered/h0z4HetQWME_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.68], [7.0, 8.61], [13.0, 13.12], [15.0, 16.7], [17.0, 17.46], [18.0, 21.25], [22.0, 25.51], [28.0, 27.72], [30.0, 31.4], [33.0, 35.23], [38.0, 40.19], [40.0, 40.27], [40.0, 40.51], [41.0, 41.37], [46.0, 62.53], [68.0, 71.95], [79.0, 79.59], [80.0, 81.09], [84.0, 84.99], [86.0, 86.98], [90.0, 90.32], [91.0, 93.72], [96.0, 96.57], [101.0, 102.39], [103.0, 103.42], [114.0, 114.13], [115.0, 115.52], [118.0, 118.74], [120.0, 120.65], [123.0, 124.09], [125.0, 126.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 76.2, 39.09, 0.0, 0.0, 37.77, 38.67, 0.0, 0.0, 0.0, 33.26, 92.15, 0.0, 0.0, 0.0, 0.0, 0.0, 98.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 59.09], ["effects unit", 14.05], ["distortion", 4.8]], null, null, [["music", 75.79], ["guitar", 8.21], ["musical instrument", 4.77]], [["music", 53.29], ["boing", 10.42], ["sidetone", 7.19]], null, null, null, [["music", 64.77], ["synthesizer", 18.08], ["electronic music", 2.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.68, 1.61, 0.12, 1.7, 0.46, 3.25, 3.51, -0.28, 1.4, 2.23, 2.19, 0.27, 0.51, 0.37, 16.53, 3.95, 0.59, 1.09, 0.99, 0.98, 0.32, 2.72, 0.57, 1.39, 0.42, 0.13, 0.52, 0.74, 0.65, 1.09, 1.27]} \ No newline at end of file diff --git a/annotations_filtered/h1-T9LYq1hI_filtered.json b/annotations_filtered/h1-T9LYq1hI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb567b3b4bbe4280ac852ff76e6cb197d7d02fc5 --- /dev/null +++ b/annotations_filtered/h1-T9LYq1hI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 65.82]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [62.82]} \ No newline at end of file diff --git a/annotations_filtered/h1F9-NKqDDk_filtered.json b/annotations_filtered/h1F9-NKqDDk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09bcfbe2f35739dc85a4699ffcb73bd76a5289ec --- /dev/null +++ b/annotations_filtered/h1F9-NKqDDk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.48], [4.0, 21.15], [23.0, 24.39], [25.0, 29.13], [32.0, 32.91], [37.0, 37.5], [38.0, 40.34], [45.0, 45.4], [47.0, 49.05], [52.0, 52.54], [54.0, 56.4], [59.0, 60.74], [68.0, 68.91], [70.0, 70.61], [72.0, 72.5], [74.0, 75.78], [76.0, 76.35], [77.0, 77.82], [80.0, 81.85], [85.0, 85.38], [86.0, 85.78], [88.0, 88.89], [89.0, 93.93], [97.0, 103.23], [105.0, 112.45]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 36.3, 0.0, 72.16, 0.0, 0.0, 43.9, 0.0, 40.29, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.35, 45.11, 39.25], "audiomae_on_audioset": [null, [["beatboxing", 29.69], ["throbbing", 12.32], ["synthesizer", 12.18]], null, null, null, null, [["sidetone", 45.11], ["speech", 30.51], ["chirp tone", 9.62]], null, [["sine wave", 43.21], ["chirp tone", 39.57], ["speech", 3.79]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 53.28], ["theremin", 19.75], ["didgeridoo", 8.21]], [["music", 65.92], ["theremin", 10.77], ["musical instrument", 3.31]], [["music", 46.3], ["musical instrument", 8.35], ["synthesizer", 7.11]]], "duration": [1.48, 17.15, 1.39, 4.13, 0.91, 0.5, 2.34, 0.4, 2.05, 0.54, 2.4, 1.74, 0.91, 0.61, 0.5, 1.78, 0.35, 0.82, 1.85, 0.38, -0.22, 0.89, 4.93, 6.23, 7.45]} \ No newline at end of file diff --git a/annotations_filtered/h1aJoWg4vGo_filtered.json b/annotations_filtered/h1aJoWg4vGo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee4ead3006c5f7f42ec5b02e3c6b309eb555fd5a --- /dev/null +++ b/annotations_filtered/h1aJoWg4vGo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.2], [7.0, 7.79], [11.0, 11.2], [13.0, 13.56], [16.0, 16.56], [18.0, 19.89], [20.0, 21.2], [22.0, 25.03], [26.0, 26.38], [27.0, 28.88], [32.0, 34.4], [36.0, 36.58], [37.0, 37.72], [38.0, 38.79], [39.0, 40.07], [42.0, 42.06], [43.0, 43.88], [49.0, 54.08], [56.0, 57.03], [59.0, 59.64], [60.0, 72.71], [74.0, 75.03], [76.0, 77.79], [80.0, 81.5], [82.0, 83.91], [88.0, 88.35], [89.0, 90.17], [92.0, 92.47], [93.0, 93.55], [94.0, 95.2], [96.0, 96.45], [97.0, 101.34], [102.0, 109.14], [114.0, 114.98], [116.0, 123.13], [125.0, 126.17], [128.0, 127.8], [129.0, 129.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.17, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.78, 0.0, 0.0, 93.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.91, 99.95, 0.0, 68.67, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.2, 0.79, 0.2, 0.56, 0.56, 1.89, 1.2, 3.03, 0.38, 1.88, 2.4, 0.58, 0.72, 0.79, 1.07, 0.06, 0.88, 5.08, 1.03, 0.64, 12.71, 1.03, 1.79, 1.5, 1.91, 0.35, 1.17, 0.47, 0.55, 1.2, 0.45, 4.34, 7.14, 0.98, 7.13, 1.17, -0.2, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/h36wtoBcAS8_filtered.json b/annotations_filtered/h36wtoBcAS8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3544a14a1c2052bb675d549f19b7819755dbf9ec --- /dev/null +++ b/annotations_filtered/h36wtoBcAS8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.76], [4.0, 7.13], [14.0, 14.82], [15.0, 15.58], [21.0, 22.5], [31.0, 30.86], [32.0, 32.41], [33.0, 35.51], [36.0, 37.76], [42.0, 42.09], [44.0, 44.25], [54.0, 54.55], [56.0, 56.67], [58.0, 59.75], [60.0, 62.04], [64.0, 64.18], [66.0, 66.9], [68.0, 68.57], [70.0, 71.22], [72.0, 72.86], [74.0, 75.17], [76.0, 77.5], [80.0, 81.28], [83.0, 83.67], [85.0, 85.08], [86.0, 86.66], [87.0, 88.05], [90.0, 91.57], [92.0, 92.91], [98.0, 99.35], [100.0, 101.19], [101.0, 101.97], [103.0, 103.45], [105.0, 105.09], [107.0, 109.11], [117.0, 116.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 68.67, 0.0, 0.0, 0.0, 0.0, 0.0, 43.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 49.99], ["sidetone", 19.34], ["telephone", 6.11]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 34.69], ["throbbing", 19.02], ["speech", 14.88]], null], "duration": [0.76, 3.13, 0.82, 0.58, 1.5, -0.14, 0.41, 2.51, 1.76, 0.09, 0.25, 0.55, 0.67, 1.75, 2.04, 0.18, 0.9, 0.57, 1.22, 0.86, 1.17, 1.5, 1.28, 0.67, 0.08, 0.66, 1.05, 1.57, 0.91, 1.35, 1.19, 0.97, 0.45, 0.09, 2.11, -0.1]} \ No newline at end of file diff --git a/annotations_filtered/h3AqOR2Ru1s_filtered.json b/annotations_filtered/h3AqOR2Ru1s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51e1c26cd1dc68f1404784f0d332a45e8e091f5f --- /dev/null +++ b/annotations_filtered/h3AqOR2Ru1s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.61], [13.0, 13.17], [13.0, 13.22], [14.0, 14.42], [16.0, 17.02], [29.0, 30.3], [31.0, 31.75], [35.0, 38.53], [39.0, 38.58], [41.0, 43.73], [54.0, 54.45], [60.0, 60.61], [63.0, 65.7], [73.0, 82.17], [85.0, 94.46], [98.0, 108.01], [116.0, 124.31], [126.0, 127.89], [131.0, 134.57], [138.0, 137.94], [149.0, 149.3], [153.0, 153.79], [156.0, 155.55], [180.0, 184.55], [193.0, 194.83], [196.0, 200.21], [207.0, 209.22], [213.0, 214.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.02, 0.0, 68.54, 0.0, 0.0, 61.08, 55.89, 45.49, 40.54, 33.53, 0.0, 39.57, 0.0, 0.0, 0.0, 0.0, 35.45, 0.0, 39.38, 36.65, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 36.74], ["music", 31.03], ["thunk", 11.34]], null, null, null, null, null, null, [["music", 37.88], ["speech", 6.8], ["musical instrument", 3.92]], [["music", 43.81], ["hum", 13.97], ["throbbing", 7.65]], [["whack, thwack", 39.53], ["groan", 24.1], ["music", 15.48]], null, [["music", 45.74], ["synthesizer", 8.64], ["hum", 7.36]], null, null, null, null, [["music", 46.93], ["boing", 14.76], ["speech", 13.02]], null, [["music", 57.5], ["theremin", 6.44], ["synthesizer", 5.54]], [["music", 53.27], ["speech", 7.32], ["quack", 3.24]], null], "duration": [1.61, 0.17, 0.22, 0.42, 1.02, 1.3, 0.75, 3.53, -0.42, 2.73, 0.45, 0.61, 2.7, 9.17, 9.46, 10.01, 8.31, 1.89, 3.57, -0.06, 0.3, 0.79, -0.45, 4.55, 1.83, 4.21, 2.22, 1.62]} \ No newline at end of file diff --git a/annotations_filtered/h3VZ6IRrVlI_filtered.json b/annotations_filtered/h3VZ6IRrVlI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..849dcfd775434523b4a3f7caf64ce6938841524c --- /dev/null +++ b/annotations_filtered/h3VZ6IRrVlI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.64], [3.0, 8.01], [9.0, 9.58], [14.0, 15.43], [16.0, 17.66], [21.0, 22.11], [23.0, 40.09], [41.0, 44.24], [45.0, 48.68], [50.0, 50.25], [51.0, 51.97], [54.0, 54.94], [56.0, 63.22], [64.0, 64.67], [65.0, 65.42], [66.0, 69.92], [72.0, 72.25], [74.0, 75.66], [76.0, 75.73], [76.0, 75.79], [76.0, 81.9], [82.0, 83.62], [84.0, 87.49], [88.0, 89.55], [90.0, 91.96], [92.0, 92.01], [92.0, 92.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.92, 0.0, 0.0, 0.0, 0.0, 97.92, 94.52, 67.25, 0.0, 0.0, 0.0, 39.72, 0.0, 0.0, 37.4, 0.0, 0.0, 0.0, 0.0, 49.82, 0.0, 67.25, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 77.68], ["fart", 1.65], ["noise", 1.44]], null, null, null, null, null, null, null, null, null, null, [["speech", 64.51], ["hum", 4.66], ["whistling", 4.22]], null, null, [["speech", 58.84], ["fart", 26.91], ["inside, small room", 1.14]], null, null, null, null, [["speech", 71.78], ["noise", 12.41], ["radio", 4.88]], null, null, null, null, null, null], "duration": [-0.36, 5.01, 0.58, 1.43, 1.66, 1.11, 17.09, 3.24, 3.68, 0.25, 0.97, 0.94, 7.22, 0.67, 0.42, 3.92, 0.25, 1.66, -0.27, -0.21, 5.9, 1.62, 3.49, 1.55, 1.96, 0.01, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/h3g5B5JhFcY_filtered.json b/annotations_filtered/h3g5B5JhFcY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45afd4a0052d04c2779895b24747081132b55143 --- /dev/null +++ b/annotations_filtered/h3g5B5JhFcY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 51.21], [66.0, 66.39], [68.0, 67.93], [79.0, 79.69], [83.0, 83.56], [85.0, 86.97], [89.0, 112.78], [113.0, 114.79], [116.0, 133.12], [133.0, 133.24]], "keep_status": [false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.55, 0.0, 39.05, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["whale vocalization", 31.38], ["stomach rumble", 12.99], ["animal", 11.51]], null, [["hum", 40.7], ["music", 13.71], ["mains hum", 12.94]], null], "duration": [1.21, 0.39, -0.07, 0.69, 0.56, 1.97, 23.78, 1.79, 17.12, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/h41ylpWhV1I_filtered.json b/annotations_filtered/h41ylpWhV1I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a50aa29c280ed18eaaa71ab9d5ae010cb63bb46c --- /dev/null +++ b/annotations_filtered/h41ylpWhV1I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 25.71], [33.0, 34.06], [37.0, 89.95], [95.0, 105.92]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 51.55], "audiomae_on_audioset": [null, null, null, null], "duration": [1.71, 1.06, 52.95, 10.92]} \ No newline at end of file diff --git a/annotations_filtered/h44egWnbrrg_filtered.json b/annotations_filtered/h44egWnbrrg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..056102ffbbbab7ca970795ac8947a3e91e46a53b --- /dev/null +++ b/annotations_filtered/h44egWnbrrg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.25], [9.0, 9.41], [10.0, 12.55], [14.0, 15.62], [16.0, 17.83], [22.0, 24.02], [26.0, 26.52], [35.0, 37.37], [39.0, 39.65], [41.0, 42.15], [44.0, 46.89], [50.0, 51.98], [55.0, 55.61], [57.0, 57.97], [59.0, 60.93], [64.0, 64.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 67.89, 0.0, 0.0, 58.89, 0.0, 50.76, 0.0, 0.0, 66.27, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.25, 0.41, 2.55, 1.62, 1.83, 2.02, 0.52, 2.37, 0.65, 1.15, 2.89, 1.98, 0.61, 0.97, 1.93, 0.37]} \ No newline at end of file diff --git a/annotations_filtered/h4SMndWj5To_filtered.json b/annotations_filtered/h4SMndWj5To_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2395afc3bde71d979b1671c58653ed28ff87f78b --- /dev/null +++ b/annotations_filtered/h4SMndWj5To_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.87], [19.0, 20.41], [21.0, 60.44], [61.0, 73.11], [91.0, 91.77], [96.0, 111.2]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 97.73, 0.0, 30.74], "audiomae_on_audioset": [null, null, null, null, null, [["music", 70.19], ["swing music", 7.36], ["brass instrument", 1.7]]], "duration": [0.87, 1.41, 39.44, 12.11, 0.77, 15.2]} \ No newline at end of file diff --git a/annotations_filtered/h4eOGlJpLYg_filtered.json b/annotations_filtered/h4eOGlJpLYg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0de4e7533371a6cf9f215ed1ecdd3fa89111472 --- /dev/null +++ b/annotations_filtered/h4eOGlJpLYg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.3], [9.0, 10.77], [11.0, 11.74], [13.0, 18.79], [20.0, 22.17], [23.0, 23.45], [25.0, 25.03], [26.0, 26.45], [27.0, 27.41], [28.0, 28.34], [29.0, 28.81], [31.0, 31.4], [32.0, 33.83], [36.0, 36.98], [48.0, 49.35], [51.0, 52.3], [53.0, 53.11], [61.0, 61.21], [63.0, 63.76], [67.0, 68.18], [72.0, 77.72], [83.0, 89.83], [91.0, 93.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 58.47, 97.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.82, 38.84, 34.18], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 69.0], ["radio", 6.41], ["explosion", 1.86]], [["animal", 34.25], ["speech", 13.49], ["clip-clop", 13.09]]], "duration": [0.3, 1.77, 0.74, 5.79, 2.17, 0.45, 0.03, 0.45, 0.41, 0.34, -0.19, 0.4, 1.83, 0.98, 1.35, 1.3, 0.11, 0.21, 0.76, 1.18, 5.72, 6.83, 2.99]} \ No newline at end of file diff --git a/annotations_filtered/h4lbn5nDXwY_filtered.json b/annotations_filtered/h4lbn5nDXwY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6c57ff8702ccf915473589b2f9877efbec0579d --- /dev/null +++ b/annotations_filtered/h4lbn5nDXwY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.85], [10.0, 11.69], [14.0, 14.91], [15.0, 16.04], [17.0, 17.32], [35.0, 46.18], [47.0, 47.09], [53.0, 54.45], [62.0, 63.64], [66.0, 67.07], [89.0, 90.44], [99.0, 100.16], [102.0, 103.69]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 57.01], ["whack, thwack", 3.63], ["mosquito", 2.7]], null, null, null, null, null, null, null], "duration": [0.85, 1.69, 0.91, 1.04, 0.32, 11.18, 0.09, 1.45, 1.64, 1.07, 1.44, 1.16, 1.69]} \ No newline at end of file diff --git a/annotations_filtered/h4u9pO-98ZM_filtered.json b/annotations_filtered/h4u9pO-98ZM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b6626a328f5bcf4658d5814b32492caa4b668ac --- /dev/null +++ b/annotations_filtered/h4u9pO-98ZM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.31], [6.0, 6.34], [15.0, 15.45], [17.0, 18.28], [19.0, 19.99], [24.0, 24.02], [39.0, 40.54], [43.0, 43.68], [51.0, 52.84], [54.0, 57.08]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 32.41], ["hum", 21.87], ["mains hum", 15.24]]], "duration": [1.31, 0.34, 0.45, 1.28, 0.99, 0.02, 1.54, 0.68, 1.84, 3.08]} \ No newline at end of file diff --git a/annotations_filtered/h52UYfkLhXg_filtered.json b/annotations_filtered/h52UYfkLhXg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41bfcc50f93e92f1435fbf60c22de8c19cd36522 --- /dev/null +++ b/annotations_filtered/h52UYfkLhXg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.0], [1.0, 1.12], [5.0, 5.27], [7.0, 8.63], [19.0, 19.25], [22.0, 22.69], [37.0, 37.32], [45.0, 44.95], [65.0, 65.08], [67.0, 66.77], [69.0, 69.63], [70.0, 71.78], [76.0, 76.69], [78.0, 78.41], [81.0, 81.4], [86.0, 87.59], [102.0, 102.27], [112.0, 111.91], [116.0, 115.74], [117.0, 117.83], [125.0, 125.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.0, 0.12, 0.27, 1.63, 0.25, 0.69, 0.32, -0.05, 0.08, -0.23, 0.63, 1.78, 0.69, 0.41, 0.4, 1.59, 0.27, -0.09, -0.26, 0.83, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/h55rTtbCy7o_filtered.json b/annotations_filtered/h55rTtbCy7o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c6d4ac6af0559b5dd884692fe5f6ad4114e91f5 --- /dev/null +++ b/annotations_filtered/h55rTtbCy7o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.91], [6.0, 6.3], [8.0, 8.82], [11.0, 11.65], [15.0, 16.06], [17.0, 17.02], [24.0, 23.99], [25.0, 25.78], [27.0, 28.56], [32.0, 32.36], [33.0, 34.38], [36.0, 52.25], [55.0, 56.02], [76.0, 77.19], [89.0, 89.56], [90.0, 90.95], [93.0, 92.99], [94.0, 95.93], [97.0, 97.41], [98.0, 98.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.91, 0.3, 0.82, 0.65, 1.06, 0.02, -0.01, 0.78, 1.56, 0.36, 1.38, 16.25, 1.02, 1.19, 0.56, 0.95, -0.01, 1.93, 0.41, 0.41]} \ No newline at end of file diff --git a/annotations_filtered/h5KBS20Ke6U_filtered.json b/annotations_filtered/h5KBS20Ke6U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2dd207567f14a56218383251620149ba6be3f12f --- /dev/null +++ b/annotations_filtered/h5KBS20Ke6U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 28.02], [29.0, 30.08], [32.0, 32.81], [37.0, 37.81], [38.0, 39.55], [41.0, 41.81], [45.0, 48.39], [54.0, 55.61], [56.0, 59.1], [62.0, 62.68], [63.0, 63.54], [81.0, 81.45], [86.0, 87.03], [103.0, 103.06], [104.0, 104.08], [110.0, 110.35], [112.0, 112.28], [113.0, 113.24], [114.0, 123.11], [125.0, 139.97], [143.0, 142.89], [144.0, 145.52]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [67.89, 0.0, 0.0, 0.0, 0.0, 0.0, 49.13, 0.0, 48.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.94, 44.12, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["sine wave", 29.16], ["chirp tone", 25.45], ["noise", 8.28]], null, [["sidetone", 30.77], ["speech", 22.99], ["whale vocalization", 9.98]], null, null, null, null, null, null, null, null, null, [["animal", 15.49], ["music", 14.86], ["buzz", 7.42]], [["speech", 10.61], ["crow", 9.88], ["animal", 8.94]], null, null], "duration": [2.02, 1.08, 0.81, 0.81, 1.55, 0.81, 3.39, 1.61, 3.1, 0.68, 0.54, 0.45, 1.03, 0.06, 0.08, 0.35, 0.28, 0.24, 9.11, 14.97, -0.11, 1.52]} \ No newline at end of file diff --git a/annotations_filtered/h5OjSHDUn8c_filtered.json b/annotations_filtered/h5OjSHDUn8c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96b454912652b8d5520cb1f7f398cb9489397b16 --- /dev/null +++ b/annotations_filtered/h5OjSHDUn8c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [5.0, 12.92], [14.0, 15.26], [16.0, 16.53], [18.0, 18.84], [21.0, 21.37], [23.0, 24.75], [27.0, 27.92], [34.0, 37.57], [43.0, 44.46], [46.0, 47.14], [54.0, 55.97], [57.0, 58.5], [60.0, 59.93], [64.0, 63.8], [68.0, 68.67], [73.0, 72.87], [80.0, 81.03], [84.0, 84.7], [87.0, 89.01], [94.0, 95.72], [102.0, 108.89], [116.0, 115.79], [116.0, 115.96], [122.0, 122.69], [141.0, 143.24], [149.0, 150.23], [156.0, 157.27], [160.0, 161.64], [164.0, 165.11], [166.0, 168.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 36.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.11, 0.0, 98.99, 0.0, 0.0, 0.0, 50.41, 0.0, 0.0, 0.0, 0.0, 40.81], "audiomae_on_audioset": [null, [["applause", 90.09], ["clapping", 1.27], ["eruption", 1.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 20.73], ["hum", 14.9], ["theremin", 9.43]], null, null, null, null, null, null, null, null, null, null, [["music", 48.89], ["musical instrument", 6.53], ["sidetone", 4.56]]], "duration": [0.5, 7.92, 1.26, 0.53, 0.84, 0.37, 1.75, 0.92, 3.57, 1.46, 1.14, 1.97, 1.5, -0.07, -0.2, 0.67, -0.13, 1.03, 0.7, 2.01, 1.72, 6.89, -0.21, -0.04, 0.69, 2.24, 1.23, 1.27, 1.64, 1.11, 2.12]} \ No newline at end of file diff --git a/annotations_filtered/h5RMM02YE3U_filtered.json b/annotations_filtered/h5RMM02YE3U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c048e18dca33e9cac69a4211ba0b2c679aa82d17 --- /dev/null +++ b/annotations_filtered/h5RMM02YE3U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.26], [5.0, 7.1], [8.0, 11.42], [12.0, 17.73], [19.0, 43.63], [44.0, 52.47], [54.0, 85.08], [86.0, 87.27], [89.0, 90.41]], "keep_status": [false, false, false, true, true, true, false, false, false], "silence_prob": [0.0, 42.37, 53.04, 32.96, 36.65, 34.18, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 48.89], ["speech", 24.43], ["effects unit", 3.46]], null, [["livestock, farm animals, working animals", 16.51], ["speech", 14.39], ["cattle, bovinae", 10.34]], [["chime", 27.82], ["music", 26.15], ["wind chime", 10.29]], [["music", 30.51], ["brass instrument", 23.0], ["trombone", 10.72]], null, null, null], "duration": [1.26, 2.1, 3.42, 5.73, 24.63, 8.47, 31.08, 1.27, 1.41]} \ No newline at end of file diff --git a/annotations_filtered/h5UGcMYOaaU_filtered.json b/annotations_filtered/h5UGcMYOaaU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d201505495f7dbc0d0b34c9d016bc4cd959c71a6 --- /dev/null +++ b/annotations_filtered/h5UGcMYOaaU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.78], [6.0, 13.98], [19.0, 19.45], [20.0, 20.93], [22.0, 26.0], [30.0, 30.06], [31.0, 31.23], [33.0, 34.74], [60.0, 60.29], [61.0, 62.02], [77.0, 78.06], [94.0, 97.95], [104.0, 105.02], [108.0, 122.2], [123.0, 122.82], [126.0, 126.15], [127.0, 127.31]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 33.28, 0.0, 0.0, 37.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.11, 0.0, 34.32, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 76.82], ["smash, crash", 4.99], ["breaking", 4.03]], null, null, [["speech", 27.94], ["music", 23.04], ["didgeridoo", 13.53]], null, null, null, null, null, null, [["snicker", 30.41], ["laughter", 26.11], ["speech", 11.65]], null, [["music", 52.07], ["hum", 13.93], ["throbbing", 13.05]], null, null, null], "duration": [-0.22, 7.98, 0.45, 0.93, 4.0, 0.06, 0.23, 1.74, 0.29, 1.02, 1.06, 3.95, 1.02, 14.2, -0.18, 0.15, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/h5dCFGJp__0_filtered.json b/annotations_filtered/h5dCFGJp__0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..485590f70e10137777923a92e145232657c13a55 --- /dev/null +++ b/annotations_filtered/h5dCFGJp__0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.41], [7.0, 7.05], [8.0, 8.09], [9.0, 9.95], [12.0, 12.45], [13.0, 14.82], [16.0, 17.56], [18.0, 20.88], [22.0, 27.13], [31.0, 33.07], [37.0, 52.0], [52.0, 54.21], [55.0, 59.75], [63.0, 63.42], [68.0, 69.31], [72.0, 72.71], [74.0, 74.34], [77.0, 77.21], [78.0, 79.49], [80.0, 81.43], [82.0, 86.12], [87.0, 94.17], [97.0, 99.12], [100.0, 102.07], [103.0, 102.79], [111.0, 110.96], [112.0, 112.35], [114.0, 114.37], [115.0, 116.75], [117.0, 116.82], [117.0, 117.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.6, 37.75, 98.01, 99.99, 49.64, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 99.99, 32.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 76.12], ["sidetone", 6.68], ["hum", 4.22]], null, null, [["speech", 32.17], ["sine wave", 16.38], ["dial tone", 8.95]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 63.9], ["fart", 12.51], ["inside, small room", 3.52]], null, null, null, null, null, null, null], "duration": [1.41, 0.05, 0.09, 0.95, 0.45, 1.82, 1.56, 2.88, 5.13, 2.07, 15.0, 2.21, 4.75, 0.42, 1.31, 0.71, 0.34, 0.21, 1.49, 1.43, 4.12, 7.17, 2.12, 2.07, -0.21, -0.04, 0.35, 0.37, 1.75, -0.18, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/h5f5GgqVWes_filtered.json b/annotations_filtered/h5f5GgqVWes_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2136c73d253f6c8f41a85dcc97979848129dc876 --- /dev/null +++ b/annotations_filtered/h5f5GgqVWes_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.3], [3.0, 3.15], [4.0, 4.94], [6.0, 6.42], [9.0, 9.58], [11.0, 11.11], [13.0, 13.85], [15.0, 17.17], [19.0, 18.71], [24.0, 24.0], [27.0, 27.18], [29.0, 29.54], [30.0, 31.87], [32.0, 33.47], [35.0, 35.4], [38.0, 39.39], [40.0, 42.74], [46.0, 47.09], [50.0, 50.25], [51.0, 53.47], [59.0, 65.5], [66.0, 72.37], [75.0, 75.88], [77.0, 85.23], [87.0, 87.79], [90.0, 91.22], [92.0, 93.87], [98.0, 101.68], [103.0, 104.23], [105.0, 106.49], [110.0, 110.51], [119.0, 118.69], [119.0, 126.37], [128.0, 129.27], [135.0, 152.95], [154.0, 154.47], [156.0, 157.42], [158.0, 159.97], [161.0, 163.21], [165.0, 166.77], [168.0, 168.88], [172.0, 181.6], [185.0, 184.87], [186.0, 187.29]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.43, 0.0, 0.0, 35.45, 36.25, 35.84, 0.0, 40.73, 0.0, 0.0, 0.0, 50.97, 0.0, 0.0, 0.0, 0.0, 28.73, 0.0, 29.69, 0.0, 0.0, 0.0, 91.98, 0.0, 0.0, 42.06, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 42.9], ["theremin", 8.67], ["didgeridoo", 4.23]], null, null, null, null, null, null, null, null, [["whale vocalization", 55.35], ["hum", 7.65], ["music", 7.25]], null, null, [["speech", 40.57], ["clip-clop", 7.25], ["horse", 6.04]], [["music", 35.22], ["burping, eructation", 13.38], ["hum", 8.14]], [["music", 38.14], ["speech", 26.11], ["sidetone", 6.84]], null, [["music", 61.67], ["speech", 8.9], ["throbbing", 7.37]], null, null, null, null, null, null, null, null, [["gong", 20.22], ["music", 19.82], ["speech", 18.24]], null, [["music", 46.78], ["breaking", 13.87], ["buzz", 4.32]], null, null, null, null, null, null, [["music", 28.27], ["hum", 22.99], ["mains hum", 10.87]], null, null], "duration": [0.3, 0.15, 0.94, 0.42, 0.58, 0.11, 0.85, 2.17, -0.29, 0.0, 0.18, 0.54, 1.87, 1.47, 0.4, 1.39, 2.74, 1.09, 0.25, 2.47, 6.5, 6.37, 0.88, 8.23, 0.79, 1.22, 1.87, 3.68, 1.23, 1.49, 0.51, -0.31, 7.37, 1.27, 17.95, 0.47, 1.42, 1.97, 2.21, 1.77, 0.88, 9.6, -0.13, 1.29]} \ No newline at end of file diff --git a/annotations_filtered/h5jZBcDev1s_filtered.json b/annotations_filtered/h5jZBcDev1s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbfdcc5d7c773b332bbe64cff72b745e27216c7e --- /dev/null +++ b/annotations_filtered/h5jZBcDev1s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.58], [6.0, 6.45], [7.0, 12.82], [14.0, 22.32], [28.0, 29.94], [40.0, 48.47], [51.0, 56.89], [58.0, 59.98], [61.0, 110.47], [113.0, 121.12], [123.0, 124.5], [126.0, 129.12], [130.0, 131.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.9, 99.97, 0.0, 90.6, 98.44, 0.0, 0.0, 72.01, 0.0, 69.61, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.58, 0.45, 5.82, 8.32, 1.94, 8.47, 5.89, 1.98, 49.47, 8.12, 1.5, 3.12, 1.48]} \ No newline at end of file diff --git a/annotations_filtered/h5nhyFFSweU_filtered.json b/annotations_filtered/h5nhyFFSweU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9ce3a4d2250912c428947e574af5366ee7f22fe --- /dev/null +++ b/annotations_filtered/h5nhyFFSweU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.54], [10.0, 11.08], [13.0, 13.26], [14.0, 15.28], [18.0, 19.58], [21.0, 22.05], [23.0, 23.08], [25.0, 25.89], [27.0, 27.72], [28.0, 29.22], [30.0, 30.99], [31.0, 32.88], [35.0, 35.02], [35.0, 36.91], [41.0, 41.91], [43.0, 43.06], [45.0, 46.31], [47.0, 48.03], [50.0, 50.85], [54.0, 54.85], [57.0, 57.69], [60.0, 60.37], [62.0, 68.82], [70.0, 71.0], [71.0, 73.74], [77.0, 81.77], [83.0, 84.75], [87.0, 88.1], [89.0, 89.95], [91.0, 98.85], [101.0, 101.39], [105.0, 105.81], [107.0, 108.19], [112.0, 112.23], [114.0, 115.99], [119.0, 120.26], [129.0, 130.27], [131.0, 132.68], [133.0, 134.15], [135.0, 135.68], [136.0, 137.69], [138.0, 139.55], [141.0, 141.35], [142.0, 143.21], [145.0, 146.26], [147.0, 147.34], [150.0, 150.75], [151.0, 151.88], [153.0, 154.5], [156.0, 160.07], [161.0, 174.48], [176.0, 177.09], [180.0, 180.57], [181.0, 201.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.35, 0.0, 67.89, 92.48, 0.0, 0.0, 0.0, 60.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.95, 71.43, 0.0, 0.0, 80.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 45.37], ["speech", 16.63], ["radio", 12.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.54, 1.08, 0.26, 1.28, 1.58, 1.05, 0.08, 0.89, 0.72, 1.22, 0.99, 1.88, 0.02, 1.91, 0.91, 0.06, 1.31, 1.03, 0.85, 0.85, 0.69, 0.37, 6.82, 1.0, 2.74, 4.77, 1.75, 1.1, 0.95, 7.85, 0.39, 0.81, 1.19, 0.23, 1.99, 1.26, 1.27, 1.68, 1.15, 0.68, 1.69, 1.55, 0.35, 1.21, 1.26, 0.34, 0.75, 0.88, 1.5, 4.07, 13.48, 1.09, 0.57, 20.92]} \ No newline at end of file diff --git a/annotations_filtered/h6iHbAju1cI_filtered.json b/annotations_filtered/h6iHbAju1cI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea5417cea2f3cbf4ad69e90f6730cb4aa09cb4dc --- /dev/null +++ b/annotations_filtered/h6iHbAju1cI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.59], [19.0, 20.63], [22.0, 35.29], [54.0, 54.48], [55.0, 57.0], [58.0, 58.38], [79.0, 82.22], [83.0, 85.13], [86.0, 86.63]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [34.4, 0.0, 30.86, 0.0, 99.97, 0.0, 30.75, 98.51, 0.0], "audiomae_on_audioset": [[["music", 39.17], ["speech", 34.89], ["sidetone", 4.09]], null, [["music", 71.91], ["throbbing", 7.47], ["smash, crash", 3.99]], null, null, null, [["cattle, bovinae", 33.1], ["moo", 22.97], ["livestock, farm animals, working animals", 22.9]], null, null], "duration": [3.59, 1.63, 13.29, 0.48, 2.0, 0.38, 3.22, 2.13, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/h7CCnLwD2MY_filtered.json b/annotations_filtered/h7CCnLwD2MY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a91489a954ff96d7eb9cb185e483b68cc556ead --- /dev/null +++ b/annotations_filtered/h7CCnLwD2MY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 22.69], [23.0, 28.8], [30.0, 30.74], [35.0, 35.58], [42.0, 43.28], [46.0, 46.77], [49.0, 49.01], [54.0, 54.24], [59.0, 61.18], [64.0, 64.61], [80.0, 82.0], [93.0, 94.02], [104.0, 105.24], [111.0, 111.64], [119.0, 119.48], [121.0, 122.89], [124.0, 125.32]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.28, 0.0, 95.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 71.36], ["speech", 6.46], ["sidetone", 4.72]], null, null, null, null, null, null, [["music", 37.04], ["hum", 16.07], ["speech", 11.15]], null, null, null, null, null, null, null, null], "duration": [-0.31, 5.8, 0.74, 0.58, 1.28, 0.77, 0.01, 0.24, 2.18, 0.61, 2.0, 1.02, 1.24, 0.64, 0.48, 1.89, 1.32]} \ No newline at end of file diff --git a/annotations_filtered/h7NG9ZEfyKo_filtered.json b/annotations_filtered/h7NG9ZEfyKo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/h7NG9ZEfyKo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/h7ZUKB_zYQ0_filtered.json b/annotations_filtered/h7ZUKB_zYQ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6447a40526001aacce22265aa69217c6468cad26 --- /dev/null +++ b/annotations_filtered/h7ZUKB_zYQ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.54], [8.0, 13.34], [15.0, 14.91], [18.0, 21.66], [22.0, 24.22], [34.0, 36.78], [37.0, 38.1], [41.0, 43.48], [45.0, 45.79], [47.0, 49.42], [55.0, 57.59], [85.0, 85.95], [90.0, 93.23], [94.0, 98.39], [105.0, 106.1], [113.0, 115.2], [117.0, 118.35], [120.0, 120.45]], "keep_status": [false, true, false, false, false, false, false, false, false, true, true, false, true, false, false, true, false, false], "silence_prob": [0.0, 36.11, 0.0, 33.37, 62.68, 58.47, 0.0, 64.63, 0.0, 49.64, 35.47, 0.0, 40.52, 69.2, 0.0, 43.93, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 29.2], ["whale vocalization", 13.55], ["speech", 10.12]], null, [["music", 60.05], ["theremin", 12.25], ["synthesizer", 5.57]], null, null, null, null, null, [["music", 49.07], ["didgeridoo", 8.61], ["theremin", 7.96]], [["speech", 31.37], ["vehicle", 11.38], ["field recording", 7.32]], null, [["music", 45.23], ["foghorn", 9.39], ["theremin", 6.1]], null, null, [["speech", 36.54], ["hum", 11.3], ["telephone", 8.46]], null, null], "duration": [0.54, 5.34, -0.09, 3.66, 2.22, 2.78, 1.1, 2.48, 0.79, 2.42, 2.59, 0.95, 3.23, 4.39, 1.1, 2.2, 1.35, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/h7wEE6Yx7IQ_filtered.json b/annotations_filtered/h7wEE6Yx7IQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..889daba38a84327fd064e4cc73a42844bbe77cea --- /dev/null +++ b/annotations_filtered/h7wEE6Yx7IQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.6], [9.0, 55.9], [56.0, 59.49], [61.0, 62.06], [64.0, 65.74], [67.0, 67.41], [68.0, 69.55], [72.0, 86.73], [88.0, 89.5], [92.0, 93.73], [95.0, 96.92], [99.0, 107.91], [110.0, 111.21], [113.0, 114.34], [115.0, 117.9], [119.0, 127.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [99.98, 0.0, 68.93, 0.0, 0.0, 0.0, 0.0, 55.53, 0.0, 0.0, 0.0, 76.2, 0.0, 0.0, 41.4, 35.47], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 38.69], ["creak", 9.08], ["cattle, bovinae", 5.22]], [["speech", 78.65], ["whale vocalization", 4.36], ["didgeridoo", 2.3]]], "duration": [5.6, 46.9, 3.49, 1.06, 1.74, 0.41, 1.55, 14.73, 1.5, 1.73, 1.92, 8.91, 1.21, 1.34, 2.9, 8.2]} \ No newline at end of file diff --git a/annotations_filtered/h8E3sSTc11E_filtered.json b/annotations_filtered/h8E3sSTc11E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47f43a5b7d168b93b14b414986b02d9d423791d1 --- /dev/null +++ b/annotations_filtered/h8E3sSTc11E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[75.0, 78.78], [80.0, 91.84]], "keep_status": [false, false], "silence_prob": [80.11, 47.62], "audiomae_on_audioset": [null, [["music", 63.35], ["musical instrument", 6.06], ["synthesizer", 5.07]]], "duration": [3.78, 11.84]} \ No newline at end of file diff --git a/annotations_filtered/h8Rxb-9snJQ_filtered.json b/annotations_filtered/h8Rxb-9snJQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c85a18809aa38da4ce1c46f7f654f330d6fb1b84 --- /dev/null +++ b/annotations_filtered/h8Rxb-9snJQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.87], [6.0, 8.48], [9.0, 10.13], [12.0, 13.86], [15.0, 19.57], [21.0, 22.74], [24.0, 26.43], [28.0, 28.75], [30.0, 31.72], [33.0, 33.37], [34.0, 36.15], [37.0, 38.65], [39.0, 40.69], [42.0, 43.26], [47.0, 47.12], [49.0, 49.5], [52.0, 52.98], [54.0, 55.36], [56.0, 56.61], [58.0, 58.45], [60.0, 60.03], [62.0, 61.75], [64.0, 66.21], [70.0, 72.17], [74.0, 74.01], [74.0, 74.34], [78.0, 82.68], [84.0, 87.94], [93.0, 94.36], [95.0, 96.89], [99.0, 99.93], [101.0, 101.65], [102.0, 105.97], [113.0, 115.5], [119.0, 122.64], [124.0, 125.69], [127.0, 128.63]], "keep_status": [true, false, false, false, true, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false, false, false, true, true, true, false, false], "silence_prob": [34.1, 33.0, 0.0, 0.0, 38.23, 0.0, 37.02, 0.0, 0.0, 0.0, 35.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.72, 31.84, 0.0, 0.0, 35.68, 36.89, 0.0, 0.0, 0.0, 0.0, 33.12, 41.64, 36.11, 0.0, 0.0], "audiomae_on_audioset": [[["throbbing", 32.54], ["music", 15.58], ["hum", 9.35]], [["speech", 65.18], ["music", 12.02], ["throbbing", 7.75]], null, null, [["fly, housefly", 23.16], ["bee, wasp, etc.", 18.88], ["throbbing", 14.45]], null, [["throbbing", 24.22], ["hum", 23.67], ["music", 20.48]], null, null, null, [["speech", 14.62], ["music", 11.39], ["fly, housefly", 8.61]], null, null, null, null, null, null, null, null, null, null, null, [["music", 46.45], ["hum", 9.7], ["mains hum", 9.21]], [["fly, housefly", 53.61], ["mosquito", 16.98], ["insect", 16.62]], null, null, [["hum", 26.72], ["throbbing", 21.24], ["music", 13.32]], [["music", 33.06], ["didgeridoo", 14.58], ["throbbing", 8.44]], null, null, null, null, [["speech", 38.21], ["hum", 12.64], ["bee, wasp, etc.", 9.93]], [["fly, housefly", 23.38], ["bee, wasp, etc.", 18.43], ["insect", 12.3]], [["throbbing", 20.62], ["hum", 11.72], ["music", 7.99]], null, null], "duration": [2.87, 2.48, 1.13, 1.86, 4.57, 1.74, 2.43, 0.75, 1.72, 0.37, 2.15, 1.65, 1.69, 1.26, 0.12, 0.5, 0.98, 1.36, 0.61, 0.45, 0.03, -0.25, 2.21, 2.17, 0.01, 0.34, 4.68, 3.94, 1.36, 1.89, 0.93, 0.65, 3.97, 2.5, 3.64, 1.69, 1.63]} \ No newline at end of file diff --git a/annotations_filtered/h8c0Q6aqZG8_filtered.json b/annotations_filtered/h8c0Q6aqZG8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..511c79d3d3169a5742ae321510b66be6225d3a93 --- /dev/null +++ b/annotations_filtered/h8c0Q6aqZG8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.64], [10.0, 10.29], [13.0, 14.74], [15.0, 15.74], [19.0, 19.47], [21.0, 22.0], [23.0, 23.8], [26.0, 26.81], [28.0, 29.17], [30.0, 31.09], [32.0, 31.77], [33.0, 33.83], [34.0, 35.11], [36.0, 37.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.64, 0.29, 1.74, 0.74, 0.47, 1.0, 0.8, 0.81, 1.17, 1.09, -0.23, 0.83, 1.11, 1.71]} \ No newline at end of file diff --git a/annotations_filtered/h8m69o_1PoQ_filtered.json b/annotations_filtered/h8m69o_1PoQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b7f153bceaa04262152e9476bd5eea3ee149c4e --- /dev/null +++ b/annotations_filtered/h8m69o_1PoQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 12.58], [13.0, 15.45], [17.0, 27.3], [29.0, 35.83], [37.0, 37.83], [39.0, 39.53], [41.0, 44.73], [45.0, 53.25], [69.0, 72.72], [74.0, 85.6], [86.0, 86.26], [89.0, 97.8], [100.0, 101.11], [103.0, 105.63], [111.0, 113.44], [114.0, 117.8], [119.0, 120.55], [126.0, 125.83]], "keep_status": [false, true, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.51, 31.88, 32.91, 36.79, 0.0, 0.0, 38.36, 49.78, 61.67, 59.77, 0.0, 73.51, 0.0, 61.18, 64.29, 66.15, 0.0, 0.0], "audiomae_on_audioset": [[["music", 50.88], ["mains hum", 11.68], ["hum", 9.9]], [["music", 37.75], ["mains hum", 18.77], ["hum", 12.07]], [["music", 67.77], ["speech", 12.72], ["hum", 2.04]], [["music", 54.03], ["speech", 6.09], ["hum", 5.06]], null, null, [["music", 52.02], ["foghorn", 6.22], ["theremin", 5.75]], [["music", 23.49], ["speech", 17.16], ["didgeridoo", 16.32]], null, null, null, null, null, null, null, null, null, null], "duration": [8.58, 2.45, 10.3, 6.83, 0.83, 0.53, 3.73, 8.25, 3.72, 11.6, 0.26, 8.8, 1.11, 2.63, 2.44, 3.8, 1.55, -0.17]} \ No newline at end of file diff --git a/annotations_filtered/h8wzJimC5Zc_filtered.json b/annotations_filtered/h8wzJimC5Zc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..14e79bfa9bcb37ae34f81329bedaaf114b7b5fa1 --- /dev/null +++ b/annotations_filtered/h8wzJimC5Zc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.37], [19.0, 55.78], [57.0, 59.48], [62.0, 75.64], [77.0, 78.54], [80.0, 81.7], [83.0, 84.99]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 57.4, 37.95, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 43.5], ["hum", 28.14], ["mains hum", 13.88]], null, null, null], "duration": [1.37, 36.78, 2.48, 13.64, 1.54, 1.7, 1.99]} \ No newline at end of file diff --git a/annotations_filtered/h9GHe5K0kOI_filtered.json b/annotations_filtered/h9GHe5K0kOI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1dc2c046969f876254c71d61106efd3e1443ed2f --- /dev/null +++ b/annotations_filtered/h9GHe5K0kOI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.32], [8.0, 7.89], [16.0, 16.6], [17.0, 17.64], [26.0, 29.49], [34.0, 34.92], [36.0, 36.32], [37.0, 37.47], [49.0, 50.36], [68.0, 70.77], [84.0, 83.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 85.54, 0.0, 0.0, 0.0, 0.0, 61.57, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.32, -0.11, 0.6, 0.64, 3.49, 0.92, 0.32, 0.47, 1.36, 2.77, -0.21]} \ No newline at end of file diff --git a/annotations_filtered/h9Rb7mT3juI_filtered.json b/annotations_filtered/h9Rb7mT3juI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70c4310717fa0de124af69f55d8cc0dc4210695a --- /dev/null +++ b/annotations_filtered/h9Rb7mT3juI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.43], [8.0, 8.26], [11.0, 27.08], [28.0, 28.68], [30.0, 62.24], [65.0, 93.73], [97.0, 124.06], [125.0, 136.38], [137.0, 173.43], [174.0, 173.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.05, 0.0, 34.77, 0.0, 0.0, 35.11, 52.33, 38.58, 0.0, 0.0], "audiomae_on_audioset": [[["music", 65.27], ["theremin", 9.11], ["didgeridoo", 3.11]], null, [["livestock, farm animals, working animals", 46.24], ["cattle, bovinae", 23.24], ["moo", 15.97]], null, null, [["music", 66.27], ["didgeridoo", 5.39], ["throbbing", 3.77]], null, [["mains hum", 49.95], ["hum", 31.62], ["buzz", 5.56]], null, null], "duration": [3.43, 0.26, 16.08, 0.68, 32.24, 28.73, 27.06, 11.38, 36.43, -0.04]} \ No newline at end of file diff --git a/annotations_filtered/h9WDm1k4Hz4_filtered.json b/annotations_filtered/h9WDm1k4Hz4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1181efcf2eae0326c5bcfe0ee3aaa79eff5a9540 --- /dev/null +++ b/annotations_filtered/h9WDm1k4Hz4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 25.57], [28.0, 29.76], [31.0, 32.9], [35.0, 36.9], [39.0, 45.25], [46.0, 51.95], [52.0, 56.61], [58.0, 60.76], [62.0, 64.94], [66.0, 66.11], [67.0, 72.67], [73.0, 77.97], [79.0, 82.85], [84.0, 87.3], [90.0, 93.04], [95.0, 97.11], [99.0, 100.89], [102.0, 111.0], [112.0, 120.12], [121.0, 122.32], [123.0, 124.93], [126.0, 127.67], [129.0, 129.71], [132.0, 134.42], [136.0, 141.72], [143.0, 164.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [78.89, 0.0, 0.0, 0.0, 99.99, 99.84, 55.04, 100.0, 100.0, 0.0, 99.98, 100.0, 98.66, 65.91, 55.74, 100.0, 0.0, 100.0, 99.92, 0.0, 0.0, 0.0, 0.0, 100.0, 81.53, 92.8], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [17.57, 1.76, 1.9, 1.9, 6.25, 5.95, 4.61, 2.76, 2.94, 0.11, 5.67, 4.97, 3.85, 3.3, 3.04, 2.11, 1.89, 9.0, 8.12, 1.32, 1.93, 1.67, 0.71, 2.42, 5.72, 21.17]} \ No newline at end of file diff --git a/annotations_filtered/h9jsnAD4aNw_filtered.json b/annotations_filtered/h9jsnAD4aNw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09d1563f5f950a0d8f7eae7c56a52c61b940a848 --- /dev/null +++ b/annotations_filtered/h9jsnAD4aNw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.08], [12.0, 12.95], [23.0, 27.85], [30.0, 31.89], [32.0, 32.46], [41.0, 41.84], [49.0, 48.91], [54.0, 54.01], [58.0, 59.68], [62.0, 68.12], [69.0, 72.3], [73.0, 73.75], [75.0, 75.42], [87.0, 88.62], [96.0, 96.01], [102.0, 102.07], [103.0, 103.2], [104.0, 104.36], [111.0, 110.98]], "keep_status": [true, false, true, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [30.5, 0.0, 34.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.0, 34.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 21.96], ["throbbing", 13.23], ["electronic music", 7.4]], null, [["cattle, bovinae", 24.37], ["moo", 21.76], ["livestock, farm animals, working animals", 14.97]], null, null, null, null, null, null, [["throbbing", 10.51], ["music", 9.35], ["didgeridoo", 7.24]], [["fly, housefly", 26.36], ["cattle, bovinae", 11.46], ["insect", 10.06]], null, null, null, null, null, null, null, null], "duration": [8.08, 0.95, 4.85, 1.89, 0.46, 0.84, -0.09, 0.01, 1.68, 6.12, 3.3, 0.75, 0.42, 1.62, 0.01, 0.07, 0.2, 0.36, -0.02]} \ No newline at end of file diff --git a/annotations_filtered/hA063IaOHyQ_filtered.json b/annotations_filtered/hA063IaOHyQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a91809a6080cfecff724544566841c917923a2d4 --- /dev/null +++ b/annotations_filtered/hA063IaOHyQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.75], [5.0, 7.69], [10.0, 10.52], [15.0, 14.99], [29.0, 29.93], [33.0, 38.48], [49.0, 49.4], [50.0, 50.48], [59.0, 62.31], [67.0, 68.34], [77.0, 81.92], [86.0, 87.39], [94.0, 94.41], [94.0, 96.01], [100.0, 100.55], [105.0, 105.14], [110.0, 113.39], [121.0, 121.29], [129.0, 129.64], [133.0, 134.1]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 60.14, 0.0, 0.0, 0.0, 39.25, 0.0, 0.0, 99.65, 0.0, 90.78, 0.0, 0.0, 70.86, 0.0, 0.0, 54.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 45.17], ["timpani", 8.42], ["foghorn", 7.26]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.75, 2.69, 0.52, -0.01, 0.93, 5.48, 0.4, 0.48, 3.31, 1.34, 4.92, 1.39, 0.41, 2.01, 0.55, 0.14, 3.39, 0.29, 0.64, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/hA0OlCQLC0Q_filtered.json b/annotations_filtered/hA0OlCQLC0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f513b3ef0c0cfda938899396a8b1dc0cd001547 --- /dev/null +++ b/annotations_filtered/hA0OlCQLC0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 75.3]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [49.3]} \ No newline at end of file diff --git a/annotations_filtered/hA1BikUzBKc_filtered.json b/annotations_filtered/hA1BikUzBKc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88d3fdedb3a146cc7a5a34d83ae27c2dc5e980af --- /dev/null +++ b/annotations_filtered/hA1BikUzBKc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.87], [11.0, 10.61], [13.0, 13.02], [19.0, 19.4], [21.0, 21.14], [23.0, 23.09], [25.0, 26.22], [32.0, 32.34], [38.0, 38.91], [40.0, 40.0], [45.0, 60.69], [65.0, 73.6], [80.0, 98.81], [101.0, 105.93], [109.0, 109.8], [111.0, 112.43], [113.0, 114.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.65, 34.86, 33.82, 33.38, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 25.43], ["speech", 9.35], ["groan", 8.66]], [["livestock, farm animals, working animals", 23.73], ["moo", 15.15], ["music", 14.69]], [["speech", 25.57], ["music", 20.57], ["didgeridoo", 6.75]], [["speech", 39.81], ["fart", 10.36], ["music", 6.69]], null, null, null], "duration": [-0.13, -0.39, 0.02, 0.4, 0.14, 0.09, 1.22, 0.34, 0.91, 0.0, 15.69, 8.6, 18.81, 4.93, 0.8, 1.43, 1.45]} \ No newline at end of file diff --git a/annotations_filtered/hAQ2xTr4U64_filtered.json b/annotations_filtered/hAQ2xTr4U64_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..269573b818033cd94cd1c259a324f2efcfacc4ff --- /dev/null +++ b/annotations_filtered/hAQ2xTr4U64_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.43], [5.0, 5.37], [7.0, 8.65], [14.0, 14.07], [15.0, 16.39], [18.0, 17.85], [19.0, 33.17], [37.0, 37.2], [39.0, 44.83], [47.0, 48.02], [50.0, 52.71], [61.0, 62.99], [64.0, 64.39], [65.0, 68.25], [69.0, 70.71], [73.0, 73.84], [75.0, 75.36], [78.0, 79.39], [82.0, 82.56], [85.0, 88.6], [90.0, 90.0], [90.0, 90.24], [92.0, 92.67], [95.0, 95.52], [97.0, 98.22], [99.0, 100.13], [101.0, 102.51], [103.0, 105.36], [107.0, 108.38], [109.0, 114.45], [118.0, 127.82], [128.0, 130.57], [131.0, 133.95], [137.0, 138.82], [139.0, 146.77], [149.0, 149.2], [152.0, 153.37], [158.0, 160.96], [162.0, 163.17], [169.0, 169.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.79, 0.0, 98.86, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 52.92, 52.39, 73.67, 54.1, 0.0, 98.51, 0.0, 0.0, 99.85, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.43, 0.37, 1.65, 0.07, 1.39, -0.15, 14.17, 0.2, 5.83, 1.02, 2.71, 1.99, 0.39, 3.25, 1.71, 0.84, 0.36, 1.39, 0.56, 3.6, 0.0, 0.24, 0.67, 0.52, 1.22, 1.13, 1.51, 2.36, 1.38, 5.45, 9.82, 2.57, 2.95, 1.82, 7.77, 0.2, 1.37, 2.96, 1.17, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/hAU8AQ6xlw8_filtered.json b/annotations_filtered/hAU8AQ6xlw8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40fe8756bed6f49a30c43970a2843368aa20c080 --- /dev/null +++ b/annotations_filtered/hAU8AQ6xlw8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.66], [11.0, 11.87], [13.0, 14.15], [15.0, 15.43], [18.0, 18.33], [19.0, 21.44], [22.0, 23.04], [31.0, 30.92], [32.0, 34.53], [35.0, 36.05], [37.0, 39.83], [47.0, 48.42], [55.0, 55.17], [60.0, 60.49], [65.0, 67.49], [70.0, 70.93], [76.0, 76.35], [107.0, 108.06], [114.0, 115.89], [117.0, 118.15], [121.0, 121.44], [123.0, 123.43], [124.0, 123.84], [140.0, 140.34], [144.0, 145.99], [148.0, 148.51], [149.0, 148.59], [149.0, 149.13], [151.0, 151.26], [154.0, 154.85], [158.0, 158.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.29, 0.0, 0.0, 0.0, 0.0, 60.51, 0.0, 0.0, 100.0, 0.0, 99.99, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.66, 0.87, 1.15, 0.43, 0.33, 2.44, 1.04, -0.08, 2.53, 1.05, 2.83, 1.42, 0.17, 0.49, 2.49, 0.93, 0.35, 1.06, 1.89, 1.15, 0.44, 0.43, -0.16, 0.34, 1.99, 0.51, -0.41, 0.13, 0.26, 0.85, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/hAUbdHw8QG4_filtered.json b/annotations_filtered/hAUbdHw8QG4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a92dfbe23c51ae7f7fae32ed7cad7fd3b57e8369 --- /dev/null +++ b/annotations_filtered/hAUbdHw8QG4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.76], [17.0, 20.88], [24.0, 24.27], [30.0, 37.81], [41.0, 44.74], [46.0, 48.84], [53.0, 54.16], [55.0, 73.14], [80.0, 82.8], [86.0, 98.83], [102.0, 104.38], [106.0, 108.18]], "keep_status": [false, false, false, false, true, false, false, false, false, true, true, false], "silence_prob": [0.0, 30.22, 0.0, 32.19, 32.26, 32.0, 0.0, 30.65, 30.38, 29.89, 33.37, 61.97], "audiomae_on_audioset": [null, [["speech", 35.04], ["music", 28.96], ["hum", 6.16]], null, [["music", 57.02], ["throbbing", 18.65], ["hum", 4.61]], [["music", 53.22], ["throbbing", 6.54], ["synthesizer", 5.15]], [["music", 61.36], ["speech", 7.9], ["synthesizer", 6.19]], null, [["music", 71.79], ["throbbing", 7.61], ["vehicle", 2.77]], [["music", 60.98], ["throbbing", 16.6], ["hum", 6.98]], [["music", 36.87], ["speech", 28.26], ["vehicle", 3.8]], [["music", 34.06], ["vehicle", 9.81], ["car", 7.26]], null], "duration": [0.76, 3.88, 0.27, 7.81, 3.74, 2.84, 1.16, 18.14, 2.8, 12.83, 2.38, 2.18]} \ No newline at end of file diff --git a/annotations_filtered/hAbVFxYi_q0_filtered.json b/annotations_filtered/hAbVFxYi_q0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..088ee49b8ed653114aa1f2c584d49eb90a6b0b70 --- /dev/null +++ b/annotations_filtered/hAbVFxYi_q0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.79], [9.0, 14.13], [27.0, 27.28], [49.0, 49.0], [59.0, 59.76], [61.0, 61.35], [63.0, 63.27], [65.0, 65.99], [68.0, 68.13], [79.0, 79.02], [80.0, 80.11], [83.0, 84.37], [85.0, 85.14], [96.0, 96.99], [108.0, 108.21], [116.0, 118.18], [120.0, 120.97], [121.0, 124.66], [127.0, 127.82], [132.0, 132.6], [143.0, 143.4], [144.0, 145.1], [147.0, 146.67], [158.0, 159.76], [162.0, 162.41], [167.0, 167.46], [172.0, 172.05], [173.0, 173.18], [177.0, 179.83], [183.0, 185.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 82.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.0, 92.8], "audiomae_on_audioset": [null, [["speech", 69.16], ["tap", 5.81], ["music", 4.97]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.79, 5.13, 0.28, 0.0, 0.76, 0.35, 0.27, 0.99, 0.13, 0.02, 0.11, 1.37, 0.14, 0.99, 0.21, 2.18, 0.97, 3.66, 0.82, 0.6, 0.4, 1.1, -0.33, 1.76, 0.41, 0.46, 0.05, 0.18, 2.83, 2.23]} \ No newline at end of file diff --git a/annotations_filtered/hAf3IBKWubo_filtered.json b/annotations_filtered/hAf3IBKWubo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c8d02b0dca194ccf88bb1ce7c949a21a897dff5 --- /dev/null +++ b/annotations_filtered/hAf3IBKWubo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 50.8], [56.0, 95.59], [104.0, 117.58], [120.0, 119.96], [122.0, 122.35], [127.0, 146.62], [152.0, 154.04], [156.0, 166.95], [176.0, 179.88], [182.0, 239.92], [241.0, 242.28], [248.0, 253.0]], "keep_status": [false, false, false, false, false, true, true, true, true, false, false, true], "silence_prob": [0.0, 0.0, 29.94, 0.0, 0.0, 31.09, 29.77, 29.19, 30.07, 0.0, 0.0, 28.67], "audiomae_on_audioset": [null, null, [["hum", 34.65], ["mains hum", 28.47], ["speech", 15.61]], null, null, [["music", 53.17], ["sonar", 8.6], ["synthesizer", 7.76]], [["hum", 20.91], ["music", 15.68], ["buzz", 11.16]], [["speech", 40.29], ["eruption", 14.21], ["explosion", 9.09]], [["music", 36.92], ["speech", 22.46], ["hum", 4.5]], null, null, [["speech", 27.51], ["vehicle", 13.24], ["motorcycle", 6.43]]], "duration": [47.8, 39.59, 13.58, -0.04, 0.35, 19.62, 2.04, 10.95, 3.88, 57.92, 1.28, 5.0]} \ No newline at end of file diff --git a/annotations_filtered/hAiiaFAJ1mY_filtered.json b/annotations_filtered/hAiiaFAJ1mY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4bcf64e927d5ae1ee008dbd00ead2f7bd74276b --- /dev/null +++ b/annotations_filtered/hAiiaFAJ1mY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 14.47], [16.0, 22.27], [23.0, 24.46], [25.0, 31.58], [34.0, 40.42], [42.0, 98.1], [99.0, 101.73], [104.0, 109.75]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [99.99, 100.0, 0.0, 99.99, 100.0, 0.0, 99.98, 99.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [6.47, 6.27, 1.46, 6.58, 6.42, 56.1, 2.73, 5.75]} \ No newline at end of file diff --git a/annotations_filtered/hAxEEf5p3Bw_filtered.json b/annotations_filtered/hAxEEf5p3Bw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fd9ec3dda6a17571aec2bad8827cbbad49a7d0d --- /dev/null +++ b/annotations_filtered/hAxEEf5p3Bw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 8.99], [10.0, 10.45], [11.0, 38.43], [41.0, 76.13], [76.0, 76.17], [77.0, 90.8]], "keep_status": [true, false, false, false, false, false], "silence_prob": [32.22, 0.0, 31.35, 0.0, 0.0, 31.75], "audiomae_on_audioset": [[["radio", 34.3], ["noise", 22.16], ["speech", 8.51]], null, [["speech", 65.99], ["music", 6.4], ["radio", 4.8]], null, null, [["vehicle", 41.49], ["car", 27.58], ["race car, auto racing", 7.94]]], "duration": [7.99, 0.45, 27.43, 35.13, 0.17, 13.8]} \ No newline at end of file diff --git a/annotations_filtered/hBsnb6M-lr0_filtered.json b/annotations_filtered/hBsnb6M-lr0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cdffe0cddd007ecda0935f50918f7fe019cf66a1 --- /dev/null +++ b/annotations_filtered/hBsnb6M-lr0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 12.14], [15.0, 14.77], [16.0, 17.0], [18.0, 19.7], [22.0, 21.84], [26.0, 26.05], [27.0, 29.4], [30.0, 37.27], [38.0, 46.26], [50.0, 50.5], [52.0, 87.42], [90.0, 90.63], [91.0, 96.43], [97.0, 97.93], [104.0, 105.97], [107.0, 108.31], [109.0, 112.82]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [41.56, 0.0, 0.0, 0.0, 0.0, 0.0, 58.55, 40.12, 33.12, 0.0, 0.0, 0.0, 35.37, 0.0, 0.0, 0.0, 32.11], "audiomae_on_audioset": [[["whale vocalization", 36.87], ["noise", 9.06], ["sidetone", 6.8]], null, null, null, null, null, null, [["music", 69.11], ["speech", 8.97], ["electronic music", 2.88]], [["music", 50.65], ["speech", 25.81], ["didgeridoo", 9.38]], null, null, null, [["music", 63.33], ["speech", 9.53], ["electric shaver, electric razor", 2.84]], null, null, null, [["music", 43.69], ["speech", 30.49], ["didgeridoo", 3.66]]], "duration": [6.14, -0.23, 1.0, 1.7, -0.16, 0.05, 2.4, 7.27, 8.26, 0.5, 35.42, 0.63, 5.43, 0.93, 1.97, 1.31, 3.82]} \ No newline at end of file diff --git a/annotations_filtered/hCN8UAdH55A_filtered.json b/annotations_filtered/hCN8UAdH55A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb3199b64f905e9dabdff9064243a4b3999a0a10 --- /dev/null +++ b/annotations_filtered/hCN8UAdH55A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 80.67], [82.0, 82.16], [83.0, 84.67], [89.0, 89.48], [91.0, 97.17], [98.0, 98.78], [99.0, 99.47], [100.0, 100.2], [101.0, 101.87], [103.0, 105.19], [106.0, 106.47], [108.0, 108.13], [109.0, 110.32], [111.0, 111.38], [114.0, 115.65], [119.0, 121.07], [122.0, 123.55], [127.0, 128.01], [129.0, 129.36], [140.0, 143.58], [145.0, 145.96], [147.0, 146.96], [149.0, 149.79], [153.0, 153.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 66.63, 0.0, 0.0, 0.0, 0.0, 69.61, 0.0, 0.0, 0.0, 0.0, 0.0, 32.53, 0.0, 0.0, 0.0, 31.53, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 15.87], ["hum", 7.6], ["rumble", 6.23]], null, null, null, [["bee, wasp, etc.", 22.64], ["insect", 8.47], ["vehicle", 6.24]], null, null, null, null], "duration": [63.67, 0.16, 1.67, 0.48, 6.17, 0.78, 0.47, 0.2, 0.87, 2.19, 0.47, 0.13, 1.32, 0.38, 1.65, 2.07, 1.55, 1.01, 0.36, 3.58, 0.96, -0.04, 0.79, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/hD7KaqFoSq0_filtered.json b/annotations_filtered/hD7KaqFoSq0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d6690765d9290d511ebe78f1d30979dc3303edf --- /dev/null +++ b/annotations_filtered/hD7KaqFoSq0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 32.51], [34.0, 61.82]], "keep_status": [false, false], "silence_prob": [0.0, 31.2], "audiomae_on_audioset": [null, [["music", 66.19], ["didgeridoo", 9.58], ["musical instrument", 3.16]]], "duration": [0.51, 27.82]} \ No newline at end of file diff --git a/annotations_filtered/hDA_Bn7UhlA_filtered.json b/annotations_filtered/hDA_Bn7UhlA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..667b9c284098f410b89af2f39169ad7381867e92 --- /dev/null +++ b/annotations_filtered/hDA_Bn7UhlA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 37.2], [37.0, 37.81], [39.0, 39.45], [40.0, 40.81], [42.0, 43.12], [44.0, 44.07], [46.0, 45.86], [48.0, 49.44], [50.0, 50.85], [52.0, 54.87], [56.0, 56.91], [58.0, 59.48], [60.0, 63.1], [66.0, 66.5], [67.0, 68.13], [69.0, 69.53], [71.0, 73.14], [77.0, 79.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [94.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.13, 0.0, 0.0, 37.26, 0.0, 0.0, 0.0, 43.33, 36.02], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.84], ["crow", 21.63], ["animal", 16.82]], null, null, null, [["speech", 31.25], ["fart", 22.33], ["hum", 5.66]], [["speech", 47.18], ["animal", 7.25], ["sheep", 7.1]]], "duration": [11.2, 0.81, 0.45, 0.81, 1.12, 0.07, -0.14, 1.44, 0.85, 2.87, 0.91, 1.48, 3.1, 0.5, 1.13, 0.53, 2.14, 2.17]} \ No newline at end of file diff --git a/annotations_filtered/hDH1ilg9NMU_filtered.json b/annotations_filtered/hDH1ilg9NMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09e3a97566e84f0ae41a3d69dd651c3d70760b0e --- /dev/null +++ b/annotations_filtered/hDH1ilg9NMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 14.94], [17.0, 17.86], [20.0, 21.03], [22.0, 22.55], [33.0, 32.88], [34.0, 34.45], [37.0, 37.1], [40.0, 41.13], [43.0, 43.02], [47.0, 47.04], [48.0, 48.68], [49.0, 50.14], [53.0, 53.06], [54.0, 54.45], [62.0, 62.45], [64.0, 65.87], [67.0, 71.9], [86.0, 89.01], [91.0, 91.1], [105.0, 105.44], [107.0, 107.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.39, 53.59, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 39.67], ["chirp tone", 15.17], ["stomach rumble", 9.93]], null, null, null, null], "duration": [-0.06, 0.86, 1.03, 0.55, -0.12, 0.45, 0.1, 1.13, 0.02, 0.04, 0.68, 1.14, 0.06, 0.45, 0.45, 1.87, 4.9, 3.01, 0.1, 0.44, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/hE3jShGPscQ_filtered.json b/annotations_filtered/hE3jShGPscQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad8679e048d76d92e654546f6e2be89033dcafa5 --- /dev/null +++ b/annotations_filtered/hE3jShGPscQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.32], [5.0, 5.49], [7.0, 6.62], [9.0, 9.76], [12.0, 13.44], [14.0, 16.01], [25.0, 26.47], [31.0, 85.18], [86.0, 86.91], [88.0, 88.13], [90.0, 90.8], [92.0, 95.0], [96.0, 96.55], [99.0, 99.59], [101.0, 101.44], [104.0, 104.41], [105.0, 116.29], [117.0, 116.67], [117.0, 116.95], [117.0, 144.96], [145.0, 152.2], [161.0, 175.44], [177.0, 177.58]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 39.7, 0.0, 0.0, 0.0, 0.0, 0.0, 38.14, 0.0, 0.0, 0.0, 0.0, 48.52, 0.0, 0.0, 31.66, 30.59, 33.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 17.45], ["dog", 13.68], ["howl", 11.72]], null, null, null, null, null, [["mains hum", 31.23], ["hum", 25.27], ["music", 5.35]], null, null, null, null, [["music", 56.47], ["theremin", 17.73], ["musical instrument", 4.71]], null, null, [["speech", 35.82], ["hum", 23.18], ["mains hum", 8.79]], [["music", 60.2], ["didgeridoo", 12.04], ["hum", 5.47]], [["music", 59.02], ["didgeridoo", 21.21], ["synthesizer", 3.96]], null], "duration": [1.32, 0.49, -0.38, 0.76, 1.44, 2.01, 1.47, 54.18, 0.91, 0.13, 0.8, 3.0, 0.55, 0.59, 0.44, 0.41, 11.29, -0.33, -0.05, 27.96, 7.2, 14.44, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/hE5rsmIsYPA_filtered.json b/annotations_filtered/hE5rsmIsYPA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..393f74ae66ed48c2b7c00b2c1dd8daa078e05720 --- /dev/null +++ b/annotations_filtered/hE5rsmIsYPA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[66.0, 67.22], [68.0, 95.76], [96.0, 97.82], [99.0, 100.11]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 47.5, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 23.23], ["speech", 14.7], ["mains hum", 11.86]], null, null], "duration": [1.22, 27.76, 1.82, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/hE7Nc_la-l0_filtered.json b/annotations_filtered/hE7Nc_la-l0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e243f31082d5e9cffea8403c718877d74b12c6e --- /dev/null +++ b/annotations_filtered/hE7Nc_la-l0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.19], [4.0, 4.53], [14.0, 14.18], [16.0, 16.71], [27.0, 27.36], [39.0, 39.36], [41.0, 41.93], [55.0, 59.27], [61.0, 61.72], [64.0, 64.05], [65.0, 65.91], [67.0, 67.14], [68.0, 68.61], [70.0, 70.44], [75.0, 75.95], [81.0, 81.75], [83.0, 83.17], [93.0, 93.73], [95.0, 97.11], [97.0, 98.14], [103.0, 107.76], [108.0, 109.34], [109.0, 110.34], [112.0, 112.23], [113.0, 113.53], [115.0, 118.83], [120.0, 123.57], [126.0, 126.37], [128.0, 129.98], [131.0, 134.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.76, 99.96, 0.0, 0.0, 94.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.19, 0.53, 0.18, 0.71, 0.36, 0.36, 0.93, 4.27, 0.72, 0.05, 0.91, 0.14, 0.61, 0.44, 0.95, 0.75, 0.17, 0.73, 2.11, 1.14, 4.76, 1.34, 1.34, 0.23, 0.53, 3.83, 3.57, 0.37, 1.98, 3.86]} \ No newline at end of file diff --git a/annotations_filtered/hEDeIvU1si8_filtered.json b/annotations_filtered/hEDeIvU1si8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3e1c15f034bc0dd412c9cae04e5d86ab27f82c1 --- /dev/null +++ b/annotations_filtered/hEDeIvU1si8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.76], [11.0, 11.38], [16.0, 19.48], [19.0, 19.52], [20.0, 19.55], [21.0, 29.46], [34.0, 42.94], [44.0, 44.71], [47.0, 50.06], [51.0, 60.0], [61.0, 67.42], [71.0, 81.03], [83.0, 83.29], [84.0, 84.2], [92.0, 95.4], [97.0, 97.34], [99.0, 99.67], [100.0, 99.94], [101.0, 101.98], [106.0, 107.89], [111.0, 121.09], [123.0, 134.69], [137.0, 161.18], [165.0, 165.62], [166.0, 167.32]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 89.19, 0.0, 0.0, 54.56, 44.07, 0.0, 33.16, 32.77, 33.76, 33.16, 0.0, 0.0, 32.45, 0.0, 0.0, 0.0, 0.0, 0.0, 34.8, 29.49, 37.65, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 39.43], ["didgeridoo", 20.82], ["music", 13.29]], null, [["speech", 46.78], ["crowd", 6.25], ["cattle, bovinae", 5.57]], [["speech", 87.16], ["crowd", 3.06], ["applause", 2.12]], [["speech", 80.42], ["livestock, farm animals, working animals", 3.76], ["sheep", 3.62]], [["speech", 21.23], ["livestock, farm animals, working animals", 14.44], ["animal", 13.61]], null, null, [["didgeridoo", 69.8], ["music", 19.52], ["beatboxing", 4.85]], null, null, null, null, null, [["didgeridoo", 67.63], ["music", 5.45], ["cattle, bovinae", 5.38]], [["cheering", 30.88], ["speech", 25.15], ["crowd", 12.8]], [["speech", 34.85], ["music", 10.89], ["whale vocalization", 10.15]], null, null], "duration": [1.76, 0.38, 3.48, 0.52, -0.45, 8.46, 8.94, 0.71, 3.06, 9.0, 6.42, 10.03, 0.29, 0.2, 3.4, 0.34, 0.67, -0.06, 0.98, 1.89, 10.09, 11.69, 24.18, 0.62, 1.32]} \ No newline at end of file diff --git a/annotations_filtered/hEH49mSRWGw_filtered.json b/annotations_filtered/hEH49mSRWGw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f68fccb8e892fa515357127c0c6d25c21352ddd4 --- /dev/null +++ b/annotations_filtered/hEH49mSRWGw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.42], [14.0, 17.59], [24.0, 25.39], [29.0, 31.65], [33.0, 34.69], [37.0, 42.13], [53.0, 56.19], [58.0, 58.62], [61.0, 61.97], [67.0, 68.3], [71.0, 71.56], [79.0, 80.2], [91.0, 91.59], [93.0, 95.07], [96.0, 98.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 86.27, 0.0, 57.89, 0.0, 36.05, 57.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 38.67], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 52.23], ["music", 40.14], ["thunk", 2.93]], null, null, null, null, null, null, null, null, [["music", 27.18], ["thunk", 15.05], ["speech", 14.81]]], "duration": [0.42, 3.59, 1.39, 2.65, 1.69, 5.13, 3.19, 0.62, 0.97, 1.3, 0.56, 1.2, 0.59, 2.07, 2.63]} \ No newline at end of file diff --git a/annotations_filtered/hERyYjy3O3U_filtered.json b/annotations_filtered/hERyYjy3O3U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26a04a60d2c433cdfe5b8ee56337f46d11f44575 --- /dev/null +++ b/annotations_filtered/hERyYjy3O3U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 33.08], [34.0, 33.98], [37.0, 37.32], [41.0, 41.32], [42.0, 42.03], [44.0, 44.05], [47.0, 47.65], [53.0, 53.3]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.08, -0.02, 0.32, 0.32, 0.03, 0.05, 0.65, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/hEXsOOVWuGA_filtered.json b/annotations_filtered/hEXsOOVWuGA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84cd2ba8ce59ccf8a76fbd9dea3bd4c1f74796d1 --- /dev/null +++ b/annotations_filtered/hEXsOOVWuGA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.15], [4.0, 8.85], [10.0, 11.06], [12.0, 11.84], [13.0, 14.44], [15.0, 17.81], [20.0, 64.29], [66.0, 88.03], [89.0, 90.39], [91.0, 102.39], [104.0, 106.42], [108.0, 109.66], [113.0, 114.81], [118.0, 123.33], [125.0, 126.91]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 81.0, 0.0, 0.0, 0.0, 49.36, 0.0, 30.89, 0.0, 91.81, 94.22, 0.0, 0.0, 84.62, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 49.59], ["synthesizer", 5.02], ["sound effect", 4.82]], null, [["music", 20.86], ["hum", 9.68], ["whack, thwack", 8.84]], null, null, null, null, null, null, null], "duration": [1.15, 4.85, 1.06, -0.16, 1.44, 2.81, 44.29, 22.03, 1.39, 11.39, 2.42, 1.66, 1.81, 5.33, 1.91]} \ No newline at end of file diff --git a/annotations_filtered/hEY2L9sXjwU_filtered.json b/annotations_filtered/hEY2L9sXjwU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c534de7c59e5c39f86bf57b117317621eda0e2d5 --- /dev/null +++ b/annotations_filtered/hEY2L9sXjwU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 18.76], [19.0, 26.54], [32.0, 80.76], [83.0, 89.77], [90.0, 90.58], [92.0, 101.02], [104.0, 116.95], [120.0, 121.2], [122.0, 124.31], [126.0, 130.98]], "keep_status": [false, false, false, true, false, false, false, false, false, false], "silence_prob": [83.34, 64.07, 0.0, 36.96, 0.0, 38.47, 44.23, 0.0, 78.38, 84.07], "audiomae_on_audioset": [null, null, null, [["music", 61.44], ["chant", 2.35], ["middle eastern music", 1.77]], null, [["music", 82.05], ["vocal music", 1.91], ["mantra", 1.47]], [["music", 86.15], ["musical instrument", 1.03], ["singing", 0.94]], null, null, null], "duration": [15.76, 7.54, 48.76, 6.77, 0.58, 9.02, 12.95, 1.2, 2.31, 4.98]} \ No newline at end of file diff --git a/annotations_filtered/hEZcqWRB2iU_filtered.json b/annotations_filtered/hEZcqWRB2iU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aca13d1354cc0448fe797ed0fd5cd0ed3dc2004c --- /dev/null +++ b/annotations_filtered/hEZcqWRB2iU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.55], [15.0, 15.79], [23.0, 25.19], [27.0, 27.7], [29.0, 29.71], [31.0, 34.47], [36.0, 36.86], [39.0, 39.7], [43.0, 43.66], [45.0, 46.36], [48.0, 131.6]], "keep_status": [false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.88, 0.0, 0.0, 32.44, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 26.55], ["music", 7.75], ["fly, housefly", 5.08]], null, null, [["animal", 20.99], ["whale vocalization", 18.93], ["wild animals", 10.19]], null, null, null, null, null], "duration": [0.55, 0.79, 2.19, 0.7, 0.71, 3.47, 0.86, 0.7, 0.66, 1.36, 83.6]} \ No newline at end of file diff --git a/annotations_filtered/hFJlpOjXf9s_filtered.json b/annotations_filtered/hFJlpOjXf9s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2de2d9323a23295028a6dc808ef89261d5133116 --- /dev/null +++ b/annotations_filtered/hFJlpOjXf9s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.68], [6.0, 8.92], [10.0, 10.69], [11.0, 14.76], [15.0, 17.59], [19.0, 52.07], [55.0, 117.86], [118.0, 120.82], [122.0, 127.57]], "keep_status": [false, true, false, false, false, false, false, false, false], "silence_prob": [100.0, 38.55, 0.0, 100.0, 100.0, 0.0, 0.0, 74.6, 95.78], "audiomae_on_audioset": [null, [["whale vocalization", 18.01], ["shofar", 9.62], ["gong", 7.89]], null, null, null, null, null, null, null], "duration": [2.68, 2.92, 0.69, 3.76, 2.59, 33.07, 62.86, 2.82, 5.57]} \ No newline at end of file diff --git a/annotations_filtered/hF_9GQFISow_filtered.json b/annotations_filtered/hF_9GQFISow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b34f39dfa7db41564337ee72694bbf2e9b8b3356 --- /dev/null +++ b/annotations_filtered/hF_9GQFISow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 19.16], [24.0, 25.15], [28.0, 28.54], [31.0, 38.69], [44.0, 44.19], [48.0, 50.3], [50.0, 52.02], [71.0, 71.25], [86.0, 86.41], [104.0, 105.14], [109.0, 118.98], [130.0, 130.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.83, 0.0, 0.0, 29.66, 0.0, 31.89, 30.99, 0.0, 0.0, 0.0, 31.72, 0.0], "audiomae_on_audioset": [[["music", 81.39], ["synthesizer", 2.44], ["sampler", 1.79]], null, null, [["music", 68.12], ["synthesizer", 7.63], ["musical instrument", 3.36]], null, [["music", 57.87], ["speech", 23.91], ["livestock, farm animals, working animals", 1.14]], [["speech", 43.17], ["music", 34.31], ["synthesizer", 3.4]], null, null, null, [["music", 62.02], ["synthesizer", 10.06], ["speech", 7.39]], null], "duration": [2.16, 1.15, 0.54, 7.69, 0.19, 2.3, 2.02, 0.25, 0.41, 1.14, 9.98, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/hFfQhVgQU44_filtered.json b/annotations_filtered/hFfQhVgQU44_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97596821912127285637cea331dca26855616048 --- /dev/null +++ b/annotations_filtered/hFfQhVgQU44_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.82], [13.0, 13.53], [15.0, 14.99], [22.0, 22.44], [25.0, 25.42], [30.0, 31.31], [40.0, 45.05], [46.0, 46.8], [80.0, 83.32], [86.0, 86.39], [96.0, 97.95], [99.0, 100.45], [155.0, 155.53], [158.0, 158.58], [160.0, 161.37], [166.0, 167.41], [187.0, 189.85], [193.0, 195.12], [202.0, 202.69], [204.0, 206.42], [219.0, 221.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [83.88, 0.0, 0.0, 0.0, 0.0, 0.0, 46.68, 0.0, 50.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.66, 31.04, 0.0, 35.47, 37.35], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 75.03], ["synthesizer", 8.75], ["throbbing", 2.96]], null, null, null, null, null, null, null, null, null, [["music", 24.42], ["mosquito", 4.85], ["carnatic music", 3.97]], [["music", 49.01], ["speech", 16.79], ["synthesizer", 5.8]], null, [["speech", 58.8], ["music", 21.93], ["quack", 6.46]], [["music", 72.39], ["effects unit", 6.26], ["guitar", 5.21]]], "duration": [4.82, 0.53, -0.01, 0.44, 0.42, 1.31, 5.05, 0.8, 3.32, 0.39, 1.95, 1.45, 0.53, 0.58, 1.37, 1.41, 2.85, 2.12, 0.69, 2.42, 2.19]} \ No newline at end of file diff --git a/annotations_filtered/hFjIRET64r4_filtered.json b/annotations_filtered/hFjIRET64r4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c6073b645a525cfd77721ea536c78b813d1b511 --- /dev/null +++ b/annotations_filtered/hFjIRET64r4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.08], [12.0, 11.89], [13.0, 14.35], [15.0, 16.5], [18.0, 19.16], [30.0, 30.18], [31.0, 31.51], [33.0, 35.38], [39.0, 39.12], [40.0, 46.06], [48.0, 48.52], [51.0, 51.93], [52.0, 53.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.98, 0.0, 46.12, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["mains hum", 40.13], ["hum", 28.29], ["noise", 10.02]], null, null, null], "duration": [0.08, -0.11, 1.35, 1.5, 1.16, 0.18, 0.51, 2.38, 0.12, 6.06, 0.52, 0.93, 1.25]} \ No newline at end of file diff --git a/annotations_filtered/hFoLv3bTLSc_filtered.json b/annotations_filtered/hFoLv3bTLSc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec84b0ec3c87f362b830f37221ecb5bfe048ac2a --- /dev/null +++ b/annotations_filtered/hFoLv3bTLSc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.48], [13.0, 15.94], [17.0, 16.73], [17.0, 18.0], [28.0, 31.6], [34.0, 37.02], [38.0, 43.11], [45.0, 46.85], [50.0, 51.65], [54.0, 56.24], [61.0, 63.39], [68.0, 73.23], [74.0, 77.45], [81.0, 80.97], [82.0, 88.33], [90.0, 89.92]], "keep_status": [false, true, false, false, true, false, false, false, false, true, true, false, true, false, false, false], "silence_prob": [0.0, 49.59, 0.0, 0.0, 48.14, 99.26, 64.29, 0.0, 0.0, 35.05, 46.75, 36.13, 41.89, 0.0, 38.11, 0.0], "audiomae_on_audioset": [null, [["speech", 44.44], ["sidetone", 8.72], ["whale vocalization", 4.32]], null, null, [["animal", 24.28], ["speech", 21.89], ["wild animals", 9.28]], null, null, null, null, [["music", 48.58], ["musical instrument", 10.53], ["trombone", 4.86]], [["cattle, bovinae", 20.39], ["livestock, farm animals, working animals", 18.76], ["moo", 16.84]], [["boing", 28.27], ["speech", 24.68], ["fly, housefly", 21.35]], [["speech", 20.23], ["music", 17.03], ["throbbing", 12.82]], null, [["livestock, farm animals, working animals", 48.04], ["cattle, bovinae", 29.05], ["moo", 20.79]], null], "duration": [0.48, 2.94, -0.27, 1.0, 3.6, 3.02, 5.11, 1.85, 1.65, 2.24, 2.39, 5.23, 3.45, -0.03, 6.33, -0.08]} \ No newline at end of file diff --git a/annotations_filtered/hG6DmzzU8m0_filtered.json b/annotations_filtered/hG6DmzzU8m0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..589e60797a4acfa1f163b7b5a79bf53e39badb78 --- /dev/null +++ b/annotations_filtered/hG6DmzzU8m0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.02], [11.0, 11.7], [24.0, 24.81], [26.0, 26.82], [28.0, 28.07], [28.0, 32.37], [35.0, 35.21]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 48.91, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 28.05], ["speech", 27.68], ["didgeridoo", 17.03]], null], "duration": [0.02, 0.7, 0.81, 0.82, 0.07, 4.37, 0.21]} \ No newline at end of file diff --git a/annotations_filtered/hGOHE1zqEmY_filtered.json b/annotations_filtered/hGOHE1zqEmY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..603bce37c19a448e9e04cd1c974495ec89225c7e --- /dev/null +++ b/annotations_filtered/hGOHE1zqEmY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.01], [8.0, 8.09], [11.0, 11.38], [14.0, 20.41], [22.0, 27.67], [29.0, 40.54], [41.0, 41.52], [43.0, 46.06], [47.0, 49.82], [55.0, 57.01], [60.0, 62.43], [63.0, 68.79], [70.0, 70.88], [73.0, 74.01], [75.0, 75.54], [77.0, 77.55], [81.0, 81.67], [83.0, 83.61], [85.0, 86.48], [89.0, 89.18], [91.0, 91.37], [94.0, 93.99], [95.0, 95.28], [96.0, 96.58], [98.0, 104.46], [106.0, 106.1], [106.0, 106.49], [113.0, 114.32]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [42.35, 0.0, 0.0, 37.38, 72.75, 47.16, 0.0, 99.68, 46.72, 97.54, 40.36, 34.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.24, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 75.13], ["speech synthesizer", 4.94], ["hum", 3.34]], null, null, [["speech", 59.43], ["mains hum", 10.64], ["hum", 7.03]], null, [["sidetone", 23.45], ["electric shaver, electric razor", 13.73], ["mains hum", 12.74]], null, null, [["speech", 56.52], ["busy signal", 7.74], ["dial tone", 6.06]], null, [["speech", 44.32], ["sine wave", 21.29], ["dial tone", 19.86]], [["speech", 75.02], ["didgeridoo", 6.16], ["music", 5.37]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 77.71], ["typewriter", 2.79], ["hands", 2.69]], null, null, null], "duration": [3.01, 0.09, 0.38, 6.41, 5.67, 11.54, 0.52, 3.06, 2.82, 2.01, 2.43, 5.79, 0.88, 1.01, 0.54, 0.55, 0.67, 0.61, 1.48, 0.18, 0.37, -0.01, 0.28, 0.58, 6.46, 0.1, 0.49, 1.32]} \ No newline at end of file diff --git a/annotations_filtered/hGgWUKweXzI_filtered.json b/annotations_filtered/hGgWUKweXzI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1dca56a3a9d5338831dcd4ef955dd360de0949a --- /dev/null +++ b/annotations_filtered/hGgWUKweXzI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.79], [23.0, 29.37], [31.0, 122.94], [125.0, 126.72]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 32.13, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 47.31], ["speech", 17.82], ["boing", 12.6]], null, null], "duration": [1.79, 6.37, 91.94, 1.72]} \ No newline at end of file diff --git a/annotations_filtered/hGuXSd2s0jI_filtered.json b/annotations_filtered/hGuXSd2s0jI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b7c370fe3eb41532e580ad3e169e7201d78bf71 --- /dev/null +++ b/annotations_filtered/hGuXSd2s0jI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 22.27], [25.0, 26.43], [28.0, 33.78], [35.0, 37.59], [43.0, 43.93], [46.0, 56.19], [57.0, 97.02]], "keep_status": [true, false, false, false, false, false, false], "silence_prob": [37.03, 0.0, 38.97, 52.39, 0.0, 64.86, 0.0], "audiomae_on_audioset": [[["music", 32.41], ["speech", 13.38], ["musical instrument", 5.82]], null, [["fly, housefly", 44.39], ["insect", 33.62], ["bee, wasp, etc.", 11.88]], null, null, null, null], "duration": [4.27, 1.43, 5.78, 2.59, 0.93, 10.19, 40.02]} \ No newline at end of file diff --git a/annotations_filtered/hH0av1iDYVI_filtered.json b/annotations_filtered/hH0av1iDYVI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..188d9589f3037ad4ceaab265d520cdf3b420a82f --- /dev/null +++ b/annotations_filtered/hH0av1iDYVI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.07], [17.0, 19.03], [20.0, 21.27], [23.0, 23.08], [25.0, 29.88], [33.0, 54.9], [61.0, 62.31], [63.0, 63.9], [65.0, 80.1], [81.0, 85.99], [87.0, 107.59], [109.0, 111.97], [112.0, 127.58]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false, true], "silence_prob": [0.0, 76.86, 0.0, 0.0, 51.18, 40.82, 0.0, 0.0, 34.49, 37.46, 35.68, 39.52, 34.46], "audiomae_on_audioset": [null, null, null, null, null, [["music", 58.98], ["synthesizer", 5.06], ["musical instrument", 4.77]], null, null, [["music", 40.02], ["fly, housefly", 12.11], ["groan", 12.05]], [["boing", 60.55], ["music", 21.9], ["speech", 3.03]], [["music", 43.94], ["fly, housefly", 21.93], ["insect", 6.0]], [["music", 78.0], ["synthesizer", 2.02], ["musical instrument", 1.58]], [["music", 27.46], ["boing", 16.27], ["whack, thwack", 13.0]]], "duration": [1.07, 2.03, 1.27, 0.08, 4.88, 21.9, 1.31, 0.9, 15.1, 4.99, 20.59, 2.97, 15.58]} \ No newline at end of file diff --git a/annotations_filtered/hH1TgDvC7sY_filtered.json b/annotations_filtered/hH1TgDvC7sY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe286a82b2211f6dee38899166fd2e0eff3c9605 --- /dev/null +++ b/annotations_filtered/hH1TgDvC7sY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 20.76], [21.0, 21.0], [21.0, 22.2], [24.0, 56.29], [57.0, 69.18], [71.0, 71.56], [74.0, 119.94], [120.0, 120.99], [123.0, 154.7], [157.0, 157.81], [159.0, 161.03], [162.0, 162.8], [163.0, 164.94], [169.0, 169.92], [170.0, 181.45]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [32.26, 0.0, 0.0, 0.0, 45.43, 0.0, 0.0, 0.0, 0.0, 0.0, 59.86, 0.0, 0.0, 0.0, 34.43], "audiomae_on_audioset": [[["speech", 19.33], ["electric shaver, electric razor", 13.22], ["groan", 8.52]], null, null, null, [["hum", 48.58], ["mains hum", 16.4], ["throbbing", 15.72]], null, null, null, null, null, null, null, null, null, [["bee, wasp, etc.", 23.87], ["fly, housefly", 11.02], ["buzz", 9.47]]], "duration": [11.76, 0.0, 1.2, 32.29, 12.18, 0.56, 45.94, 0.99, 31.7, 0.81, 2.03, 0.8, 1.94, 0.92, 11.45]} \ No newline at end of file diff --git a/annotations_filtered/hH3peh07eq4_filtered.json b/annotations_filtered/hH3peh07eq4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a22fa9d5b872159f8a42448a6c18e200862d19d --- /dev/null +++ b/annotations_filtered/hH3peh07eq4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.09], [3.0, 3.84], [15.0, 16.31], [18.0, 18.37], [31.0, 32.09], [36.0, 36.54], [41.0, 41.84], [44.0, 44.61], [56.0, 56.39], [57.0, 58.19], [65.0, 65.01], [67.0, 67.24], [78.0, 80.38], [82.0, 83.46], [95.0, 95.25], [112.0, 112.26], [113.0, 114.22], [115.0, 115.74], [134.0, 134.03], [146.0, 152.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.09, 0.84, 1.31, 0.37, 1.09, 0.54, 0.84, 0.61, 0.39, 1.19, 0.01, 0.24, 2.38, 1.46, 0.25, 0.26, 1.22, 0.74, 0.03, 6.68]} \ No newline at end of file diff --git a/annotations_filtered/hHC_R7ATGuI_filtered.json b/annotations_filtered/hHC_R7ATGuI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/hHC_R7ATGuI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/hHKUBg_c9no_filtered.json b/annotations_filtered/hHKUBg_c9no_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd5b342ab90638f5d628d75e6d6e240aef162e02 --- /dev/null +++ b/annotations_filtered/hHKUBg_c9no_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 38.26], [38.0, 39.24], [41.0, 41.84], [44.0, 58.56], [60.0, 60.07], [62.0, 63.27], [64.0, 94.96], [98.0, 98.78], [107.0, 107.72], [113.0, 117.31], [119.0, 120.26], [121.0, 121.83], [123.0, 123.62]], "keep_status": [false, false, false, true, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.06, 0.0, 0.0, 0.0, 0.0, 0.0, 46.22, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["breaking", 28.22], ["sound effect", 13.66], ["whack, thwack", 11.54]], null, null, null, null, null, [["music", 56.71], ["didgeridoo", 7.2], ["double bass", 4.91]], null, null, null], "duration": [0.26, 1.24, 0.84, 14.56, 0.07, 1.27, 30.96, 0.78, 0.72, 4.31, 1.26, 0.83, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/hHVZ_viVD9E_filtered.json b/annotations_filtered/hHVZ_viVD9E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17ffd4fa8b8e1eb7dd41ce811aa59dee63fddebb --- /dev/null +++ b/annotations_filtered/hHVZ_viVD9E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.74], [16.0, 16.46], [20.0, 20.53], [27.0, 28.16], [29.0, 29.88], [31.0, 31.58], [32.0, 33.2], [34.0, 34.94], [39.0, 39.9], [48.0, 48.63], [51.0, 51.41], [63.0, 63.68], [75.0, 76.89], [82.0, 83.88], [85.0, 85.4], [90.0, 90.46], [93.0, 94.69], [98.0, 100.2], [101.0, 102.1], [104.0, 107.82], [109.0, 109.8], [112.0, 113.58], [116.0, 116.67], [118.0, 117.8], [120.0, 120.26], [130.0, 130.4], [131.0, 132.02], [135.0, 134.99], [135.0, 137.12], [138.0, 139.72], [142.0, 145.86], [147.0, 150.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.8, 0.0, 88.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.74, 0.0, 62.07, 34.09], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 39.64], ["mains hum", 12.3], ["busy signal", 5.86]], null, null, [["music", 43.41], ["ambient music", 13.79], ["theremin", 8.42]]], "duration": [0.74, 0.46, 0.53, 1.16, 0.88, 0.58, 1.2, 0.94, 0.9, 0.63, 0.41, 0.68, 1.89, 1.88, 0.4, 0.46, 1.69, 2.2, 1.1, 3.82, 0.8, 1.58, 0.67, -0.2, 0.26, 0.4, 1.02, -0.01, 2.12, 1.72, 3.86, 3.62]} \ No newline at end of file diff --git a/annotations_filtered/hHWcoaM_59E_filtered.json b/annotations_filtered/hHWcoaM_59E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e3387afeb4f1da23d9c93bbe706ad1b7c098f52 --- /dev/null +++ b/annotations_filtered/hHWcoaM_59E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.86], [9.0, 11.55], [12.0, 13.2], [14.0, 15.33], [18.0, 19.65], [22.0, 22.3], [23.0, 24.65], [26.0, 27.55], [28.0, 29.83], [32.0, 32.86], [36.0, 36.98], [38.0, 37.71], [38.0, 39.95], [40.0, 41.23], [43.0, 46.09], [49.0, 50.38], [51.0, 53.2], [56.0, 56.37], [59.0, 61.45], [66.0, 66.6], [67.0, 71.54], [74.0, 75.64], [77.0, 77.43], [80.0, 82.09], [84.0, 84.92], [86.0, 88.13], [90.0, 93.58], [95.0, 96.42], [98.0, 98.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 55.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.91, 0.0, 46.4, 0.0, 49.5, 0.0, 44.57, 0.0, 0.0, 41.56, 0.0, 47.94, 45.05, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.54], ["speech", 12.1], ["gong", 7.08]], null, [["music", 53.65], ["guitar", 14.82], ["musical instrument", 5.93]], null, [["music", 68.18], ["musical instrument", 7.62], ["plucked string instrument", 4.57]], null, [["music", 42.28], ["guitar", 14.56], ["musical instrument", 10.41]], null, null, [["music", 36.63], ["guitar", 10.86], ["quack", 8.8]], null, [["music", 77.49], ["musical instrument", 5.88], ["plucked string instrument", 3.99]], [["music", 49.01], ["sitar", 13.1], ["didgeridoo", 3.74]], null, null], "duration": [1.86, 2.55, 1.2, 1.33, 1.65, 0.3, 1.65, 1.55, 1.83, 0.86, 0.98, -0.29, 1.95, 1.23, 3.09, 1.38, 2.2, 0.37, 2.45, 0.6, 4.54, 1.64, 0.43, 2.09, 0.92, 2.13, 3.58, 1.42, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/hHZs6i30Xr4_filtered.json b/annotations_filtered/hHZs6i30Xr4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e09c993367e0a00cf5a612237f1e6848d2561fa9 --- /dev/null +++ b/annotations_filtered/hHZs6i30Xr4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.55], [24.0, 24.75], [27.0, 28.27], [30.0, 30.65], [49.0, 49.72], [51.0, 51.0], [52.0, 53.97], [60.0, 61.97], [63.0, 72.12], [73.0, 73.67], [77.0, 79.73], [81.0, 81.92], [85.0, 87.51], [88.0, 89.4], [92.0, 93.21], [94.0, 95.72], [97.0, 103.87], [105.0, 107.37], [109.0, 109.43], [112.0, 112.33], [113.0, 115.59], [117.0, 117.78], [119.0, 118.86], [120.0, 120.02], [120.0, 120.97], [121.0, 122.93], [125.0, 126.71], [127.0, 127.36], [127.0, 127.48], [129.0, 129.76], [136.0, 136.56], [137.0, 139.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.71, 0.0, 100.0, 0.0, 99.97, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 87.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.55, 0.75, 1.27, 0.65, 0.72, 0.0, 1.97, 1.97, 9.12, 0.67, 2.73, 0.92, 2.51, 1.4, 1.21, 1.72, 6.87, 2.37, 0.43, 0.33, 2.59, 0.78, -0.14, 0.02, 0.97, 1.93, 1.71, 0.36, 0.48, 0.76, 0.56, 2.01]} \ No newline at end of file diff --git a/annotations_filtered/hHibPPRQB40_filtered.json b/annotations_filtered/hHibPPRQB40_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa8aa22fcb7e18114cc7ae4a8548ea93c0122f9d --- /dev/null +++ b/annotations_filtered/hHibPPRQB40_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.9], [1.0, 2.42], [3.0, 3.7], [5.0, 15.15], [16.0, 17.12], [20.0, 45.49], [66.0, 67.37], [69.0, 69.52], [71.0, 71.37], [75.0, 74.93], [76.0, 76.35], [77.0, 77.52], [79.0, 79.54], [80.0, 80.76], [81.0, 86.07], [88.0, 88.7], [90.0, 95.49], [96.0, 96.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.87, 0.0, 99.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.36, 0.0, 64.86, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.1, 1.42, 0.7, 10.15, 1.12, 25.49, 1.37, 0.52, 0.37, -0.07, 0.35, 0.52, 0.54, 0.76, 5.07, 0.7, 5.49, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/hIHC635Q9dc_filtered.json b/annotations_filtered/hIHC635Q9dc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38b1ef476583aa6cf240857551f14d82df82b33b --- /dev/null +++ b/annotations_filtered/hIHC635Q9dc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.86], [14.0, 15.09], [29.0, 30.82], [71.0, 72.69], [81.0, 82.32], [103.0, 104.62], [133.0, 134.74]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.86, 1.09, 1.82, 1.69, 1.32, 1.62, 1.74]} \ No newline at end of file diff --git a/annotations_filtered/hIJ0gMDZT_4_filtered.json b/annotations_filtered/hIJ0gMDZT_4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a4c055eb11d5ba2654bb4e17adcc094b0fec690 --- /dev/null +++ b/annotations_filtered/hIJ0gMDZT_4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.58], [7.0, 33.64], [57.0, 57.6], [61.0, 61.47], [63.0, 63.81], [71.0, 71.54], [74.0, 76.27], [78.0, 79.59], [82.0, 85.21], [87.0, 88.8], [89.0, 102.56], [103.0, 102.86], [104.0, 104.7], [108.0, 108.51], [114.0, 122.15], [123.0, 125.79], [131.0, 140.21], [143.0, 159.8], [172.0, 183.44], [184.0, 189.03]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 33.66, 0.0, 0.0, 0.0, 0.0, 91.13, 0.0, 88.83, 0.0, 56.03, 0.0, 0.0, 0.0, 31.26, 30.84, 31.19, 31.75, 30.69, 33.01], "audiomae_on_audioset": [null, [["music", 28.93], ["speech", 11.34], ["groan", 8.64]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 70.91], ["musical instrument", 5.04], ["guitar", 1.81]], [["music", 55.9], ["didgeridoo", 4.63], ["electronic music", 4.37]], [["music", 58.45], ["speech", 16.08], ["electronic music", 3.44]], [["music", 65.19], ["synthesizer", 4.51], ["throbbing", 4.49]], [["music", 50.72], ["animal", 24.56], ["neigh, whinny", 13.48]], [["music", 25.04], ["speech", 24.59], ["boing", 18.02]]], "duration": [0.58, 26.64, 0.6, 0.47, 0.81, 0.54, 2.27, 1.59, 3.21, 1.8, 13.56, -0.14, 0.7, 0.51, 8.15, 2.79, 9.21, 16.8, 11.44, 5.03]} \ No newline at end of file diff --git a/annotations_filtered/hIMv_pWXqFY_filtered.json b/annotations_filtered/hIMv_pWXqFY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c916c63b39bcd0b881a480d9ce3324b07be21a1 --- /dev/null +++ b/annotations_filtered/hIMv_pWXqFY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 14.39], [15.0, 17.31], [18.0, 31.06], [31.0, 36.8], [40.0, 40.19], [41.0, 42.16], [43.0, 44.0], [45.0, 46.01], [47.0, 51.68], [52.0, 62.63], [64.0, 66.45], [71.0, 81.26], [82.0, 83.64], [85.0, 87.51], [89.0, 99.49], [100.0, 101.11], [102.0, 104.94], [105.0, 112.7], [113.0, 118.32], [122.0, 123.65], [125.0, 126.08], [128.0, 129.57], [136.0, 136.76], [139.0, 141.72], [143.0, 151.48]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [97.43, 99.88, 92.15, 46.19, 0.0, 0.0, 0.0, 0.0, 93.45, 59.96, 57.97, 88.83, 0.0, 82.07, 50.97, 0.0, 57.25, 48.61, 52.68, 0.0, 0.0, 0.0, 0.0, 81.17, 74.76], "audiomae_on_audioset": [null, null, null, [["speech", 33.69], ["music", 21.14], ["singing bowl", 14.05]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 25.49], ["singing bowl", 15.42], ["theremin", 10.72]], null, null, null, null, null, null, null], "duration": [12.39, 2.31, 13.06, 5.8, 0.19, 1.16, 1.0, 1.01, 4.68, 10.63, 2.45, 10.26, 1.64, 2.51, 10.49, 1.11, 2.94, 7.7, 5.32, 1.65, 1.08, 1.57, 0.76, 2.72, 8.48]} \ No newline at end of file diff --git a/annotations_filtered/hITWJ6vE1os_filtered.json b/annotations_filtered/hITWJ6vE1os_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a3455024fe3eacdde38a648d260d8ed8954fd40 --- /dev/null +++ b/annotations_filtered/hITWJ6vE1os_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.55], [9.0, 9.37], [11.0, 10.84], [12.0, 12.9], [16.0, 64.59], [65.0, 102.56], [106.0, 107.32], [108.0, 116.97], [125.0, 126.18], [129.0, 128.55], [129.0, 129.78], [131.0, 132.63]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.45, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 35.44], ["music", 20.0], ["whack, thwack", 13.59]], null, null, null, null], "duration": [0.55, 0.37, -0.16, 0.9, 48.59, 37.56, 1.32, 8.97, 1.18, -0.45, 0.78, 1.63]} \ No newline at end of file diff --git a/annotations_filtered/hIUrt0AsTjw_filtered.json b/annotations_filtered/hIUrt0AsTjw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4424255afe160bc1adf42be25bf6361cec1bbdf --- /dev/null +++ b/annotations_filtered/hIUrt0AsTjw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.1], [14.0, 14.71], [16.0, 16.04], [17.0, 17.85], [18.0, 18.64], [19.0, 19.74], [22.0, 27.82], [30.0, 30.81], [32.0, 34.21], [35.0, 39.77], [41.0, 41.72], [42.0, 50.75], [52.0, 71.78], [74.0, 77.33], [79.0, 83.47], [85.0, 92.3], [96.0, 101.26], [103.0, 105.26], [106.0, 108.43]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.38, 0.0, 34.53, 30.8, 0.0, 31.67, 29.89, 30.68, 31.95, 31.56, 30.1, 36.97, 32.85], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 62.63], ["speech", 4.06], ["hum", 2.31]], null, [["mains hum", 44.0], ["hum", 21.7], ["electric shaver, electric razor", 7.24]], [["whack, thwack", 25.72], ["mosquito", 6.04], ["speech", 5.88]], null, [["music", 46.44], ["throbbing", 16.0], ["hum", 15.56]], [["music", 56.11], ["throbbing", 16.65], ["hum", 7.6]], [["throbbing", 27.33], ["hum", 24.42], ["mains hum", 18.62]], [["cattle, bovinae", 45.1], ["moo", 33.43], ["livestock, farm animals, working animals", 15.81]], [["throbbing", 35.3], ["music", 35.03], ["hum", 12.67]], [["music", 68.91], ["hum", 6.03], ["throbbing", 5.73]], [["music", 34.36], ["hum", 19.29], ["mains hum", 10.56]], [["hum", 43.1], ["sidetone", 15.15], ["mains hum", 14.08]]], "duration": [1.1, 0.71, 0.04, 0.85, 0.64, 0.74, 5.82, 0.81, 2.21, 4.77, 0.72, 8.75, 19.78, 3.33, 4.47, 7.3, 5.26, 2.26, 2.43]} \ No newline at end of file diff --git a/annotations_filtered/hImAmM5-Fpg_filtered.json b/annotations_filtered/hImAmM5-Fpg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1c6347ac0d68fb0b2f691087763125aa8ae1ea6 --- /dev/null +++ b/annotations_filtered/hImAmM5-Fpg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.13], [5.0, 6.79], [8.0, 12.28], [13.0, 15.96], [18.0, 18.06], [22.0, 22.4], [23.0, 23.62], [35.0, 35.48], [37.0, 40.66], [47.0, 48.34]], "keep_status": [false, false, true, true, false, false, false, false, false, false], "silence_prob": [87.0, 0.0, 32.07, 32.65, 0.0, 0.0, 0.0, 0.0, 39.47, 0.0], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 18.35], ["moo", 13.38], ["didgeridoo", 12.61]], [["speech", 40.79], ["music", 5.88], ["cattle, bovinae", 5.82]], null, null, null, null, [["hum", 31.85], ["mains hum", 30.11], ["music", 16.12]], null], "duration": [2.13, 1.79, 4.28, 2.96, 0.06, 0.4, 0.62, 0.48, 3.66, 1.34]} \ No newline at end of file diff --git a/annotations_filtered/hIoCskqjp9c_filtered.json b/annotations_filtered/hIoCskqjp9c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a72736c00551a379062622d7714abd3e0176ce41 --- /dev/null +++ b/annotations_filtered/hIoCskqjp9c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 20.21], [37.0, 38.5], [39.0, 40.86], [44.0, 46.13], [49.0, 51.48], [53.0, 54.23], [56.0, 74.6], [76.0, 83.0], [84.0, 86.64], [87.0, 87.93], [90.0, 89.78], [100.0, 100.77], [102.0, 103.54], [106.0, 106.91], [108.0, 109.11], [113.0, 113.16], [114.0, 114.54], [117.0, 118.13], [119.0, 119.6], [121.0, 121.05], [139.0, 139.31], [141.0, 140.95], [142.0, 141.88], [144.0, 144.49], [152.0, 153.87]], "keep_status": [true, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.03, 0.0, 0.0, 99.36, 46.94, 0.0, 42.02, 32.93, 86.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 38.66], ["music", 10.83], ["vehicle", 5.09]], null, null, null, [["speech", 51.92], ["dial tone", 10.35], ["sidetone", 4.5]], null, [["radio", 59.71], ["music", 10.32], ["sidetone", 7.04]], [["civil defense siren", 25.68], ["noise", 19.78], ["siren", 12.06]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [11.21, 1.5, 1.86, 2.13, 2.48, 1.23, 18.6, 7.0, 2.64, 0.93, -0.22, 0.77, 1.54, 0.91, 1.11, 0.16, 0.54, 1.13, 0.6, 0.05, 0.31, -0.05, -0.12, 0.49, 1.87]} \ No newline at end of file diff --git a/annotations_filtered/hIokX-nhQd8_filtered.json b/annotations_filtered/hIokX-nhQd8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5bb43f3106c1090011395a43d1f705e4d12619be --- /dev/null +++ b/annotations_filtered/hIokX-nhQd8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 13.8], [16.0, 16.29], [41.0, 41.22], [43.0, 43.71], [47.0, 55.44], [57.0, 57.57], [59.0, 60.32], [63.0, 63.26], [65.0, 66.78], [72.0, 73.45], [77.0, 78.38], [81.0, 82.36], [84.0, 84.13], [86.0, 86.91], [88.0, 88.37], [89.0, 90.17], [92.0, 93.29], [95.0, 95.1], [97.0, 96.99], [99.0, 101.31], [103.0, 103.32], [105.0, 105.66], [108.0, 113.76], [114.0, 115.69], [117.0, 119.64], [121.0, 122.86], [124.0, 124.95], [126.0, 127.13], [130.0, 132.66]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [48.56, 0.0, 0.0, 0.0, 94.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 98.01, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [[["bouncing", 30.15], ["speech", 9.2], ["noise", 6.14]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [11.8, 0.29, 0.22, 0.71, 8.44, 0.57, 1.32, 0.26, 1.78, 1.45, 1.38, 1.36, 0.13, 0.91, 0.37, 1.17, 1.29, 0.1, -0.01, 2.31, 0.32, 0.66, 5.76, 1.69, 2.64, 1.86, 0.95, 1.13, 2.66]} \ No newline at end of file diff --git a/annotations_filtered/hJErQ3vUD24_filtered.json b/annotations_filtered/hJErQ3vUD24_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f1152ea3670bb6fbaae0b2129899c596ab5a4f4 --- /dev/null +++ b/annotations_filtered/hJErQ3vUD24_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[62.0, 80.35], [81.0, 94.76], [95.0, 95.91], [97.0, 97.02], [97.0, 163.51]], "keep_status": [true, true, false, false, false], "silence_prob": [44.07, 30.63, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 25.76], ["music", 20.31], ["gong", 11.85]], [["music", 20.09], ["screaming", 14.02], ["groan", 12.55]], null, null, null], "duration": [18.35, 13.76, 0.91, 0.02, 66.51]} \ No newline at end of file diff --git a/annotations_filtered/hJUtiOm9dLY_filtered.json b/annotations_filtered/hJUtiOm9dLY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e925f2136ebd7ae45cd71adee98d0d6907bb585 --- /dev/null +++ b/annotations_filtered/hJUtiOm9dLY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.64], [5.0, 5.48], [8.0, 9.31], [11.0, 11.75], [16.0, 17.29], [18.0, 21.0], [21.0, 25.62], [27.0, 27.97], [29.0, 30.99], [33.0, 36.0], [36.0, 38.47], [41.0, 63.46], [67.0, 66.77], [68.0, 68.76], [71.0, 72.25], [73.0, 75.27], [77.0, 77.63], [85.0, 85.7], [88.0, 88.59], [92.0, 91.98], [113.0, 115.74], [119.0, 120.85], [124.0, 128.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 59.68, 0.0, 0.0, 100.0, 97.33, 100.0, 0.0, 0.0, 0.0, 63.85, 0.0, 0.0, 0.0, 0.0, 84.43, 0.0, 69.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.64, 0.48, 1.31, 0.75, 1.29, 3.0, 4.62, 0.97, 1.99, 3.0, 2.47, 22.46, -0.23, 0.76, 1.25, 2.27, 0.63, 0.7, 0.59, -0.02, 2.74, 1.85, 4.01]} \ No newline at end of file diff --git a/annotations_filtered/hJVXg1AHQTY_filtered.json b/annotations_filtered/hJVXg1AHQTY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..254a49583361da4d34cfbcd30ea35063b33f8f53 --- /dev/null +++ b/annotations_filtered/hJVXg1AHQTY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.11], [12.0, 13.78], [18.0, 19.58], [23.0, 23.6], [30.0, 31.19], [32.0, 32.51], [55.0, 57.18], [58.0, 59.27], [63.0, 64.72], [68.0, 68.88], [74.0, 74.61], [79.0, 85.13], [85.0, 86.78], [88.0, 89.88], [90.0, 91.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.37, 0.0, 0.0, 0.0, 0.0, 64.29, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.11, 1.78, 1.58, 0.6, 1.19, 0.51, 2.18, 1.27, 1.72, 0.88, 0.61, 6.13, 1.78, 1.88, 1.34]} \ No newline at end of file diff --git a/annotations_filtered/hJYfFD_MNoY_filtered.json b/annotations_filtered/hJYfFD_MNoY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..455b28655b0f635a787aa0d7354c251e2de1278e --- /dev/null +++ b/annotations_filtered/hJYfFD_MNoY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.76], [4.0, 5.22], [6.0, 7.74], [10.0, 9.76], [11.0, 12.82], [14.0, 13.73], [16.0, 21.9], [23.0, 22.94], [25.0, 26.64], [27.0, 29.61], [34.0, 36.76], [38.0, 38.55], [43.0, 43.24], [49.0, 49.89], [53.0, 55.38], [57.0, 57.23], [59.0, 60.64], [65.0, 64.94], [68.0, 68.59], [69.0, 69.84], [77.0, 77.48], [79.0, 79.49], [84.0, 84.84], [86.0, 85.95], [89.0, 90.26], [94.0, 97.53], [98.0, 98.85], [101.0, 102.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.31, 0.0, 0.0, 98.1, 82.61, 0.0, 0.0, 0.0, 93.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.52, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.76, 1.22, 1.74, -0.24, 1.82, -0.27, 5.9, -0.06, 1.64, 2.61, 2.76, 0.55, 0.24, 0.89, 2.38, 0.23, 1.64, -0.06, 0.59, 0.84, 0.48, 0.49, 0.84, -0.05, 1.26, 3.53, 0.85, 1.83]} \ No newline at end of file diff --git a/annotations_filtered/hJckGOSkTG0_filtered.json b/annotations_filtered/hJckGOSkTG0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3a10b268aea1a8140d5329af87beabb21e47938 --- /dev/null +++ b/annotations_filtered/hJckGOSkTG0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.2], [5.0, 6.12], [11.0, 12.92], [20.0, 20.56], [27.0, 27.31], [30.0, 29.94], [34.0, 36.64], [39.0, 38.96], [41.0, 41.12], [50.0, 50.7], [57.0, 58.26], [60.0, 60.32], [61.0, 62.95], [82.0, 84.81], [86.0, 89.16], [91.0, 95.1], [96.0, 96.92], [98.0, 98.31], [100.0, 99.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.2, 50.91, 60.32, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 77.44], ["musical instrument", 6.37], ["guitar", 1.84]], null, null, null, null, null], "duration": [0.2, 1.12, 1.92, 0.56, 0.31, -0.06, 2.64, -0.04, 0.12, 0.7, 1.26, 0.32, 1.95, 2.81, 3.16, 4.1, 0.92, 0.31, -0.16]} \ No newline at end of file diff --git a/annotations_filtered/hK2bLlVeh-w_filtered.json b/annotations_filtered/hK2bLlVeh-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..085e6c09f1faf784194edf837336ca25b081377d --- /dev/null +++ b/annotations_filtered/hK2bLlVeh-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.51], [6.0, 7.23], [11.0, 17.41], [25.0, 28.58], [30.0, 50.04], [51.0, 51.43], [55.0, 56.4], [57.0, 57.94], [60.0, 60.99], [63.0, 66.33], [68.0, 68.08], [70.0, 69.87], [75.0, 76.55], [78.0, 79.24], [81.0, 81.82], [83.0, 87.54], [90.0, 103.22], [104.0, 103.91], [104.0, 109.97], [110.0, 118.23], [119.0, 119.31], [121.0, 121.58], [124.0, 126.15], [128.0, 127.8], [132.0, 132.22], [133.0, 134.15], [135.0, 145.03], [147.0, 148.04], [148.0, 148.9], [150.0, 151.9], [153.0, 158.18]], "keep_status": [false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.47, 30.41, 31.23, 0.0, 0.0, 0.0, 0.0, 40.79, 0.0, 0.0, 0.0, 0.0, 0.0, 53.84, 32.7, 0.0, 72.01, 38.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 98.01, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, [["music", 22.97], ["smash, crash", 16.48], ["throbbing", 16.28]], [["music", 41.45], ["speech", 12.08], ["breaking", 6.66]], [["music", 37.8], ["sidetone", 18.6], ["speech", 11.98]], null, null, null, null, [["music", 56.84], ["speech", 21.01], ["hum", 2.39]], null, null, null, null, null, null, [["music", 73.7], ["speech", 8.81], ["throbbing", 3.02]], null, null, [["speech", 75.8], ["music", 2.77], ["sidetone", 2.7]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.51, 1.23, 6.41, 3.58, 20.04, 0.43, 1.4, 0.94, 0.99, 3.33, 0.08, -0.13, 1.55, 1.24, 0.82, 4.54, 13.22, -0.09, 5.97, 8.23, 0.31, 0.58, 2.15, -0.2, 0.22, 1.15, 10.03, 1.04, 0.9, 1.9, 5.18]} \ No newline at end of file diff --git a/annotations_filtered/hKBHte0cc_0_filtered.json b/annotations_filtered/hKBHte0cc_0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5db3d4342c16cbd4f826753f95383231c4baa27 --- /dev/null +++ b/annotations_filtered/hKBHte0cc_0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.99], [13.0, 14.64], [17.0, 17.51], [19.0, 19.57], [21.0, 21.39], [24.0, 29.64], [36.0, 38.01], [39.0, 40.2], [44.0, 44.17], [44.0, 45.22], [52.0, 52.49], [57.0, 57.15], [66.0, 65.92], [66.0, 66.26], [66.0, 67.56], [68.0, 69.6], [72.0, 78.16], [84.0, 86.88], [91.0, 90.9], [91.0, 91.88], [97.0, 97.16], [103.0, 102.95], [104.0, 110.52], [112.0, 113.98], [114.0, 115.16], [117.0, 117.09], [120.0, 119.94]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 60.32, 43.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.53, 68.15, 0.0, 0.0, 0.0, 0.0, 92.31, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 45.34], ["musical instrument", 7.32], ["speech", 4.89]], null, null, null, null, null, null, null, null, null, [["cello", 24.33], ["music", 23.46], ["bowed string instrument", 11.89]], null, null, null, null, null, null, null, null, null, null], "duration": [-0.01, 1.64, 0.51, 0.57, 0.39, 5.64, 2.01, 1.2, 0.17, 1.22, 0.49, 0.15, -0.08, 0.26, 1.56, 1.6, 6.16, 2.88, -0.1, 0.88, 0.16, -0.05, 6.52, 1.98, 1.16, 0.09, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/hKNSpQwCIdA_filtered.json b/annotations_filtered/hKNSpQwCIdA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04d597b9ab2c81fb5cdf4c026d8aba8d30d97cb2 --- /dev/null +++ b/annotations_filtered/hKNSpQwCIdA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.09], [1.0, 1.19], [1.0, 1.24], [2.0, 6.39], [7.0, 9.59], [11.0, 16.55], [17.0, 22.6], [24.0, 29.56], [35.0, 42.7], [46.0, 46.23], [47.0, 76.94], [77.0, 95.39], [98.0, 107.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 90.43, 89.72, 82.07, 89.36, 90.78, 98.19, 0.0, 96.77, 87.74, 80.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.09, 0.19, 0.24, 4.39, 2.59, 5.55, 5.6, 5.56, 7.7, 0.23, 29.94, 18.39, 9.01]} \ No newline at end of file diff --git a/annotations_filtered/hKNeFHBPgRo_filtered.json b/annotations_filtered/hKNeFHBPgRo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa01a8d1efd6a589a3b0a187e0696c072bcac86f --- /dev/null +++ b/annotations_filtered/hKNeFHBPgRo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.21], [5.0, 6.12], [7.0, 9.88], [11.0, 11.85], [18.0, 19.26], [20.0, 21.14], [22.0, 22.03], [23.0, 25.68], [28.0, 28.93], [31.0, 33.24], [39.0, 40.34], [42.0, 45.59], [47.0, 47.49], [50.0, 50.3], [60.0, 60.94], [82.0, 82.53], [90.0, 90.75], [93.0, 92.91], [99.0, 98.83], [105.0, 106.57], [111.0, 111.57], [113.0, 113.61], [117.0, 120.31], [121.0, 122.27], [125.0, 126.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 52.1, 0.0, 0.0, 0.0, 0.0, 37.57, 0.0, 94.95, 0.0, 37.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 49.73], ["sidetone", 18.99], ["radio", 9.98]], null, null, null, [["music", 15.0], ["speech", 10.77], ["knock", 10.01]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.21, 1.12, 2.88, 0.85, 1.26, 1.14, 0.03, 2.68, 0.93, 2.24, 1.34, 3.59, 0.49, 0.3, 0.94, 0.53, 0.75, -0.09, -0.17, 1.57, 0.57, 0.61, 3.31, 1.27, 1.22]} \ No newline at end of file diff --git a/annotations_filtered/hKSscAR4cS8_filtered.json b/annotations_filtered/hKSscAR4cS8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..05b6428debebee4de9f3f34ab4fd75fa214966fc --- /dev/null +++ b/annotations_filtered/hKSscAR4cS8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.6], [8.0, 8.24], [13.0, 18.5], [21.0, 20.73], [22.0, 45.57], [49.0, 52.79], [55.0, 55.9], [57.0, 58.01], [59.0, 68.94], [69.0, 77.72], [82.0, 85.87], [87.0, 100.63], [110.0, 112.01], [115.0, 144.37]], "keep_status": [false, false, false, false, false, true, false, false, true, true, false, true, false, true], "silence_prob": [0.0, 0.0, 39.08, 0.0, 37.22, 49.13, 0.0, 0.0, 34.37, 37.19, 52.16, 33.57, 46.64, 38.42], "audiomae_on_audioset": [null, null, [["music", 58.86], ["hum", 6.43], ["mains hum", 6.26]], null, [["music", 72.23], ["buzz", 2.05], ["hum", 1.99]], [["hum", 31.38], ["mains hum", 14.22], ["music", 12.31]], null, null, [["speech", 21.06], ["music", 12.51], ["glass", 7.34]], [["hum", 30.78], ["speech", 15.31], ["mains hum", 15.04]], null, [["music", 31.41], ["hum", 23.1], ["throbbing", 14.11]], [["music", 55.44], ["didgeridoo", 10.22], ["musical instrument", 4.9]], [["music", 31.27], ["breaking", 13.64], ["hum", 11.72]]], "duration": [0.6, 0.24, 5.5, -0.27, 23.57, 3.79, 0.9, 1.01, 9.94, 8.72, 3.87, 13.63, 2.01, 29.37]} \ No newline at end of file diff --git a/annotations_filtered/hKoYPfcWpcU_filtered.json b/annotations_filtered/hKoYPfcWpcU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fe3a78fdf6f6e2936c71a3ce60f7e69432d183f --- /dev/null +++ b/annotations_filtered/hKoYPfcWpcU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.04], [6.0, 5.8], [6.0, 6.89], [8.0, 7.6], [8.0, 8.26], [9.0, 9.22], [12.0, 13.26], [15.0, 15.55], [16.0, 18.23], [20.0, 21.88], [24.0, 25.66], [28.0, 29.3], [32.0, 34.99], [36.0, 49.0], [49.0, 54.62], [55.0, 64.45], [66.0, 81.36], [82.0, 126.62], [128.0, 129.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.86, 0.0, 0.0, 0.0, 97.11, 96.42, 99.21, 89.19, 99.76, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.04, -0.2, 0.89, -0.4, 0.26, 0.22, 1.26, 0.55, 2.23, 1.88, 1.66, 1.3, 2.99, 13.0, 5.62, 9.45, 15.36, 44.62, 1.76]} \ No newline at end of file diff --git a/annotations_filtered/hKqQSFaX4NQ_filtered.json b/annotations_filtered/hKqQSFaX4NQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1290878120361733ebf9e386b4ab38b0640f6b08 --- /dev/null +++ b/annotations_filtered/hKqQSFaX4NQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.57], [7.0, 13.54], [15.0, 17.52], [25.0, 38.26], [52.0, 52.46], [54.0, 54.7], [60.0, 61.99], [67.0, 68.74], [71.0, 71.86], [73.0, 73.06], [73.0, 73.58], [75.0, 77.68], [79.0, 79.86], [83.0, 83.89], [85.0, 92.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 77.53, 71.14, 45.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, [["music", 45.76], ["theremin", 15.28], ["didgeridoo", 10.72]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.57, 6.54, 2.52, 13.26, 0.46, 0.7, 1.99, 1.74, 0.86, 0.06, 0.58, 2.68, 0.86, 0.89, 7.52]} \ No newline at end of file diff --git a/annotations_filtered/hKr4-rNmLFo_filtered.json b/annotations_filtered/hKr4-rNmLFo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..738d2c6fe6a56d455a9a077133a8035ef3e09f2d --- /dev/null +++ b/annotations_filtered/hKr4-rNmLFo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.9], [2.0, 2.79], [3.0, 13.68], [15.0, 16.56], [19.0, 20.71], [21.0, 21.69], [22.0, 24.26], [27.0, 29.27], [35.0, 34.72], [35.0, 35.45], [36.0, 38.52], [40.0, 41.15], [47.0, 60.05], [61.0, 114.99], [116.0, 134.45], [136.0, 233.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 62.27, 0.0, 0.0, 0.0, 71.14, 88.83, 0.0, 0.0, 76.53, 0.0, 85.72, 0.0, 37.81, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 60.27], ["hum", 18.64], ["throbbing", 6.16]], null], "duration": [-0.1, 0.79, 10.68, 1.56, 1.71, 0.69, 2.26, 2.27, -0.28, 0.45, 2.52, 1.15, 13.05, 53.99, 18.45, 97.95]} \ No newline at end of file diff --git a/annotations_filtered/hKuh_h2nzN8_filtered.json b/annotations_filtered/hKuh_h2nzN8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9e4eb848b148bcb07fc9413a7c0e8be6425e4df --- /dev/null +++ b/annotations_filtered/hKuh_h2nzN8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 68.71], [70.0, 75.03], [78.0, 82.39], [84.0, 88.05], [96.0, 97.7], [98.0, 100.26], [102.0, 102.69], [104.0, 103.86], [107.0, 144.26], [148.0, 148.59]], "keep_status": [false, true, false, true, false, false, false, false, false, false], "silence_prob": [28.06, 31.11, 36.98, 35.17, 0.0, 59.96, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 81.69], ["electronic music", 1.5], ["song", 0.92]], [["speech", 40.01], ["crowd", 13.15], ["outside, urban or manmade", 4.97]], [["cattle, bovinae", 42.06], ["moo", 38.43], ["livestock, farm animals, working animals", 19.13]], [["speech", 16.93], ["sheep", 11.03], ["bleat", 6.1]], null, null, null, null, null, null], "duration": [23.71, 5.03, 4.39, 4.05, 1.7, 2.26, 0.69, -0.14, 37.26, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/hKvpF7ACDBo_filtered.json b/annotations_filtered/hKvpF7ACDBo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87382c99c7127bb802bdc7e8e457e58d681108e9 --- /dev/null +++ b/annotations_filtered/hKvpF7ACDBo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.54], [8.0, 9.96], [11.0, 13.37], [14.0, 16.06], [17.0, 24.04], [25.0, 29.57], [30.0, 31.01], [33.0, 42.58], [49.0, 52.15], [69.0, 71.37]], "keep_status": [false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 97.83, 62.89, 70.44, 67.76, 0.0, 73.67, 39.98, 56.33], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["fly, housefly", 16.31], ["insect", 9.15], ["bee, wasp, etc.", 7.66]], null], "duration": [1.54, 1.96, 2.37, 2.06, 7.04, 4.57, 1.01, 9.58, 3.15, 2.37]} \ No newline at end of file diff --git a/annotations_filtered/hL71tkydKPM_filtered.json b/annotations_filtered/hL71tkydKPM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..035b363a697537817c8341860d476d7aae89acc4 --- /dev/null +++ b/annotations_filtered/hL71tkydKPM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.21], [12.0, 12.83], [14.0, 14.72], [17.0, 17.15], [19.0, 19.74], [23.0, 32.78], [43.0, 46.35], [49.0, 50.5], [51.0, 51.43], [55.0, 58.06]], "keep_status": [true, false, false, false, false, false, false, false, false, false], "silence_prob": [36.51, 0.0, 0.0, 0.0, 0.0, 30.93, 30.42, 0.0, 0.0, 29.87], "audiomae_on_audioset": [[["music", 40.32], ["hum", 16.24], ["mains hum", 9.74]], null, null, null, null, [["music", 55.78], ["reggae", 10.66], ["speech", 7.16]], [["music", 68.43], ["reggae", 2.04], ["musical instrument", 1.8]], null, null, [["music", 74.45], ["swing music", 2.85], ["ska", 2.21]]], "duration": [8.21, 0.83, 0.72, 0.15, 0.74, 9.78, 3.35, 1.5, 0.43, 3.06]} \ No newline at end of file diff --git a/annotations_filtered/hLCjV1eOAoA_filtered.json b/annotations_filtered/hLCjV1eOAoA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72b5a97c8d11924f5de54241fdf6f267380f6a1e --- /dev/null +++ b/annotations_filtered/hLCjV1eOAoA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.03], [2.0, 2.07], [2.0, 6.32], [7.0, 7.01], [10.0, 9.73], [11.0, 11.75], [17.0, 17.63], [19.0, 20.55], [25.0, 24.76], [25.0, 25.39], [27.0, 27.4], [32.0, 32.51], [45.0, 45.45], [52.0, 52.93], [85.0, 86.0]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 57.38], ["music", 4.9], ["burping, eructation", 4.27]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.03, 0.07, 4.32, 0.01, -0.27, 0.75, 0.63, 1.55, -0.24, 0.39, 0.4, 0.51, 0.45, 0.93, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/hLNZCf1nuRo_filtered.json b/annotations_filtered/hLNZCf1nuRo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5138a144f6e46c0e188ed487f92875ab1118f361 --- /dev/null +++ b/annotations_filtered/hLNZCf1nuRo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 12.23], [14.0, 15.74]], "keep_status": [false, false], "silence_prob": [51.23, 0.0], "audiomae_on_audioset": [null, null], "duration": [6.23, 1.74]} \ No newline at end of file diff --git a/annotations_filtered/hLQQfSmgoGY_filtered.json b/annotations_filtered/hLQQfSmgoGY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a060ade5a60920673bb6408644a1d66ac93b22f4 --- /dev/null +++ b/annotations_filtered/hLQQfSmgoGY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 32.81], [34.0, 49.15], [50.0, 63.63], [67.0, 66.93], [73.0, 73.95], [74.0, 74.58], [75.0, 75.78], [77.0, 86.21]], "keep_status": [false, false, false, false, false, false, false, true], "silence_prob": [0.0, 31.61, 34.08, 0.0, 0.0, 0.0, 0.0, 32.9], "audiomae_on_audioset": [null, [["music", 73.48], ["theremin", 12.9], ["synthesizer", 3.69]], [["music", 63.47], ["noise", 4.58], ["theremin", 3.78]], null, null, null, null, [["music", 22.28], ["hum", 17.73], ["mains hum", 15.67]]], "duration": [31.81, 15.15, 13.63, -0.07, 0.95, 0.58, 0.78, 9.21]} \ No newline at end of file diff --git a/annotations_filtered/hLUSwJuMjWo_filtered.json b/annotations_filtered/hLUSwJuMjWo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6cfddbf652a0bc041bd0b3744d3873b16df80f9 --- /dev/null +++ b/annotations_filtered/hLUSwJuMjWo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 48.71], [51.0, 50.73], [51.0, 52.57], [53.0, 52.69], [53.0, 53.0], [57.0, 60.32], [65.0, 65.11], [67.0, 67.61], [68.0, 68.96], [70.0, 70.85], [73.0, 74.36], [76.0, 76.18], [77.0, 78.7], [81.0, 84.99]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [34.27, 0.0, 0.0, 0.0, 0.0, 48.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.2], "audiomae_on_audioset": [[["hum", 43.3], ["music", 19.49], ["throbbing", 19.34]], null, null, null, null, [["music", 15.91], ["sine wave", 12.68], ["hum", 10.63]], null, null, null, null, null, null, null, [["mains hum", 33.4], ["speech", 16.36], ["music", 9.93]]], "duration": [15.71, -0.27, 1.57, -0.31, 0.0, 3.32, 0.11, 0.61, 0.96, 0.85, 1.36, 0.18, 1.7, 3.99]} \ No newline at end of file diff --git a/annotations_filtered/hLbozjgBIE0_filtered.json b/annotations_filtered/hLbozjgBIE0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2d727314cb6b81daae63d9942911853ae8f866a --- /dev/null +++ b/annotations_filtered/hLbozjgBIE0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.15], [16.0, 21.44], [23.0, 24.61], [25.0, 26.55], [27.0, 33.15], [35.0, 37.39], [38.0, 40.41], [43.0, 44.41], [47.0, 51.41], [53.0, 56.91], [59.0, 60.29], [61.0, 63.63], [65.0, 67.07], [70.0, 70.98], [73.0, 75.03], [77.0, 77.95], [82.0, 86.26], [87.0, 89.13], [90.0, 94.22], [97.0, 97.7], [100.0, 101.01], [104.0, 104.7], [107.0, 108.04], [110.0, 110.56], [111.0, 113.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.8, 99.91, 0.0, 0.0, 99.05, 97.33, 90.43, 0.0, 99.52, 99.98, 0.0, 97.0, 95.64, 0.0, 99.98, 0.0, 99.88, 99.84, 99.16, 0.0, 0.0, 0.0, 0.0, 0.0, 98.93], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.15, 5.44, 1.61, 1.55, 6.15, 2.39, 2.41, 1.41, 4.41, 3.91, 1.29, 2.63, 2.07, 0.98, 2.03, 0.95, 4.26, 2.13, 4.22, 0.7, 1.01, 0.7, 1.04, 0.56, 2.41]} \ No newline at end of file diff --git a/annotations_filtered/hLrM7OaMTGg_filtered.json b/annotations_filtered/hLrM7OaMTGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62ebe39636ab65ca2b0755117cf8c3a2aac011e9 --- /dev/null +++ b/annotations_filtered/hLrM7OaMTGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.43], [4.0, 5.05], [6.0, 10.71], [15.0, 15.79], [16.0, 16.48], [25.0, 30.01], [30.0, 30.92], [35.0, 36.42], [38.0, 42.35], [50.0, 54.31], [55.0, 56.29], [56.0, 73.16], [74.0, 74.92], [82.0, 85.67], [86.0, 85.7], [90.0, 90.81], [92.0, 93.11], [93.0, 96.57], [99.0, 98.81], [108.0, 111.55], [126.0, 128.88]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 55.96, 0.0, 0.0, 50.06, 0.0, 0.0, 41.07, 44.84, 0.0, 54.3, 0.0, 31.59, 0.0, 0.0, 0.0, 39.54, 0.0, 43.74, 52.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 42.17], ["throbbing", 8.48], ["synthesizer", 5.44]], [["music", 32.92], ["synthesizer", 13.94], ["drum machine", 13.35]], null, null, null, [["speech", 56.82], ["music", 14.81], ["boing", 5.08]], null, null, null, [["speech", 60.48], ["music", 10.06], ["percussion", 2.14]], null, [["music", 22.49], ["speech", 15.45], ["animal", 2.86]], null], "duration": [1.43, 1.05, 4.71, 0.79, 0.48, 5.01, 0.92, 1.42, 4.35, 4.31, 1.29, 17.16, 0.92, 3.67, -0.3, 0.81, 1.11, 3.57, -0.19, 3.55, 2.88]} \ No newline at end of file diff --git a/annotations_filtered/hM1OunX-QBg_filtered.json b/annotations_filtered/hM1OunX-QBg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f17d015c54bbf9e41771fb2d14ecad3370d6337 --- /dev/null +++ b/annotations_filtered/hM1OunX-QBg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[79.0, 83.88], [85.0, 84.94], [85.0, 90.88], [92.0, 100.38], [106.0, 128.95]], "keep_status": [false, false, true, true, false], "silence_prob": [31.25, 0.0, 31.23, 29.42, 29.88], "audiomae_on_audioset": [[["speech", 35.27], ["music", 30.19], ["quack", 7.77]], null, [["hum", 27.13], ["speech", 19.95], ["throbbing", 15.43]], [["music", 38.14], ["speech", 11.73], ["burst, pop", 4.57]], [["speech", 36.29], ["music", 33.69], ["gunshot, gunfire", 4.78]]], "duration": [4.88, -0.06, 5.88, 8.38, 22.95]} \ No newline at end of file diff --git a/annotations_filtered/hM3nn30NxCE_filtered.json b/annotations_filtered/hM3nn30NxCE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a6574311a9231b2d2a7940745ec1949568a11798 --- /dev/null +++ b/annotations_filtered/hM3nn30NxCE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.01], [13.0, 13.02], [17.0, 18.13], [22.0, 22.03], [24.0, 24.85], [26.0, 27.09], [44.0, 44.41], [69.0, 69.5], [70.0, 70.46], [79.0, 79.73], [85.0, 85.87], [87.0, 87.1], [91.0, 91.56], [95.0, 95.98], [99.0, 101.44], [108.0, 108.35], [111.0, 124.34], [125.0, 126.45], [126.0, 126.87], [129.0, 133.02], [134.0, 135.78], [136.0, 136.8], [137.0, 138.59], [139.0, 141.84], [142.0, 147.88], [149.0, 148.91], [151.0, 163.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.05, 0.0, 49.5, 0.0, 0.0, 62.07, 0.0, 0.0, 0.0, 33.6, 36.52, 0.0, 30.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 25.54], ["insect", 11.35], ["frog", 8.6]], null, null, null, null, null, null, [["speech", 26.27], ["whistling", 4.9], ["radio", 4.05]], [["animal", 18.46], ["livestock, farm animals, working animals", 12.53], ["speech", 11.38]], null, [["speech", 12.23], ["animal", 9.1], ["hum", 5.96]]], "duration": [1.01, 0.02, 1.13, 0.03, 0.85, 1.09, 0.41, 0.5, 0.46, 0.73, 0.87, 0.1, 0.56, 0.98, 2.44, 0.35, 13.34, 1.45, 0.87, 4.02, 1.78, 0.8, 1.59, 2.84, 5.88, -0.09, 12.14]} \ No newline at end of file diff --git a/annotations_filtered/hM6ItEXb_Us_filtered.json b/annotations_filtered/hM6ItEXb_Us_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c25aed08c8dda789406cb66f62541b2384acea9f --- /dev/null +++ b/annotations_filtered/hM6ItEXb_Us_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.41], [10.0, 21.86], [25.0, 25.05], [25.0, 38.64], [40.0, 59.02], [63.0, 82.75], [83.0, 97.28], [101.0, 101.09], [102.0, 126.05]], "keep_status": [false, true, false, true, false, false, true, false, false], "silence_prob": [0.0, 32.79, 0.0, 31.73, 35.24, 31.38, 43.93, 0.0, 35.11], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 32.42], ["moo", 17.71], ["cattle, bovinae", 14.33]], null, [["music", 39.37], ["vehicle", 11.08], ["livestock, farm animals, working animals", 7.87]], [["music", 74.93], ["throbbing", 3.86], ["smash, crash", 3.19]], [["music", 87.04], ["didgeridoo", 1.42], ["electronic music", 1.25]], [["music", 26.58], ["livestock, farm animals, working animals", 14.82], ["cattle, bovinae", 11.62]], null, [["cattle, bovinae", 57.18], ["moo", 27.34], ["livestock, farm animals, working animals", 15.37]]], "duration": [0.41, 11.86, 0.05, 13.64, 19.02, 19.75, 14.28, 0.09, 24.05]} \ No newline at end of file diff --git a/annotations_filtered/hM6KNsz7_mk_filtered.json b/annotations_filtered/hM6KNsz7_mk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44ffd61e75acd39a9ff3107991149161d08dfa1d --- /dev/null +++ b/annotations_filtered/hM6KNsz7_mk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.47], [8.0, 9.12], [11.0, 12.58], [14.0, 15.25], [21.0, 21.07], [30.0, 31.41], [33.0, 34.13], [37.0, 37.4], [39.0, 40.42], [42.0, 42.57], [44.0, 47.73], [51.0, 51.33], [56.0, 57.55], [58.0, 58.24], [84.0, 84.43], [86.0, 89.13], [90.0, 91.45], [93.0, 94.22], [105.0, 105.75], [107.0, 107.08], [117.0, 117.64], [121.0, 121.34], [122.0, 122.32], [123.0, 123.16], [125.0, 125.52], [134.0, 134.86], [135.0, 136.32], [141.0, 141.2], [143.0, 143.11], [143.0, 144.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.59, 0.0, 0.0, 0.0, 0.0, 60.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 26.32], ["speech", 20.02], ["electronic music", 14.73]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 1.12, 1.58, 1.25, 0.07, 1.41, 1.13, 0.4, 1.42, 0.57, 3.73, 0.33, 1.55, 0.24, 0.43, 3.13, 1.45, 1.22, 0.75, 0.08, 0.64, 0.34, 0.32, 0.16, 0.52, 0.86, 1.32, 0.2, 0.11, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/hMGHJFVuqpg_filtered.json b/annotations_filtered/hMGHJFVuqpg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d027acd110c88820a225f85f7f94c901af5d387 --- /dev/null +++ b/annotations_filtered/hMGHJFVuqpg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.28], [21.0, 21.96], [23.0, 25.08], [27.0, 27.01], [33.0, 34.06], [35.0, 36.26], [37.0, 38.1], [39.0, 60.72], [61.0, 85.7], [88.0, 98.88], [102.0, 102.46], [105.0, 108.21], [114.0, 133.68], [134.0, 148.59], [151.0, 158.08], [160.0, 167.46], [171.0, 172.47], [175.0, 182.31], [184.0, 186.81], [190.0, 199.12], [200.0, 202.86], [203.0, 204.58], [205.0, 206.81], [210.0, 214.59], [218.0, 221.21], [226.0, 228.78], [233.0, 235.48], [238.0, 238.01], [241.0, 245.49], [248.0, 252.83], [254.0, 259.17], [263.0, 265.69]], "keep_status": [false, false, true, false, false, false, false, false, true, true, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 42.88, 0.0, 0.0, 0.0, 0.0, 34.68, 34.55, 33.64, 0.0, 36.2, 35.66, 30.97, 31.35, 33.99, 0.0, 31.94, 32.15, 46.29, 42.62, 0.0, 0.0, 72.01, 43.79, 85.54, 93.29, 0.0, 73.51, 48.44, 41.78, 72.31], "audiomae_on_audioset": [null, null, [["music", 45.19], ["throbbing", 7.36], ["hum", 6.57]], null, null, null, null, [["music", 71.44], ["speech", 5.61], ["theremin", 5.17]], [["music", 44.2], ["buzz", 18.5], ["speech", 6.84]], [["music", 49.59], ["speech", 11.38], ["hum", 5.08]], null, [["throbbing", 53.96], ["music", 32.6], ["hum", 5.02]], [["music", 67.38], ["throbbing", 4.96], ["hum", 4.72]], [["music", 61.5], ["throbbing", 12.8], ["hum", 3.27]], [["music", 40.9], ["throbbing", 7.58], ["hum", 6.95]], [["music", 35.59], ["hum", 27.24], ["mains hum", 15.1]], null, [["music", 39.44], ["speech", 21.0], ["throbbing", 7.9]], [["speech", 15.41], ["vehicle", 7.51], ["cattle, bovinae", 6.16]], [["music", 59.83], ["ambient music", 11.81], ["electronic music", 5.5]], [["ambient music", 34.0], ["music", 32.98], ["synthesizer", 7.32]], null, null, null, [["music", 68.58], ["synthesizer", 2.47], ["keyboard (musical)", 2.27]], null, null, null, null, [["music", 43.71], ["electric piano", 7.28], ["piano", 5.96]], [["music", 74.23], ["singing", 4.84], ["lullaby", 2.57]], null], "duration": [0.28, 0.96, 2.08, 0.01, 1.06, 1.26, 1.1, 21.72, 24.7, 10.88, 0.46, 3.21, 19.68, 14.59, 7.08, 7.46, 1.47, 7.31, 2.81, 9.12, 2.86, 1.58, 1.81, 4.59, 3.21, 2.78, 2.48, 0.01, 4.49, 4.83, 5.17, 2.69]} \ No newline at end of file diff --git a/annotations_filtered/hMMAB3MNCKw_filtered.json b/annotations_filtered/hMMAB3MNCKw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6309b921eb627e830e4fd5af5ea1b20f455ae25 --- /dev/null +++ b/annotations_filtered/hMMAB3MNCKw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.35], [3.0, 5.19], [6.0, 7.32], [9.0, 10.47], [11.0, 12.88], [18.0, 19.82], [25.0, 25.15], [36.0, 36.9], [44.0, 49.0], [60.0, 61.82], [62.0, 62.11], [64.0, 64.3], [67.0, 77.21], [78.0, 82.29], [83.0, 96.9], [99.0, 110.74], [111.0, 113.51], [114.0, 180.84], [181.0, 181.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.55, 0.0, 0.0, 0.0, 91.98, 53.04, 70.72, 37.96, 42.93, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 65.59], ["musical instrument", 6.13], ["clarinet", 4.18]], [["music", 42.19], ["musical instrument", 6.93], ["saxophone", 6.12]], null, null], "duration": [0.35, 2.19, 1.32, 1.47, 1.88, 1.82, 0.15, 0.9, 5.0, 1.82, 0.11, 0.3, 10.21, 4.29, 13.9, 11.74, 2.51, 66.84, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/hMW3GQ2x79Q_filtered.json b/annotations_filtered/hMW3GQ2x79Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..762a98f687eff51258164a308ae9271dc3e068d4 --- /dev/null +++ b/annotations_filtered/hMW3GQ2x79Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 28.93], [42.0, 64.13], [78.0, 78.16], [79.0, 101.09], [104.0, 116.16], [119.0, 120.07], [122.0, 128.78]], "keep_status": [false, true, false, true, false, false, false], "silence_prob": [29.03, 29.31, 0.0, 29.94, 77.53, 0.0, 47.54], "audiomae_on_audioset": [[["music", 46.94], ["noise", 17.49], ["theremin", 6.8]], [["music", 26.82], ["hum", 16.52], ["throbbing", 15.44]], null, [["music", 29.62], ["hum", 8.11], ["motorcycle", 7.35]], null, null, [["insect", 39.8], ["fly, housefly", 39.03], ["mosquito", 6.42]]], "duration": [28.93, 22.13, 0.16, 22.09, 12.16, 1.07, 6.78]} \ No newline at end of file diff --git a/annotations_filtered/hMbcMlAVxeg_filtered.json b/annotations_filtered/hMbcMlAVxeg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ded20533a58204d923ecdf005a319213c0dc5f1 --- /dev/null +++ b/annotations_filtered/hMbcMlAVxeg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 10.71], [11.0, 12.18], [14.0, 19.21], [21.0, 21.86], [26.0, 27.11], [29.0, 33.51], [34.0, 40.95], [45.0, 50.97], [51.0, 55.7], [58.0, 70.09], [70.0, 72.39], [73.0, 74.43], [75.0, 96.04]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [79.76, 0.0, 85.17, 0.0, 0.0, 42.65, 40.57, 35.18, 35.68, 38.15, 55.31, 0.0, 36.5], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 52.64], ["mains hum", 25.65], ["throbbing", 10.52]], [["hum", 25.48], ["speech", 22.0], ["mains hum", 15.87]], [["hum", 42.84], ["music", 22.25], ["throbbing", 6.8]], [["hum", 56.43], ["mains hum", 20.32], ["throbbing", 8.47]], [["hum", 62.93], ["throbbing", 14.2], ["mains hum", 7.21]], null, null, [["hum", 13.64], ["grunt", 13.19], ["noise", 5.78]]], "duration": [8.71, 1.18, 5.21, 0.86, 1.11, 4.51, 6.95, 5.97, 4.7, 12.09, 2.39, 1.43, 21.04]} \ No newline at end of file diff --git a/annotations_filtered/hN5We42pLhs_filtered.json b/annotations_filtered/hN5We42pLhs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d375251d2c76f2aeed50c88e1c289998b6580015 --- /dev/null +++ b/annotations_filtered/hN5We42pLhs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 59.73], [76.0, 76.57], [77.0, 83.15], [90.0, 90.56], [92.0, 93.19], [99.0, 99.62], [101.0, 102.54], [103.0, 104.11], [106.0, 107.1], [109.0, 110.1], [111.0, 111.72], [114.0, 114.13], [115.0, 118.66], [124.0, 123.6], [126.0, 126.17], [127.0, 127.65], [129.0, 133.22], [134.0, 136.16], [136.0, 137.73], [139.0, 140.66], [141.0, 150.65], [153.0, 152.95]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [30.97, 0.0, 33.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.68, 0.0, 0.0, 0.0, 41.76, 34.86, 0.0, 0.0, 30.28, 0.0], "audiomae_on_audioset": [[["thunk", 25.42], ["breaking", 14.07], ["music", 12.32]], null, [["music", 55.04], ["speech", 11.53], ["mains hum", 7.87]], null, null, null, null, null, null, null, null, null, [["breaking", 46.67], ["speech", 26.08], ["music", 13.84]], null, null, null, [["music", 36.53], ["singing bowl", 10.5], ["musical instrument", 5.42]], [["music", 48.62], ["speech", 12.87], ["didgeridoo", 8.27]], null, null, [["music", 42.41], ["speech", 32.47], ["didgeridoo", 7.83]], null], "duration": [27.73, 0.57, 6.15, 0.56, 1.19, 0.62, 1.54, 1.11, 1.1, 1.1, 0.72, 0.13, 3.66, -0.4, 0.17, 0.65, 4.22, 2.16, 1.73, 1.66, 9.65, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/hOB4Qm1IiOY_filtered.json b/annotations_filtered/hOB4Qm1IiOY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6abb8bf131f33a583a44ff77e73f6a137fc3b73 --- /dev/null +++ b/annotations_filtered/hOB4Qm1IiOY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.36], [2.0, 4.89], [9.0, 9.19], [15.0, 16.31], [20.0, 21.49], [25.0, 27.67], [34.0, 35.73], [42.0, 43.9], [47.0, 48.71], [49.0, 49.76], [52.0, 52.81], [55.0, 56.05], [68.0, 68.44], [71.0, 71.25], [74.0, 78.09], [84.0, 85.09], [89.0, 91.62], [94.0, 96.94], [98.0, 102.69], [104.0, 112.04], [113.0, 115.42], [116.0, 116.88], [118.0, 124.48], [127.0, 128.9], [132.0, 138.21], [139.0, 141.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 70.58, 0.0, 0.0, 0.0, 64.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.71, 0.0, 47.66, 41.68, 72.31, 68.8, 69.88, 0.0, 74.76, 0.0, 81.35, 84.43], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 26.62], ["gong", 21.9], ["singing bowl", 20.09]], [["music", 53.87], ["ambient music", 10.51], ["sonar", 4.83]], null, null, null, null, null, null, null, null], "duration": [0.36, 2.89, 0.19, 1.31, 1.49, 2.67, 1.73, 1.9, 1.71, 0.76, 0.81, 1.05, 0.44, 0.25, 4.09, 1.09, 2.62, 2.94, 4.69, 8.04, 2.42, 0.88, 6.48, 1.9, 6.21, 2.08]} \ No newline at end of file diff --git a/annotations_filtered/hOH-oOCfsX4_filtered.json b/annotations_filtered/hOH-oOCfsX4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b9e7837ef5e3bdd8f03a277f3bfca833737c473 --- /dev/null +++ b/annotations_filtered/hOH-oOCfsX4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.38], [11.0, 11.47], [12.0, 12.48], [16.0, 19.92], [21.0, 48.51], [53.0, 67.12], [107.0, 157.01], [158.0, 159.54], [162.0, 164.39], [165.0, 168.34]], "keep_status": [true, false, false, true, true, true, false, false, true, true], "silence_prob": [33.71, 0.0, 0.0, 31.08, 34.29, 33.1, 0.0, 0.0, 31.05, 31.75], "audiomae_on_audioset": [[["speech", 47.41], ["creak", 7.09], ["livestock, farm animals, working animals", 6.93]], null, null, [["livestock, farm animals, working animals", 30.6], ["cattle, bovinae", 21.2], ["moo", 12.77]], [["animal", 24.77], ["horse", 20.29], ["clip-clop", 18.36]], [["speech", 37.4], ["clip-clop", 7.17], ["animal", 6.69]], null, null, [["hum", 21.87], ["speech", 16.82], ["throbbing", 16.41]], [["cattle, bovinae", 36.39], ["moo", 14.44], ["livestock, farm animals, working animals", 10.29]]], "duration": [3.38, 0.47, 0.48, 3.92, 27.51, 14.12, 50.01, 1.54, 2.39, 3.34]} \ No newline at end of file diff --git a/annotations_filtered/hONljrAJrH0_filtered.json b/annotations_filtered/hONljrAJrH0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..711858f9b4763d6cfd8a5b3de90197a6e9fbfed5 --- /dev/null +++ b/annotations_filtered/hONljrAJrH0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.99], [13.0, 13.71], [17.0, 18.67], [20.0, 20.78], [22.0, 29.12], [30.0, 31.83], [32.0, 40.04], [40.0, 40.54], [43.0, 45.39]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.56, 0.0, 34.46, 0.0, 33.63], "audiomae_on_audioset": [null, null, null, null, [["music", 32.13], ["whale vocalization", 31.06], ["carnatic music", 8.42]], null, [["music", 66.26], ["theremin", 20.77], ["musical instrument", 2.92]], null, [["theremin", 53.56], ["music", 30.83], ["musical instrument", 1.63]]], "duration": [1.99, 0.71, 1.67, 0.78, 7.12, 1.83, 8.04, 0.54, 2.39]} \ No newline at end of file diff --git a/annotations_filtered/hOnolgR_8tc_filtered.json b/annotations_filtered/hOnolgR_8tc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59fea97f27cd5dbc88546b88872a8e086ad98e28 --- /dev/null +++ b/annotations_filtered/hOnolgR_8tc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.5], [9.0, 10.0], [12.0, 13.14], [14.0, 15.5], [17.0, 17.81], [19.0, 19.67], [21.0, 22.91], [25.0, 26.06], [28.0, 29.83], [31.0, 41.93], [43.0, 44.25], [45.0, 46.89], [48.0, 49.6], [52.0, 52.51], [54.0, 55.86], [57.0, 59.26], [61.0, 62.61], [64.0, 64.71], [66.0, 67.37], [69.0, 72.17], [74.0, 74.92], [76.0, 76.52], [77.0, 77.63], [80.0, 81.65], [84.0, 85.13], [87.0, 88.45], [90.0, 96.31], [97.0, 100.21], [101.0, 104.35], [106.0, 108.11], [111.0, 112.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.38, 0.0, 0.0, 0.0, 0.0, 0.0, 41.62, 0.0, 0.0, 0.0, 57.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.01, 47.08, 63.53, 63.74, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 48.59], ["sidetone", 7.09], ["whale vocalization", 5.44]], null, null, null, null, null, null, null, null, null, null, null, [["hum", 18.97], ["speech", 18.16], ["radio", 15.17]], null, null, null], "duration": [1.5, 1.0, 1.14, 1.5, 0.81, 0.67, 1.91, 1.06, 1.83, 10.93, 1.25, 1.89, 1.6, 0.51, 1.86, 2.26, 1.61, 0.71, 1.37, 3.17, 0.92, 0.52, 0.63, 1.65, 1.13, 1.45, 6.31, 3.21, 3.35, 2.11, 1.23]} \ No newline at end of file diff --git a/annotations_filtered/hOz9L1KrJJY_filtered.json b/annotations_filtered/hOz9L1KrJJY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4893c6fa376385ad18996b64be7a383bcf64d43f --- /dev/null +++ b/annotations_filtered/hOz9L1KrJJY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.5], [17.0, 16.73], [19.0, 22.64], [26.0, 26.45], [32.0, 34.35], [40.0, 40.73], [43.0, 44.81], [45.0, 46.72], [48.0, 48.24], [49.0, 50.45], [51.0, 55.95], [59.0, 58.92], [61.0, 61.33], [67.0, 67.15], [74.0, 100.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 82.43, 0.0, 62.47, 0.0, 0.0, 0.0, 0.0, 0.0, 31.51, 0.0, 0.0, 0.0, 30.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 52.55], ["music", 12.29], ["roar", 3.35]], null, null, null, [["music", 30.41], ["hum", 17.13], ["speech", 15.12]]], "duration": [0.5, -0.27, 3.64, 0.45, 2.35, 0.73, 1.81, 1.72, 0.24, 1.45, 4.95, -0.08, 0.33, 0.15, 26.99]} \ No newline at end of file diff --git a/annotations_filtered/hP77V2X1Biw_filtered.json b/annotations_filtered/hP77V2X1Biw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56dcb6ec48f988ee3e320d732d3b4238806ce438 --- /dev/null +++ b/annotations_filtered/hP77V2X1Biw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 14.18], [16.0, 61.97], [65.0, 91.57], [92.0, 94.91]], "keep_status": [false, false, true, false], "silence_prob": [97.11, 0.0, 40.17, 42.37], "audiomae_on_audioset": [null, null, [["radio", 24.08], ["hum", 11.05], ["sidetone", 9.57]], [["mains hum", 38.29], ["hum", 33.3], ["creak", 6.39]]], "duration": [8.18, 45.97, 26.57, 2.91]} \ No newline at end of file diff --git a/annotations_filtered/hPF9nzzuMfo_filtered.json b/annotations_filtered/hPF9nzzuMfo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8eaea247031247cd25449fc07c4bb48466e268c0 --- /dev/null +++ b/annotations_filtered/hPF9nzzuMfo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.67], [6.0, 8.46], [9.0, 10.98], [12.0, 14.01], [15.0, 16.75], [18.0, 22.87], [24.0, 28.07], [30.0, 34.38], [35.0, 34.97], [36.0, 36.9], [39.0, 44.69], [46.0, 48.24], [50.0, 52.54], [55.0, 58.26], [59.0, 65.92], [72.0, 73.8], [77.0, 79.57], [83.0, 83.61], [91.0, 91.56], [93.0, 93.07], [99.0, 99.98], [103.0, 126.47], [127.0, 132.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 63.1, 0.0, 98.99, 0.0, 98.51, 74.29, 95.91, 0.0, 0.0, 52.22, 90.25, 98.59, 96.42, 44.99, 0.0, 63.21, 0.0, 0.0, 0.0, 0.0, 96.04, 89.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 62.97], ["hum", 10.74], ["mains hum", 4.2]], null, null, null, null, null, null, null, null], "duration": [1.67, 2.46, 1.98, 2.01, 1.75, 4.87, 4.07, 4.38, -0.03, 0.9, 5.69, 2.24, 2.54, 3.26, 6.92, 1.8, 2.57, 0.61, 0.56, 0.07, 0.98, 23.47, 5.48]} \ No newline at end of file diff --git a/annotations_filtered/hPmV9DBCrfQ_filtered.json b/annotations_filtered/hPmV9DBCrfQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9380e99c4625f4dc835396d90bf7b5e503fb3f15 --- /dev/null +++ b/annotations_filtered/hPmV9DBCrfQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.11], [13.0, 14.88], [16.0, 16.71], [21.0, 21.81], [27.0, 29.0], [32.0, 38.25], [40.0, 45.69], [50.0, 58.33], [60.0, 60.54], [64.0, 64.99], [68.0, 69.63], [73.0, 73.62], [75.0, 75.59], [77.0, 77.85], [79.0, 81.01], [86.0, 95.62], [101.0, 114.79], [116.0, 116.99]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, false, false, true, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.61, 30.62, 30.43, 30.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.48, 29.78, 29.36, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 27.56], ["music", 24.48], ["didgeridoo", 3.19]], [["music", 64.44], ["effects unit", 3.82], ["electronic music", 2.96]], [["music", 68.96], ["throbbing", 5.36], ["electronic music", 3.73]], [["music", 53.11], ["guitar", 4.38], ["musical instrument", 4.06]], null, null, null, null, null, null, [["noise", 14.86], ["mains hum", 13.71], ["hum", 11.69]], [["music", 21.56], ["hum", 21.22], ["mains hum", 7.82]], [["music", 29.94], ["sidetone", 18.4], ["speech", 15.54]], null], "duration": [1.11, 1.88, 0.71, 0.81, 2.0, 6.25, 5.69, 8.33, 0.54, 0.99, 1.63, 0.62, 0.59, 0.85, 2.01, 9.62, 13.79, 0.99]} \ No newline at end of file diff --git a/annotations_filtered/hQCG2AwzTxA_filtered.json b/annotations_filtered/hQCG2AwzTxA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50c6656a10ed95ede4b5fdc75c52817f7d169960 --- /dev/null +++ b/annotations_filtered/hQCG2AwzTxA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.86], [17.0, 30.43], [31.0, 31.67], [33.0, 34.92], [36.0, 37.62], [39.0, 40.1], [41.0, 42.5], [43.0, 43.26], [44.0, 44.76], [46.0, 46.04], [47.0, 48.24], [49.0, 52.69], [53.0, 53.77], [55.0, 55.63], [56.0, 77.99], [79.0, 80.69], [82.0, 82.61], [84.0, 84.43], [87.0, 87.52], [89.0, 90.26], [91.0, 90.78], [92.0, 95.23], [97.0, 97.7], [100.0, 100.55], [102.0, 103.96], [106.0, 108.89], [111.0, 111.1], [111.0, 111.6], [112.0, 114.35], [115.0, 121.27], [122.0, 123.55], [126.0, 126.4], [127.0, 128.14], [129.0, 130.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [38.11, 37.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.62, 0.0, 0.0, 49.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.18, 0.0, 0.0, 0.0, 59.15, 0.0, 0.0, 59.68, 35.41, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 64.89], ["telephone", 14.56], ["sidetone", 12.19]], [["music", 53.74], ["hum", 13.58], ["speech", 8.16]], null, null, null, null, null, null, null, null, null, null, null, null, [["frog", 14.76], ["music", 12.92], ["heart sounds, heartbeat", 12.01]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 50.25], ["theremin", 5.58], ["hum", 4.85]], null, null, null, null], "duration": [3.86, 13.43, 0.67, 1.92, 1.62, 1.1, 1.5, 0.26, 0.76, 0.04, 1.24, 3.69, 0.77, 0.63, 21.99, 1.69, 0.61, 0.43, 0.52, 1.26, -0.22, 3.23, 0.7, 0.55, 1.96, 2.89, 0.1, 0.6, 2.35, 6.27, 1.55, 0.4, 1.14, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/hQD_fanPkns_filtered.json b/annotations_filtered/hQD_fanPkns_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a078c6c7a01f26498ff81b7e2a56b1b963eb08f7 --- /dev/null +++ b/annotations_filtered/hQD_fanPkns_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 22.54], [23.0, 23.11], [30.0, 37.1], [39.0, 45.42], [53.0, 53.3], [54.0, 74.02], [78.0, 78.46], [81.0, 81.58], [82.0, 92.15], [99.0, 101.21], [103.0, 103.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.84, 0.0, 31.22, 31.6, 0.0, 30.83, 0.0, 0.0, 30.76, 37.96, 0.0], "audiomae_on_audioset": [[["music", 59.56], ["speech", 24.36], ["electronic music", 0.91]], null, [["music", 73.22], ["carnatic music", 3.09], ["throbbing", 1.78]], [["music", 82.44], ["electronic music", 1.04], ["musical instrument", 0.94]], null, [["music", 73.02], ["buzz", 3.18], ["musical instrument", 1.97]], null, null, [["music", 54.13], ["speech", 15.25], ["vehicle", 3.99]], [["music", 82.81], ["electronic music", 2.23], ["throbbing", 1.28]], null], "duration": [18.54, 0.11, 7.1, 6.42, 0.3, 20.02, 0.46, 0.58, 10.15, 2.21, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/hQEej75JeUQ_filtered.json b/annotations_filtered/hQEej75JeUQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29712fd0fbcd14f6ba7b881dc53235fddbb23647 --- /dev/null +++ b/annotations_filtered/hQEej75JeUQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.07], [11.0, 11.53], [24.0, 24.76], [26.0, 29.24], [35.0, 39.65], [40.0, 39.7], [40.0, 46.7], [49.0, 49.65], [52.0, 53.6], [55.0, 59.53], [61.0, 68.34]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 30.77, 34.14, 0.0, 59.96, 0.0, 0.0, 40.81, 30.15], "audiomae_on_audioset": [null, null, null, [["speech", 51.31], ["fart", 28.17], ["burping, eructation", 11.22]], [["speech", 79.24], ["fart", 2.54], ["sidetone", 2.12]], null, null, null, null, [["sine wave", 10.13], ["cough", 7.8], ["hiccup", 7.35]], [["speech", 65.76], ["groan", 6.33], ["beatboxing", 5.09]]], "duration": [0.07, 0.53, 0.76, 3.24, 4.65, -0.3, 6.7, 0.65, 1.6, 4.53, 7.34]} \ No newline at end of file diff --git a/annotations_filtered/hQIL99lP484_filtered.json b/annotations_filtered/hQIL99lP484_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2020207d29bffea14deeced76f7b23ef3931d5b3 --- /dev/null +++ b/annotations_filtered/hQIL99lP484_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.74], [19.0, 19.26], [30.0, 31.53], [32.0, 32.27], [38.0, 38.72], [40.0, 40.85], [45.0, 50.08], [52.0, 56.64], [63.0, 63.04], [67.0, 72.52], [76.0, 77.25], [80.0, 80.54], [82.0, 82.56], [84.0, 87.54], [92.0, 99.5], [103.0, 105.38], [106.0, 111.16], [115.0, 124.82], [126.0, 131.68], [132.0, 134.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, true, true], "silence_prob": [90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 55.53, 54.23, 0.0, 70.02, 0.0, 0.0, 0.0, 65.79, 60.6, 45.69, 33.51, 30.5, 35.2, 36.4], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.41], ["speech", 7.85], ["theremin", 5.95]], [["speech", 25.99], ["groan", 23.86], ["music", 18.32]], [["music", 23.68], ["vehicle", 22.56], ["car", 15.98]], [["music", 34.16], ["speech", 15.05], ["livestock, farm animals, working animals", 7.08]], [["moo", 18.41], ["music", 17.97], ["speech", 16.36]]], "duration": [2.74, 0.26, 1.53, 0.27, 0.72, 0.85, 5.08, 4.64, 0.04, 5.52, 1.25, 0.54, 0.56, 3.54, 7.5, 2.38, 5.16, 9.82, 5.68, 2.7]} \ No newline at end of file diff --git a/annotations_filtered/hQL6_NbLwtk_filtered.json b/annotations_filtered/hQL6_NbLwtk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4db775903cfc777ff4fba7a963904543887d25bc --- /dev/null +++ b/annotations_filtered/hQL6_NbLwtk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.37], [14.0, 16.21], [18.0, 18.82], [21.0, 21.25], [24.0, 23.8], [26.0, 25.73], [28.0, 28.81], [35.0, 35.24], [36.0, 36.68], [38.0, 39.95], [42.0, 42.67], [45.0, 45.71], [47.0, 47.7], [49.0, 51.24], [52.0, 53.7], [55.0, 55.53], [57.0, 57.67], [62.0, 69.21], [70.0, 71.63], [73.0, 76.52], [86.0, 86.73], [89.0, 90.66], [92.0, 92.62], [94.0, 94.36], [95.0, 95.28], [97.0, 101.7], [109.0, 109.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 49.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.59, 0.0, 0.0, 0.0, 55.74, 0.0, 31.88, 0.0, 0.0, 0.0, 0.0, 0.0, 35.44, 0.0], "audiomae_on_audioset": [null, [["speech", 50.13], ["sidetone", 19.52], ["hum", 9.14]], null, null, null, null, null, null, null, null, null, null, null, [["noise", 17.31], ["crushing", 16.83], ["dial tone", 12.9]], null, null, null, null, null, [["whack, thwack", 26.59], ["music", 21.64], ["thunk", 6.41]], null, null, null, null, null, [["livestock, farm animals, working animals", 12.9], ["moo", 8.47], ["electric shaver, electric razor", 7.7]], null], "duration": [1.37, 2.21, 0.82, 0.25, -0.2, -0.27, 0.81, 0.24, 0.68, 1.95, 0.67, 0.71, 0.7, 2.24, 1.7, 0.53, 0.67, 7.21, 1.63, 3.52, 0.73, 1.66, 0.62, 0.36, 0.28, 4.7, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/hQUBid6LIPU_filtered.json b/annotations_filtered/hQUBid6LIPU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29b9694a9094fc8eee7b23fd99a393a1398714ef --- /dev/null +++ b/annotations_filtered/hQUBid6LIPU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 32.56], [34.0, 39.11], [42.0, 43.14], [45.0, 48.05], [51.0, 52.71], [54.0, 57.28], [61.0, 62.99], [64.0, 65.92], [66.0, 67.39], [69.0, 71.24], [74.0, 75.81], [78.0, 84.65], [88.0, 89.85], [92.0, 93.85], [96.0, 99.15], [103.0, 105.33], [107.0, 107.0], [109.0, 111.25], [114.0, 115.84], [117.0, 118.2], [119.0, 120.97], [122.0, 127.01], [128.0, 129.32], [130.0, 131.43], [132.0, 134.72], [136.0, 143.01], [143.0, 151.44], [154.0, 154.95], [159.0, 159.46], [160.0, 162.94], [166.0, 167.85], [169.0, 174.93], [177.0, 183.95], [185.0, 188.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 68.41, 0.0, 99.92, 0.0, 79.41, 0.0, 0.0, 0.0, 94.37, 0.0, 86.45, 0.0, 0.0, 99.95, 99.95, 0.0, 99.78, 0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 99.05, 77.2, 93.29, 0.0, 0.0, 56.18, 0.0, 99.96, 99.97, 99.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.56, 5.11, 1.14, 3.05, 1.71, 3.28, 1.99, 1.92, 1.39, 2.24, 1.81, 6.65, 1.85, 1.85, 3.15, 2.33, 0.0, 2.25, 1.84, 1.2, 1.97, 5.01, 1.32, 1.43, 2.72, 7.01, 8.44, 0.95, 0.46, 2.94, 1.85, 5.93, 6.95, 3.3]} \ No newline at end of file diff --git a/annotations_filtered/hQmDmh3qA6s_filtered.json b/annotations_filtered/hQmDmh3qA6s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1569b72b3a07196b9422a8aee332d358e3bdaedc --- /dev/null +++ b/annotations_filtered/hQmDmh3qA6s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 40.24], [42.0, 42.89], [47.0, 47.73], [49.0, 49.92], [54.0, 61.3], [63.0, 76.25], [79.0, 78.97], [82.0, 84.3], [85.0, 85.73], [87.0, 87.49], [89.0, 90.29], [91.0, 91.81], [94.0, 94.91], [100.0, 100.72], [107.0, 107.6], [115.0, 115.89], [117.0, 118.22], [121.0, 126.94], [127.0, 131.46]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [69.88, 0.0, 0.0, 0.0, 50.56, 32.0, 0.0, 38.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.16, 34.31], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 43.24], ["music", 30.16], ["explosion", 5.38]], null, [["speech", 51.27], ["eruption", 4.83], ["hum", 2.5]], null, null, null, null, null, null, null, null, null, [["speech", 92.67], ["fart", 1.61], ["whack, thwack", 0.67]], [["speech", 42.51], ["animal", 15.51], ["dog", 13.35]]], "duration": [5.24, 0.89, 0.73, 0.92, 7.3, 13.25, -0.03, 2.3, 0.73, 0.49, 1.29, 0.81, 0.91, 0.72, 0.6, 0.89, 1.22, 5.94, 4.46]} \ No newline at end of file diff --git a/annotations_filtered/hQogMjsahWU_filtered.json b/annotations_filtered/hQogMjsahWU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8114914c3123bc48f66aac229661a924b82f34d9 --- /dev/null +++ b/annotations_filtered/hQogMjsahWU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.89], [13.0, 14.93], [17.0, 18.4], [24.0, 24.76], [31.0, 33.13], [39.0, 41.86], [46.0, 48.86], [50.0, 52.0], [55.0, 55.66], [59.0, 60.83], [62.0, 63.09], [64.0, 70.51], [73.0, 75.95], [78.0, 78.09], [79.0, 79.57], [86.0, 87.93], [89.0, 90.04], [91.0, 91.52], [92.0, 93.12], [94.0, 95.13], [98.0, 111.38], [115.0, 115.23]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 39.28, 44.52, 70.44, 88.83, 0.0, 0.0, 0.0, 52.68, 45.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.99, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 32.92], ["music", 22.26], ["boing", 3.3]], [["fly, housefly", 25.37], ["insect", 11.26], ["mosquito", 8.89]], null, null, null, null, null, null, [["music", 32.63], ["hum", 6.58], ["creak", 6.02]], null, null, null, null, null, null, null, [["theremin", 11.32], ["music", 9.69], ["speech", 7.86]], null], "duration": [-0.11, 1.93, 1.4, 0.76, 2.13, 2.86, 2.86, 2.0, 0.66, 1.83, 1.09, 6.51, 2.95, 0.09, 0.57, 1.93, 1.04, 0.52, 1.12, 1.13, 13.38, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/hR1XzVQnfqY_filtered.json b/annotations_filtered/hR1XzVQnfqY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b45b1b302ef0fd6e7070363d8cd45b7db8f5a129 --- /dev/null +++ b/annotations_filtered/hR1XzVQnfqY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.56], [14.0, 28.49], [44.0, 46.36], [48.0, 57.0], [60.0, 60.05], [60.0, 65.52], [73.0, 73.33], [76.0, 78.54], [79.0, 80.01], [88.0, 92.47], [95.0, 96.45], [97.0, 103.27], [104.0, 107.06]], "keep_status": [false, false, true, false, false, false, false, true, false, true, false, false, true], "silence_prob": [0.0, 38.05, 31.6, 32.3, 0.0, 35.57, 0.0, 35.22, 0.0, 31.18, 0.0, 52.27, 40.5], "audiomae_on_audioset": [null, [["music", 69.04], ["synthesizer", 8.65], ["musical instrument", 4.8]], [["moo", 16.9], ["fly, housefly", 16.11], ["cattle, bovinae", 12.44]], [["speech", 36.1], ["music", 34.44], ["foghorn", 5.87]], null, [["music", 69.79], ["speech", 6.2], ["musical instrument", 2.81]], null, [["noise", 28.11], ["whale vocalization", 11.19], ["synthesizer", 9.54]], null, [["speech", 46.66], ["siren", 9.59], ["civil defense siren", 7.8]], null, null, [["music", 41.9], ["synthesizer", 10.34], ["speech", 7.42]]], "duration": [0.56, 14.49, 2.36, 9.0, 0.05, 5.52, 0.33, 2.54, 1.01, 4.47, 1.45, 6.27, 3.06]} \ No newline at end of file diff --git a/annotations_filtered/hR4oc1us1aU_filtered.json b/annotations_filtered/hR4oc1us1aU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf6cf1a3c7d574b2362f625a1996c810d812535c --- /dev/null +++ b/annotations_filtered/hR4oc1us1aU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.4], [10.0, 10.02], [10.0, 11.16], [12.0, 12.29], [13.0, 13.39], [24.0, 25.1], [44.0, 44.85], [47.0, 53.03], [54.0, 54.97], [60.0, 61.23], [63.0, 64.66], [67.0, 67.2], [71.0, 71.17], [75.0, 80.28], [90.0, 92.82], [98.0, 101.98], [104.0, 109.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.43, 0.0, 0.0, 0.0, 0.0, 0.0, 31.91, 29.86, 29.52, 29.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["explosion", 45.36], ["speech", 20.66], ["burst, pop", 8.14]], null, null, null, null, null, [["speech", 65.18], ["groan", 5.43], ["music", 5.24]], [["music", 30.61], ["speech", 27.36], ["whack, thwack", 12.88]], [["speech", 37.32], ["explosion", 9.47], ["whack, thwack", 9.06]], [["whack, thwack", 48.64], ["speech", 10.46], ["thunk", 7.69]]], "duration": [0.4, 0.02, 1.16, 0.29, 0.39, 1.1, 0.85, 6.03, 0.97, 1.23, 1.66, 0.2, 0.17, 5.28, 2.82, 3.98, 5.21]} \ No newline at end of file diff --git a/annotations_filtered/hRBRb2eiK4I_filtered.json b/annotations_filtered/hRBRb2eiK4I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..15175b67f8351633749287b1c04ebb32ee09f4e0 --- /dev/null +++ b/annotations_filtered/hRBRb2eiK4I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[65.0, 78.81], [83.0, 90.51], [92.0, 93.11], [94.0, 128.71]], "keep_status": [true, false, false, false], "silence_prob": [32.43, 56.93, 0.0, 0.0], "audiomae_on_audioset": [[["buzz", 24.75], ["speech", 22.49], ["music", 8.22]], null, null, null], "duration": [13.81, 7.51, 1.11, 34.71]} \ No newline at end of file diff --git a/annotations_filtered/hRRvrXxGJjg_filtered.json b/annotations_filtered/hRRvrXxGJjg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4adc482d27a17c8b70ef2be4fc9451fe503ac3ba --- /dev/null +++ b/annotations_filtered/hRRvrXxGJjg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.8], [6.0, 6.98], [10.0, 12.66], [16.0, 16.58], [24.0, 25.08], [26.0, 27.89], [29.0, 30.77], [35.0, 34.82], [35.0, 41.72], [44.0, 45.82], [47.0, 48.95], [51.0, 53.37], [56.0, 62.83], [64.0, 73.36], [78.0, 79.03], [95.0, 99.67], [100.0, 101.88], [105.0, 119.55], [120.0, 122.22], [123.0, 124.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 62.68, 0.0, 0.0, 0.0, 0.0, 0.0, 58.13, 0.0, 0.0, 77.2, 63.53, 65.91, 0.0, 64.75, 0.0, 64.75, 60.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.2, 0.98, 2.66, 0.58, 1.08, 1.89, 1.77, -0.18, 6.72, 1.82, 1.95, 2.37, 6.83, 9.36, 1.03, 4.67, 1.88, 14.55, 2.22, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/hRa-69uBmIw_filtered.json b/annotations_filtered/hRa-69uBmIw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2db607d663d7c2013cea60dd240526559d01df2 --- /dev/null +++ b/annotations_filtered/hRa-69uBmIw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.83], [6.0, 6.66], [57.0, 61.87], [70.0, 71.78], [89.0, 89.38]], "keep_status": [false, false, true, false, false], "silence_prob": [0.0, 0.0, 30.74, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 27.3], ["crowd", 16.94], ["applause", 13.15]], null, null], "duration": [0.83, 0.66, 4.87, 1.78, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/hReFx1kjuIE_filtered.json b/annotations_filtered/hReFx1kjuIE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75e1e470e8c54687e9bc22a72e02ddacd2505f45 --- /dev/null +++ b/annotations_filtered/hReFx1kjuIE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.02], [18.0, 18.13], [19.0, 18.94], [20.0, 38.1], [40.0, 40.63], [42.0, 41.99], [49.0, 51.44], [54.0, 55.27], [57.0, 57.65], [62.0, 70.97], [74.0, 77.79], [83.0, 84.67], [85.0, 85.7], [87.0, 88.72], [95.0, 95.64], [102.0, 105.83], [111.0, 111.45], [117.0, 118.57]], "keep_status": [false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 61.18, 0.0, 0.0, 49.36, 0.0, 0.0, 38.87, 34.82, 0.0, 0.0, 0.0, 0.0, 33.27, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["sidetone", 34.89], ["mains hum", 17.38], ["noise", 15.47]], null, null, [["speech", 22.35], ["sidetone", 16.48], ["noise", 14.24]], [["speech", 23.32], ["music", 13.43], ["mains hum", 8.65]], null, null, null, null, [["fart", 17.56], ["hum", 10.67], ["mains hum", 8.48]], null, null], "duration": [0.02, 0.13, -0.06, 18.1, 0.63, -0.01, 2.44, 1.27, 0.65, 8.97, 3.79, 1.67, 0.7, 1.72, 0.64, 3.83, 0.45, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/hRfF8Kes77E_filtered.json b/annotations_filtered/hRfF8Kes77E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55014348cd1511c261217b2d2c37301f133262cb --- /dev/null +++ b/annotations_filtered/hRfF8Kes77E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.85], [12.0, 19.82], [22.0, 24.73], [25.0, 26.5], [31.0, 32.58], [49.0, 49.13], [49.0, 53.45], [54.0, 54.26], [61.0, 74.44], [77.0, 77.84], [82.0, 83.51], [89.0, 114.47], [115.0, 117.64], [119.0, 119.1], [119.0, 136.61]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, true, true, false, true], "silence_prob": [0.0, 35.76, 31.23, 0.0, 0.0, 0.0, 38.8, 0.0, 33.02, 0.0, 0.0, 32.13, 36.89, 0.0, 44.09], "audiomae_on_audioset": [null, [["music", 18.0], ["whale vocalization", 14.99], ["noise", 10.6]], [["noise", 31.76], ["grunt", 12.71], ["whale vocalization", 12.45]], null, null, null, [["speech", 43.37], ["music", 34.79], ["electronic music", 2.22]], null, [["speech", 51.42], ["music", 23.18], ["noise", 5.15]], null, null, [["music", 26.87], ["buzz", 16.64], ["speech", 7.39]], [["whale vocalization", 11.03], ["music", 10.39], ["mosquito", 5.55]], null, [["music", 49.78], ["electronic music", 9.79], ["ambient music", 4.97]]], "duration": [1.85, 7.82, 2.73, 1.5, 1.58, 0.13, 4.45, 0.26, 13.44, 0.84, 1.51, 25.47, 2.64, 0.1, 17.61]} \ No newline at end of file diff --git a/annotations_filtered/hRg2HEpwD5A_filtered.json b/annotations_filtered/hRg2HEpwD5A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfa6152dfe8dc796de959bc15a842d3f7224073d --- /dev/null +++ b/annotations_filtered/hRg2HEpwD5A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.74], [7.0, 8.46], [9.0, 10.05], [12.0, 12.09], [13.0, 14.49], [16.0, 17.59], [23.0, 49.96], [53.0, 58.06], [64.0, 82.44], [82.0, 82.48], [82.0, 82.51], [83.0, 119.91], [120.0, 120.26], [121.0, 138.69], [139.0, 143.16], [144.0, 150.25], [153.0, 161.5], [163.0, 168.67]], "keep_status": [false, false, false, false, false, false, true, true, true, false, false, false, false, false, true, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.62, 33.14, 30.91, 0.0, 0.0, 0.0, 0.0, 30.78, 30.77, 31.48, 38.94, 57.17], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 50.33], ["whack, thwack", 7.67], ["hum", 4.26]], [["boing", 25.77], ["crowd", 18.94], ["speech", 10.96]], [["music", 27.81], ["whack, thwack", 6.6], ["speech", 3.9]], null, null, null, null, [["music", 56.03], ["speech", 9.94], ["animal", 5.01]], [["vehicle", 34.54], ["motorcycle", 9.94], ["car", 7.87]], [["music", 46.87], ["speech", 7.57], ["explosion", 6.4]], [["sidetone", 26.51], ["noise", 6.58], ["cacophony", 6.44]], null], "duration": [0.74, 1.46, 1.05, 0.09, 1.49, 1.59, 26.96, 5.06, 18.44, 0.48, 0.51, 36.91, 0.26, 17.69, 4.16, 6.25, 8.5, 5.67]} \ No newline at end of file diff --git a/annotations_filtered/hRoE2HRnpkk_filtered.json b/annotations_filtered/hRoE2HRnpkk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25cec8d08fd4b09973f747757bf5c7e9a0d1b64c --- /dev/null +++ b/annotations_filtered/hRoE2HRnpkk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.76], [7.0, 7.53], [9.0, 9.12], [10.0, 10.37], [11.0, 11.94], [18.0, 19.08], [20.0, 20.9], [22.0, 22.62], [24.0, 24.29], [29.0, 29.39], [33.0, 33.71], [34.0, 35.04], [39.0, 40.0], [41.0, 42.28], [45.0, 44.98], [45.0, 46.31], [49.0, 49.37], [53.0, 53.5], [56.0, 56.1], [57.0, 57.96], [59.0, 60.99], [62.0, 62.26], [64.0, 68.4], [69.0, 70.09], [72.0, 71.78], [81.0, 81.82], [83.0, 83.35], [85.0, 86.12], [89.0, 89.43], [90.0, 90.76], [94.0, 94.37], [95.0, 96.57], [100.0, 101.73], [102.0, 102.54], [104.0, 104.28], [105.0, 105.17], [106.0, 106.69], [108.0, 108.62], [109.0, 121.2], [122.0, 124.33], [125.0, 127.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.55, 99.99, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.76, 0.53, 0.12, 0.37, 0.94, 1.08, 0.9, 0.62, 0.29, 0.39, 0.71, 1.04, 1.0, 1.28, -0.02, 1.31, 0.37, 0.5, 0.1, 0.96, 1.99, 0.26, 4.4, 1.09, -0.22, 0.82, 0.35, 1.12, 0.43, 0.76, 0.37, 1.57, 1.73, 0.54, 0.28, 0.17, 0.69, 0.62, 12.2, 2.33, 2.26]} \ No newline at end of file diff --git a/annotations_filtered/hSAx87qd-fs_filtered.json b/annotations_filtered/hSAx87qd-fs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60c50cf0790cfad74b2981f191f4c224e769f124 --- /dev/null +++ b/annotations_filtered/hSAx87qd-fs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.9], [18.0, 19.01], [19.0, 20.41], [26.0, 27.06], [28.0, 30.11], [37.0, 37.89], [45.0, 45.69], [48.0, 47.8], [53.0, 54.06], [56.0, 57.6], [58.0, 58.09], [66.0, 67.76], [70.0, 70.48], [71.0, 71.85], [79.0, 80.35], [84.0, 85.58], [88.0, 97.97], [102.0, 105.34], [107.0, 107.35], [108.0, 109.22], [110.0, 110.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 58.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.64, 51.5, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 45.78], ["speech", 10.92], ["boing", 4.6]], null, null, null, null], "duration": [1.9, 1.01, 1.41, 1.06, 2.11, 0.89, 0.69, -0.2, 1.06, 1.6, 0.09, 1.76, 0.48, 0.85, 1.35, 1.58, 9.97, 3.34, 0.35, 1.22, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/hSBoEivF-hk_filtered.json b/annotations_filtered/hSBoEivF-hk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29b1d0ccbc8f18c31c075b8791df88ba75732a06 --- /dev/null +++ b/annotations_filtered/hSBoEivF-hk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 34.8], [36.0, 36.54], [37.0, 50.85], [52.0, 78.14], [87.0, 89.02], [91.0, 97.34], [99.0, 99.52], [102.0, 103.57], [104.0, 111.18], [111.0, 111.52], [112.0, 114.08], [115.0, 115.3], [116.0, 116.45], [119.0, 122.89], [125.0, 126.45]], "keep_status": [false, false, true, true, true, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 30.44, 30.09, 29.49, 31.37, 0.0, 0.0, 30.55, 0.0, 33.62, 0.0, 0.0, 31.65, 0.0], "audiomae_on_audioset": [null, null, [["music", 29.98], ["buzz", 8.04], ["radio", 5.41]], [["music", 60.45], ["livestock, farm animals, working animals", 4.83], ["moo", 4.44]], [["music", 52.76], ["musical instrument", 6.42], ["trombone", 3.89]], [["music", 32.47], ["brass instrument", 18.27], ["speech", 11.0]], null, null, [["music", 47.31], ["speech", 28.52], ["foghorn", 5.95]], null, [["speech", 14.56], ["music", 13.8], ["moo", 5.78]], null, null, [["music", 70.42], ["theremin", 7.87], ["musical instrument", 6.05]], null], "duration": [30.8, 0.54, 13.85, 26.14, 2.02, 6.34, 0.52, 1.57, 7.18, 0.52, 2.08, 0.3, 0.45, 3.89, 1.45]} \ No newline at end of file diff --git a/annotations_filtered/hSLj5cQaXM8_filtered.json b/annotations_filtered/hSLj5cQaXM8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..369ebefb56e121edc7f8f22ab07ea9c837ccf86e --- /dev/null +++ b/annotations_filtered/hSLj5cQaXM8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.1], [11.0, 25.66], [36.0, 39.61], [40.0, 42.82], [44.0, 54.16], [60.0, 65.85], [66.0, 69.79], [70.0, 73.26], [75.0, 76.62], [77.0, 84.48], [86.0, 105.61], [110.0, 114.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.44, 64.75, 51.23, 60.89, 47.94, 68.28, 54.76, 63.64, 0.0, 93.13, 98.86, 91.13], "audiomae_on_audioset": [null, null, null, null, [["music", 61.6], ["theremin", 9.76], ["synthesizer", 6.81]], null, null, null, null, null, null, null], "duration": [4.1, 14.66, 3.61, 2.82, 10.16, 5.85, 3.79, 3.26, 1.62, 7.48, 19.61, 4.2]} \ No newline at end of file diff --git a/annotations_filtered/hSUo-HJ01kY_filtered.json b/annotations_filtered/hSUo-HJ01kY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc1367b75edf654fd1e8475541bab69fe07c3e80 --- /dev/null +++ b/annotations_filtered/hSUo-HJ01kY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 15.36], [26.0, 26.57], [28.0, 29.54], [34.0, 41.27], [53.0, 54.57], [57.0, 61.91], [67.0, 94.36], [100.0, 101.02], [101.0, 102.74], [109.0, 118.91], [121.0, 124.19], [128.0, 127.9]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [29.63, 0.0, 0.0, 81.0, 0.0, 30.85, 31.0, 0.0, 0.0, 32.93, 99.98, 0.0], "audiomae_on_audioset": [[["music", 41.47], ["hum", 14.19], ["electronic music", 10.8]], null, null, null, null, [["music", 45.56], ["speech", 4.93], ["synthesizer", 3.51]], [["music", 61.52], ["didgeridoo", 7.25], ["electronic music", 5.91]], null, null, [["music", 59.48], ["musical instrument", 7.77], ["speech", 4.27]], null, null], "duration": [6.36, 0.57, 1.54, 7.27, 1.57, 4.91, 27.36, 1.02, 1.74, 9.91, 3.19, -0.1]} \ No newline at end of file diff --git a/annotations_filtered/hSe6p6SLuvI_filtered.json b/annotations_filtered/hSe6p6SLuvI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0715214f2090a45f700a8a93218fb32d8c1d2b85 --- /dev/null +++ b/annotations_filtered/hSe6p6SLuvI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.32], [14.0, 16.41], [17.0, 17.63], [25.0, 26.74], [33.0, 33.52], [36.0, 36.1], [37.0, 37.42], [38.0, 38.97], [40.0, 40.69], [53.0, 54.23], [54.0, 54.6], [61.0, 61.74], [82.0, 82.24], [83.0, 84.18], [88.0, 92.75], [95.0, 95.94], [97.0, 97.01], [98.0, 98.49], [103.0, 103.62], [106.0, 106.98], [108.0, 108.46], [110.0, 110.35], [110.0, 111.62], [117.0, 118.27], [119.0, 119.35], [121.0, 120.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [53.91, 40.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 33.94], ["didgeridoo", 33.89], ["foghorn", 8.43]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 68.92], ["music", 3.93], ["noise", 3.65]], null, null, null, null, null, null, null, null, null, null, null], "duration": [2.32, 2.41, 0.63, 1.74, 0.52, 0.1, 0.42, 0.97, 0.69, 1.23, 0.6, 0.74, 0.24, 1.18, 4.75, 0.94, 0.01, 0.49, 0.62, 0.98, 0.46, 0.35, 1.62, 1.27, 0.35, -0.01]} \ No newline at end of file diff --git a/annotations_filtered/hSgNZ6R5Rbg_filtered.json b/annotations_filtered/hSgNZ6R5Rbg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8a607854f1450e8d85bb5b9fe61401348c41187 --- /dev/null +++ b/annotations_filtered/hSgNZ6R5Rbg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 62.77]], "keep_status": [false], "silence_prob": [31.26], "audiomae_on_audioset": [[["music", 51.55], ["theremin", 23.02], ["speech", 3.11]]], "duration": [14.77]} \ No newline at end of file diff --git a/annotations_filtered/hSvJRk5OH_o_filtered.json b/annotations_filtered/hSvJRk5OH_o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8385f7ef8f55596727b32e470a70f940250d51a1 --- /dev/null +++ b/annotations_filtered/hSvJRk5OH_o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 33.56], [38.0, 38.25], [40.0, 63.46], [65.0, 69.87], [71.0, 73.74], [74.0, 89.68], [91.0, 93.75], [94.0, 100.5], [102.0, 115.72], [120.0, 134.87], [137.0, 137.94], [139.0, 174.33]], "keep_status": [false, false, false, true, true, true, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 28.48, 28.91, 28.37, 28.86, 36.22, 28.64, 28.46, 28.83, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 50.21], ["whip", 15.16], ["whack, thwack", 5.56]], [["explosion", 23.81], ["music", 18.79], ["throbbing", 9.24]], [["speech", 30.42], ["whoosh, swoosh, swish", 18.08], ["sound effect", 9.94]], [["mains hum", 20.32], ["music", 18.92], ["hum", 15.67]], [["hum", 17.66], ["whale vocalization", 8.82], ["mains hum", 8.76]], [["speech", 42.83], ["music", 24.27], ["hum", 7.12]], [["music", 30.05], ["vehicle", 9.0], ["motorcycle", 7.18]], [["horse", 31.73], ["neigh, whinny", 14.96], ["music", 13.24]], null, null], "duration": [32.56, 0.25, 23.46, 4.87, 2.74, 15.68, 2.75, 6.5, 13.72, 14.87, 0.94, 35.33]} \ No newline at end of file diff --git a/annotations_filtered/hSwy6UI-djc_filtered.json b/annotations_filtered/hSwy6UI-djc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04764ad365439523364b528f26e27a9b2bca4463 --- /dev/null +++ b/annotations_filtered/hSwy6UI-djc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.61], [2.0, 2.84], [5.0, 5.98], [9.0, 9.9], [29.0, 33.47], [45.0, 46.3], [65.0, 65.03], [66.0, 66.39], [68.0, 70.75], [71.0, 71.68], [73.0, 74.49], [77.0, 77.11], [78.0, 78.12], [86.0, 86.53], [97.0, 97.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 93.45, 0.0, 0.0, 0.0, 78.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.61, 0.84, 0.98, 0.9, 4.47, 1.3, 0.03, 0.39, 2.75, 0.68, 1.49, 0.11, 0.12, 0.53, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/hTF5JMKgI1I_filtered.json b/annotations_filtered/hTF5JMKgI1I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/hTF5JMKgI1I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/hT_CiaTcnN8_filtered.json b/annotations_filtered/hT_CiaTcnN8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..077a548041060754c53887194022e334d50e2795 --- /dev/null +++ b/annotations_filtered/hT_CiaTcnN8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 22.15], [23.0, 30.0], [30.0, 32.16], [32.0, 33.98], [40.0, 41.59], [48.0, 58.6]], "keep_status": [true, false, false, false, false, true], "silence_prob": [29.99, 28.94, 30.07, 0.0, 0.0, 29.24], "audiomae_on_audioset": [[["music", 36.18], ["speech", 18.08], ["didgeridoo", 11.79]], [["mains hum", 34.1], ["music", 20.53], ["hum", 15.9]], [["music", 43.76], ["speech", 21.93], ["sidetone", 13.01]], null, null, [["speech", 21.27], ["music", 20.28], ["throbbing", 19.16]]], "duration": [11.15, 7.0, 2.16, 1.98, 1.59, 10.6]} \ No newline at end of file diff --git a/annotations_filtered/hT_G4j4nI-8_filtered.json b/annotations_filtered/hT_G4j4nI-8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6ac2f2b38e14c1fb983f32cfb087dad7ddc743e --- /dev/null +++ b/annotations_filtered/hT_G4j4nI-8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.08], [23.0, 25.46], [32.0, 32.66], [45.0, 50.95], [57.0, 60.25]], "keep_status": [false, true, false, true, true], "silence_prob": [0.0, 40.24, 0.0, 32.29, 30.71], "audiomae_on_audioset": [null, [["music", 20.18], ["fart", 9.66], ["speech", 8.36]], null, [["speech", 35.1], ["music", 7.83], ["sidetone", 6.26]], [["crowd", 15.83], ["echo", 11.27], ["cheering", 10.92]]], "duration": [1.08, 2.46, 0.66, 5.95, 3.25]} \ No newline at end of file diff --git a/annotations_filtered/hTpVCu5DzpA_filtered.json b/annotations_filtered/hTpVCu5DzpA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8958d44d8245339b1c83b68cc0de7e61e834dc18 --- /dev/null +++ b/annotations_filtered/hTpVCu5DzpA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 26.62], [28.0, 28.16], [30.0, 30.48], [32.0, 33.57], [35.0, 72.93], [76.0, 78.02], [79.0, 105.61], [106.0, 113.51], [117.0, 118.39], [119.0, 148.76], [150.0, 158.01]], "keep_status": [true, false, false, false, false, true, false, true, false, false, true], "silence_prob": [31.48, 0.0, 0.0, 0.0, 0.0, 31.66, 31.98, 30.83, 0.0, 31.36, 32.9], "audiomae_on_audioset": [[["music", 54.31], ["vehicle", 6.63], ["carnatic music", 4.27]], null, null, null, null, [["music", 48.03], ["throbbing", 11.77], ["roar", 9.11]], [["boing", 77.74], ["music", 12.76], ["cattle, bovinae", 2.38]], [["music", 26.53], ["sidetone", 26.3], ["throbbing", 10.28]], null, [["speech", 41.31], ["music", 27.3], ["throbbing", 4.04]], [["livestock, farm animals, working animals", 38.05], ["cattle, bovinae", 16.28], ["moo", 10.29]]], "duration": [18.62, 0.16, 0.48, 1.57, 37.93, 2.02, 26.61, 7.51, 1.39, 29.76, 8.01]} \ No newline at end of file diff --git a/annotations_filtered/hTzUYt__ogY_filtered.json b/annotations_filtered/hTzUYt__ogY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d248a78efdac0411978a997ff02929cef89816c --- /dev/null +++ b/annotations_filtered/hTzUYt__ogY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 21.57], [22.0, 23.72], [24.0, 24.93]], "keep_status": [false, false, false], "silence_prob": [60.42, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [3.57, 1.72, 0.93]} \ No newline at end of file diff --git a/annotations_filtered/hTzqKlFConk_filtered.json b/annotations_filtered/hTzqKlFConk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef84c919cfd67cdd309a96588aa2d0a89184d0a --- /dev/null +++ b/annotations_filtered/hTzqKlFConk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.99], [29.0, 32.53], [36.0, 36.64], [37.0, 40.0], [44.0, 47.83], [64.0, 65.28], [78.0, 79.27], [90.0, 95.91], [108.0, 115.94]], "keep_status": [false, false, false, true, true, false, false, false, false], "silence_prob": [31.45, 30.78, 0.0, 29.47, 32.18, 0.0, 0.0, 30.59, 30.03], "audiomae_on_audioset": [[["music", 55.52], ["didgeridoo", 10.22], ["musical instrument", 6.15]], [["music", 63.51], ["musical instrument", 12.44], ["theremin", 3.64]], null, [["music", 57.52], ["carnatic music", 7.11], ["foghorn", 4.74]], [["music", 43.79], ["speech", 11.54], ["boing", 9.25]], null, null, [["music", 75.21], ["synthesizer", 4.61], ["musical instrument", 3.13]], [["insect", 25.67], ["fly, housefly", 22.58], ["music", 21.77]]], "duration": [2.99, 3.53, 0.64, 3.0, 3.83, 1.28, 1.27, 5.91, 7.94]} \ No newline at end of file diff --git a/annotations_filtered/hUAGX1IOMr0_filtered.json b/annotations_filtered/hUAGX1IOMr0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d23f5bf6ad8a37b946d96735d692237809ab8764 --- /dev/null +++ b/annotations_filtered/hUAGX1IOMr0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.34], [9.0, 13.66], [14.0, 21.3], [22.0, 22.72], [39.0, 58.02], [60.0, 63.21], [72.0, 72.69], [74.0, 74.78], [77.0, 77.65], [85.0, 86.8], [93.0, 94.15], [108.0, 107.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 73.97, 61.47, 0.0, 31.98, 44.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["synthesizer", 29.27], ["music", 21.1], ["keyboard (musical)", 20.15]], [["speech", 51.06], ["crowd", 9.66], ["applause", 9.58]], null, null, null, null, null, null], "duration": [0.34, 4.66, 7.3, 0.72, 19.02, 3.21, 0.69, 0.78, 0.65, 1.8, 1.15, -0.23]} \ No newline at end of file diff --git a/annotations_filtered/hV2om9YBADI_filtered.json b/annotations_filtered/hV2om9YBADI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8ecbb02817f5b1684dc8e1f4a0abf64dd0263f2 --- /dev/null +++ b/annotations_filtered/hV2om9YBADI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.74], [21.0, 22.82], [23.0, 25.74], [27.0, 31.92], [34.0, 35.14], [41.0, 41.01], [45.0, 46.43], [49.0, 49.03], [54.0, 54.99], [59.0, 59.95], [65.0, 66.06], [67.0, 68.37], [69.0, 70.36], [73.0, 73.26], [74.0, 75.09], [79.0, 79.46], [90.0, 90.02], [91.0, 91.1], [91.0, 92.65], [96.0, 95.88], [97.0, 100.85], [102.0, 103.2], [105.0, 108.03], [111.0, 111.33], [119.0, 121.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.99, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.51, 0.0, 99.99, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.74, 1.82, 2.74, 4.92, 1.14, 0.01, 1.43, 0.03, 0.99, 0.95, 1.06, 1.37, 1.36, 0.26, 1.09, 0.46, 0.02, 0.1, 1.65, -0.12, 3.85, 1.2, 3.03, 0.33, 2.0]} \ No newline at end of file diff --git a/annotations_filtered/hV55sjy1QFI_filtered.json b/annotations_filtered/hV55sjy1QFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ad3e10d5a9ef7d9c98197e1a62304fcfff71208 --- /dev/null +++ b/annotations_filtered/hV55sjy1QFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.5], [6.0, 6.83], [15.0, 17.44], [35.0, 35.8], [36.0, 36.85], [38.0, 44.31], [60.0, 60.54], [65.0, 65.08], [68.0, 69.58], [76.0, 91.32], [94.0, 94.85], [96.0, 96.79], [98.0, 99.1], [103.0, 103.44], [104.0, 108.35], [112.0, 112.67], [122.0, 135.41], [136.0, 138.81], [140.0, 144.85], [146.0, 146.96], [150.0, 154.75], [156.0, 166.18]], "keep_status": [false, false, true, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 29.66, 0.0, 0.0, 28.86, 0.0, 0.0, 0.0, 29.98, 0.0, 0.0, 0.0, 0.0, 34.95, 0.0, 30.67, 34.48, 30.11, 0.0, 30.59, 30.14], "audiomae_on_audioset": [null, null, [["music", 25.73], ["smash, crash", 18.21], ["speech", 14.23]], null, null, [["music", 30.26], ["skidding", 17.45], ["vehicle", 14.04]], null, null, null, [["music", 72.44], ["throbbing", 6.23], ["didgeridoo", 4.95]], null, null, null, null, [["speech", 21.53], ["music", 19.89], ["throbbing", 13.12]], null, [["music", 71.59], ["hum", 6.78], ["speech", 5.89]], [["music", 39.38], ["speech", 22.66], ["throbbing", 8.44]], [["music", 44.92], ["throbbing", 8.31], ["techno", 6.89]], null, [["music", 36.58], ["speech", 18.54], ["throbbing", 16.99]], [["music", 69.53], ["throbbing", 11.0], ["soundtrack music", 3.8]]], "duration": [0.5, 0.83, 2.44, 0.8, 0.85, 6.31, 0.54, 0.08, 1.58, 15.32, 0.85, 0.79, 1.1, 0.44, 4.35, 0.67, 13.41, 2.81, 4.85, 0.96, 4.75, 10.18]} \ No newline at end of file diff --git a/annotations_filtered/hVGl1d8hRBI_filtered.json b/annotations_filtered/hVGl1d8hRBI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..037b537f35d6fc59a5af6ab054e898af30362631 --- /dev/null +++ b/annotations_filtered/hVGl1d8hRBI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.53], [17.0, 72.91]], "keep_status": [false, false], "silence_prob": [29.82, 0.0], "audiomae_on_audioset": [[["speech", 62.59], ["electric shaver, electric razor", 5.5], ["music", 4.9]], null], "duration": [7.53, 55.91]} \ No newline at end of file diff --git a/annotations_filtered/hVQT9mDDeJo_filtered.json b/annotations_filtered/hVQT9mDDeJo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..452b9ba39adc4f1fb8b827367a4d872425cc414f --- /dev/null +++ b/annotations_filtered/hVQT9mDDeJo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.35], [10.0, 12.26], [23.0, 23.01], [27.0, 28.86], [30.0, 30.33], [31.0, 33.51], [39.0, 40.05], [52.0, 52.03], [60.0, 60.72], [64.0, 64.18], [67.0, 67.2], [78.0, 79.0], [87.0, 87.3], [91.0, 91.96], [92.0, 95.23], [98.0, 99.89], [100.0, 100.7], [104.0, 103.64], [104.0, 104.5], [108.0, 109.73], [120.0, 121.15], [133.0, 133.27], [133.0, 133.34], [134.0, 134.15], [136.0, 137.54], [141.0, 140.8], [146.0, 146.87], [150.0, 151.02], [160.0, 160.74]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [43.85, 63.96, 0.0, 0.0, 0.0, 70.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 27.04], ["chirp tone", 25.81], ["throbbing", 13.99]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.35, 2.26, 0.01, 1.86, 0.33, 2.51, 1.05, 0.03, 0.72, 0.18, 0.2, 1.0, 0.3, 0.96, 3.23, 1.89, 0.7, -0.36, 0.5, 1.73, 1.15, 0.27, 0.34, 0.15, 1.54, -0.2, 0.87, 1.02, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/hVZ9AGQL_oo_filtered.json b/annotations_filtered/hVZ9AGQL_oo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3da98c3e784aaa610d5eaefe965bb548b89059ca --- /dev/null +++ b/annotations_filtered/hVZ9AGQL_oo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.65], [26.0, 26.77], [27.0, 27.99], [29.0, 29.78], [32.0, 33.1], [35.0, 34.86], [40.0, 40.0], [41.0, 41.96], [43.0, 44.02], [45.0, 44.83], [45.0, 46.03], [49.0, 51.07], [51.0, 51.81], [52.0, 53.08], [53.0, 54.45], [55.0, 55.7], [57.0, 57.0], [58.0, 58.73], [60.0, 74.51], [95.0, 94.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.08, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.19], ["speech", 25.67], ["guitar", 4.13]], null], "duration": [0.65, 0.77, 0.99, 0.78, 1.1, -0.14, 0.0, 0.96, 1.02, -0.17, 1.03, 2.07, 0.81, 1.08, 1.45, 0.7, 0.0, 0.73, 14.51, -0.31]} \ No newline at end of file diff --git a/annotations_filtered/hVxEoBe1UVg_filtered.json b/annotations_filtered/hVxEoBe1UVg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0f8934cadb3459df287a7307f399907ee2b4a52 --- /dev/null +++ b/annotations_filtered/hVxEoBe1UVg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.08], [5.0, 5.48], [6.0, 6.84], [9.0, 9.63], [11.0, 12.14], [14.0, 14.81], [18.0, 20.06], [27.0, 28.27], [32.0, 32.19], [33.0, 33.79], [35.0, 38.01], [38.0, 41.05], [42.0, 44.44], [46.0, 49.13], [51.0, 52.14], [54.0, 55.78], [57.0, 62.09], [63.0, 65.18], [66.0, 66.95], [69.0, 69.69], [70.0, 71.52], [75.0, 76.03], [77.0, 78.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.9, 0.0, 0.0, 0.0, 37.22, 49.5, 91.98, 91.81, 0.0, 0.0, 58.55, 64.75, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["radio", 42.79], ["electric shaver, electric razor", 11.04], ["speech", 9.52]], [["sidetone", 20.24], ["radio", 17.15], ["hum", 15.11]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.08, 0.48, 0.84, 0.63, 1.14, 0.81, 2.06, 1.27, 0.19, 0.79, 3.01, 3.05, 2.44, 3.13, 1.14, 1.78, 5.09, 2.18, 0.95, 0.69, 1.52, 1.03, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/hW1KqOVCeKw_filtered.json b/annotations_filtered/hW1KqOVCeKw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c8a472d356889a243de2970e35041bb87254240 --- /dev/null +++ b/annotations_filtered/hW1KqOVCeKw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.25], [3.0, 4.29], [6.0, 7.11], [13.0, 14.18], [19.0, 19.03], [22.0, 23.8], [24.0, 24.93], [32.0, 32.41], [34.0, 35.43], [38.0, 38.48], [39.0, 38.7], [40.0, 41.13], [43.0, 49.5], [50.0, 54.85], [55.0, 57.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.83, 86.09, 40.09], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 30.39], ["whale vocalization", 20.06], ["hum", 8.45]]], "duration": [0.25, 1.29, 1.11, 1.18, 0.03, 1.8, 0.93, 0.41, 1.43, 0.48, -0.3, 1.13, 6.5, 4.85, 2.15]} \ No newline at end of file diff --git a/annotations_filtered/hWRG6Oar-aM_filtered.json b/annotations_filtered/hWRG6Oar-aM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fdea72d8965dd01862b17460d45ca11f1d67990b --- /dev/null +++ b/annotations_filtered/hWRG6Oar-aM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 33.51], [34.0, 39.04], [41.0, 43.09], [44.0, 53.91], [54.0, 55.9], [58.0, 58.94], [60.0, 65.99], [66.0, 67.24], [70.0, 72.91], [78.0, 78.27], [79.0, 81.77], [85.0, 96.79], [99.0, 99.44]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [60.7, 38.88, 67.0, 45.08, 0.0, 0.0, 61.97, 0.0, 57.25, 0.0, 29.16, 29.1, 0.0], "audiomae_on_audioset": [null, [["hum", 23.31], ["aircraft", 9.81], ["mains hum", 7.35]], null, [["aircraft", 14.71], ["fixed-wing aircraft, airplane", 11.77], ["hum", 11.43]], null, null, null, null, null, null, [["speech", 63.94], ["music", 8.58], ["vehicle", 2.31]], [["speech", 29.33], ["aircraft", 16.51], ["vehicle", 14.38]], null], "duration": [6.51, 5.04, 2.09, 9.91, 1.9, 0.94, 5.99, 1.24, 2.91, 0.27, 2.77, 11.79, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/hWRJQvuhs9w_filtered.json b/annotations_filtered/hWRJQvuhs9w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ba2503e6cbacc802b40514284bea7859360a368 --- /dev/null +++ b/annotations_filtered/hWRJQvuhs9w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.13], [11.0, 28.78]], "keep_status": [false, true], "silence_prob": [0.0, 34.56], "audiomae_on_audioset": [null, [["hum", 23.98], ["throbbing", 10.55], ["echo", 10.25]]], "duration": [1.13, 17.78]} \ No newline at end of file diff --git a/annotations_filtered/hW_NzisexqU_filtered.json b/annotations_filtered/hW_NzisexqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bdd4e6013a28ad48d41862e7c18db4b2aa653f67 --- /dev/null +++ b/annotations_filtered/hW_NzisexqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.89], [24.0, 24.17], [26.0, 26.62], [50.0, 50.26], [55.0, 55.61], [72.0, 73.28], [86.0, 87.07], [88.0, 94.31], [95.0, 97.23], [123.0, 124.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 0.17, 0.62, 0.26, 0.61, 1.28, 1.07, 6.31, 2.23, 1.46]} \ No newline at end of file diff --git a/annotations_filtered/hX-ezXejcU0_filtered.json b/annotations_filtered/hX-ezXejcU0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..808566eee2af3aeb88e29e43f5ed39783a259f2f --- /dev/null +++ b/annotations_filtered/hX-ezXejcU0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 28.36], [37.0, 38.92], [39.0, 38.96], [39.0, 39.41], [39.0, 78.95], [81.0, 89.88], [90.0, 90.69], [92.0, 92.69], [94.0, 94.74], [97.0, 98.0], [98.0, 155.66]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [29.63, 0.0, 0.0, 0.0, 0.0, 30.48, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 38.6], ["drum", 6.31], ["speech", 5.3]], null, null, null, null, [["music", 23.46], ["boing", 15.11], ["whack, thwack", 13.81]], null, null, null, null, null], "duration": [15.36, 1.92, -0.04, 0.41, 39.95, 8.88, 0.69, 0.69, 0.74, 1.0, 57.66]} \ No newline at end of file diff --git a/annotations_filtered/hX5s15LBHqo_filtered.json b/annotations_filtered/hX5s15LBHqo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58b30ea018e451611a09d0c7e9f0341541524e75 --- /dev/null +++ b/annotations_filtered/hX5s15LBHqo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.74], [16.0, 16.12], [22.0, 22.52], [23.0, 23.35], [34.0, 38.06], [45.0, 45.49], [49.0, 51.06], [52.0, 53.65], [55.0, 56.79], [58.0, 58.23], [59.0, 59.86], [61.0, 62.45], [64.0, 64.96], [82.0, 89.55], [92.0, 93.39], [95.0, 95.47], [107.0, 110.3], [116.0, 121.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 50.26, 0.0, 40.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.07, 0.0, 0.0, 89.9, 32.57], "audiomae_on_audioset": [null, null, null, null, null, null, [["sidetone", 58.05], ["speech", 20.38], ["mains hum", 3.35]], null, null, null, null, null, null, null, null, null, null, [["speech", 15.62], ["music", 13.34], ["livestock, farm animals, working animals", 11.34]]], "duration": [1.74, 0.12, 0.52, 0.35, 4.06, 0.49, 2.06, 1.65, 1.79, 0.23, 0.86, 1.45, 0.96, 7.55, 1.39, 0.47, 3.3, 5.12]} \ No newline at end of file diff --git a/annotations_filtered/hXCaF68sDPU_filtered.json b/annotations_filtered/hXCaF68sDPU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0baae00e1cd4e8ac2e7a563d4e4bef5248ed0d08 --- /dev/null +++ b/annotations_filtered/hXCaF68sDPU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.71], [17.0, 18.27], [22.0, 24.43], [24.0, 24.48], [27.0, 36.73], [38.0, 110.24]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.48, 0.0, 29.41, 0.0], "audiomae_on_audioset": [null, null, [["music", 66.18], ["theremin", 8.89], ["musical instrument", 2.51]], null, [["cattle, bovinae", 37.58], ["moo", 27.33], ["livestock, farm animals, working animals", 21.13]], null], "duration": [-0.29, 1.27, 2.43, 0.48, 9.73, 72.24]} \ No newline at end of file diff --git a/annotations_filtered/hXWDSeVeaAE_filtered.json b/annotations_filtered/hXWDSeVeaAE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b592f64628586f745bedac2a7f622de00e4176b2 --- /dev/null +++ b/annotations_filtered/hXWDSeVeaAE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.6], [53.0, 66.5], [69.0, 69.75], [72.0, 72.35], [74.0, 75.12], [79.0, 79.46], [81.0, 83.64], [85.0, 88.57], [90.0, 91.39], [95.0, 95.66], [98.0, 100.99], [104.0, 104.18], [107.0, 108.48], [114.0, 114.66], [118.0, 118.23], [119.0, 119.6], [126.0, 126.39], [128.0, 128.92], [131.0, 134.57], [135.0, 138.79], [140.0, 143.78]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 78.38, 0.0, 0.0, 0.0, 0.0, 39.91, 49.59, 0.0, 0.0, 53.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.42, 42.84, 54.36], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 42.78], ["speech", 12.56], ["bass guitar", 5.25]], [["music", 35.21], ["speech", 24.24], ["sidetone", 9.27]], null, null, null, null, null, null, null, null, null, null, null, [["music", 50.67], ["speech", 11.37], ["synthesizer", 7.35]], null], "duration": [0.6, 13.5, 0.75, 0.35, 1.12, 0.46, 2.64, 3.57, 1.39, 0.66, 2.99, 0.18, 1.48, 0.66, 0.23, 0.6, 0.39, 0.92, 3.57, 3.79, 3.78]} \ No newline at end of file diff --git a/annotations_filtered/hXce5-f8mkA_filtered.json b/annotations_filtered/hXce5-f8mkA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a4badf752970ae20996083bcdee6287aa28e684 --- /dev/null +++ b/annotations_filtered/hXce5-f8mkA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 21.96], [29.0, 29.39], [31.0, 32.85], [38.0, 39.02], [46.0, 46.09], [46.0, 48.36], [51.0, 59.44], [65.0, 66.18]], "keep_status": [false, false, false, false, false, false, true, false], "silence_prob": [31.66, 0.0, 0.0, 0.0, 0.0, 36.34, 30.63, 0.0], "audiomae_on_audioset": [[["music", 72.01], ["throbbing", 8.88], ["hum", 4.14]], null, null, null, null, [["quack", 32.32], ["music", 22.58], ["duck", 16.98]], [["cattle, bovinae", 24.9], ["livestock, farm animals, working animals", 20.33], ["music", 19.21]], null], "duration": [5.96, 0.39, 1.85, 1.02, 0.09, 2.36, 8.44, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/hYIWCm-Lpj0_filtered.json b/annotations_filtered/hYIWCm-Lpj0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96b28153575eb8c0d9075a2f41262cdf03c27521 --- /dev/null +++ b/annotations_filtered/hYIWCm-Lpj0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.71], [14.0, 19.99], [28.0, 28.83], [32.0, 43.28], [45.0, 45.55], [47.0, 47.75], [51.0, 51.56], [55.0, 55.88], [59.0, 63.78], [69.0, 69.25], [73.0, 76.62], [78.0, 78.81], [80.0, 87.81], [90.0, 90.59], [107.0, 106.83], [112.0, 114.47], [116.0, 117.9], [119.0, 121.34], [126.0, 126.98], [130.0, 130.77], [132.0, 132.02], [134.0, 134.77], [137.0, 137.25], [144.0, 143.75], [150.0, 152.29], [153.0, 154.52], [165.0, 165.82]], "keep_status": [false, true, false, false, false, false, false, false, true, false, true, false, true, false, false, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.92, 0.0, 30.75, 0.0, 0.0, 0.0, 0.0, 29.8, 0.0, 29.92, 0.0, 34.98, 0.0, 0.0, 49.73, 0.0, 46.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.1, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 47.87], ["vehicle", 12.39], ["boat, water vehicle", 2.92]], null, [["speech", 73.62], ["crowd", 2.57], ["horse", 2.46]], null, null, null, null, [["cattle, bovinae", 35.2], ["moo", 15.12], ["speech", 14.59]], null, [["zipper (clothing)", 12.76], ["music", 9.28], ["cacophony", 7.65]], null, [["hum", 26.16], ["noise", 21.96], ["mains hum", 7.98]], null, null, [["hum", 22.96], ["music", 10.83], ["mains hum", 8.11]], null, [["theremin", 19.18], ["music", 17.08], ["speech", 14.24]], null, null, null, null, null, null, null, null, null], "duration": [0.71, 5.99, 0.83, 11.28, 0.55, 0.75, 0.56, 0.88, 4.78, 0.25, 3.62, 0.81, 7.81, 0.59, -0.17, 2.47, 1.9, 2.34, 0.98, 0.77, 0.02, 0.77, 0.25, -0.25, 2.29, 1.52, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/hYNYTcpIDSs_filtered.json b/annotations_filtered/hYNYTcpIDSs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a08e035f197a5e851541774a3bb3671849d484ab --- /dev/null +++ b/annotations_filtered/hYNYTcpIDSs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 11.04], [12.0, 15.6], [17.0, 60.44], [60.0, 60.51], [61.0, 60.74], [61.0, 60.94], [61.0, 63.9], [64.0, 65.55], [66.0, 72.2], [75.0, 89.97], [91.0, 109.9], [111.0, 111.91], [114.0, 115.38], [116.0, 116.68], [119.0, 119.25], [122.0, 123.96], [125.0, 127.3], [129.0, 130.59]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [58.64, 68.54, 0.0, 0.0, 0.0, 0.0, 31.06, 0.0, 31.92, 31.42, 32.32, 0.0, 0.0, 0.0, 0.0, 0.0, 40.24, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["whale vocalization", 41.44], ["didgeridoo", 13.74], ["music", 9.32]], null, [["music", 53.11], ["synthesizer", 6.03], ["hum", 5.62]], [["speech", 54.04], ["music", 14.96], ["hum", 3.12]], [["speech", 54.22], ["music", 12.79], ["sidetone", 5.44]], null, null, null, null, null, [["music", 51.01], ["musical instrument", 2.65], ["speech", 2.11]], null], "duration": [9.04, 3.6, 43.44, 0.51, -0.26, -0.06, 2.9, 1.55, 6.2, 14.97, 18.9, 0.91, 1.38, 0.68, 0.25, 1.96, 2.3, 1.59]} \ No newline at end of file diff --git a/annotations_filtered/hYQIObd_bog_filtered.json b/annotations_filtered/hYQIObd_bog_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6eebf4a23d480735e990b2fe7ccdff41cb69608e --- /dev/null +++ b/annotations_filtered/hYQIObd_bog_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 15.15], [16.0, 17.27], [29.0, 29.69], [32.0, 44.74], [52.0, 62.7], [64.0, 64.62], [65.0, 66.51], [69.0, 69.77], [75.0, 97.77], [98.0, 99.17], [101.0, 104.38], [105.0, 107.49], [111.0, 111.55], [119.0, 125.19], [164.0, 164.44]], "keep_status": [true, false, false, true, true, false, false, false, false, false, true, true, false, false, false], "silence_prob": [31.94, 0.0, 0.0, 31.11, 47.05, 0.0, 0.0, 0.0, 38.98, 0.0, 44.2, 44.43, 0.0, 37.96, 0.0], "audiomae_on_audioset": [[["music", 16.38], ["hum", 12.58], ["sonar", 10.66]], null, null, [["music", 26.64], ["hum", 12.5], ["cacophony", 11.79]], [["hum", 34.86], ["mains hum", 16.17], ["music", 12.44]], null, null, null, [["hum", 47.78], ["throbbing", 17.69], ["music", 8.26]], null, [["music", 28.89], ["glass", 11.29], ["hum", 7.73]], [["music", 43.88], ["ambient music", 8.82], ["hum", 7.33]], null, [["hum", 61.94], ["throbbing", 18.24], ["music", 5.01]], null], "duration": [4.15, 1.27, 0.69, 12.74, 10.7, 0.62, 1.51, 0.77, 22.77, 1.17, 3.38, 2.49, 0.55, 6.19, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/hYq75Gm4UdI_filtered.json b/annotations_filtered/hYq75Gm4UdI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e72545b0abc3f9c9c8d020801cd2b4b34cc5b408 --- /dev/null +++ b/annotations_filtered/hYq75Gm4UdI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.47], [8.0, 8.7], [9.0, 11.21], [13.0, 13.41], [14.0, 19.16], [21.0, 21.1], [24.0, 29.2], [31.0, 31.67], [34.0, 34.3], [37.0, 38.48], [40.0, 40.09], [41.0, 41.66], [56.0, 65.03], [67.0, 67.83], [77.0, 78.6], [83.0, 85.4], [87.0, 88.2], [90.0, 90.68], [93.0, 97.5], [103.0, 103.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 66.27, 0.0, 78.21, 0.0, 54.97, 0.0, 0.0, 0.0, 0.0, 0.0, 55.81, 0.0, 0.0, 93.13, 0.0, 0.0, 58.13, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 0.7, 2.21, 0.41, 5.16, 0.1, 5.2, 0.67, 0.3, 1.48, 0.09, 0.66, 9.03, 0.83, 1.6, 2.4, 1.2, 0.68, 4.5, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/hYvxbtiGvrk_filtered.json b/annotations_filtered/hYvxbtiGvrk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1dc827a8e782c07f5690eac1c3324252f01353bf --- /dev/null +++ b/annotations_filtered/hYvxbtiGvrk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.11], [24.0, 24.44], [26.0, 26.4], [28.0, 29.0], [29.0, 29.66], [30.0, 31.87], [33.0, 44.9], [46.0, 51.04], [53.0, 142.74]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.77, 30.34, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 36.58], ["didgeridoo", 24.67], ["speech", 14.35]], [["music", 63.34], ["speech", 11.99], ["musical instrument", 6.25]], null], "duration": [0.11, 0.44, 0.4, 1.0, 0.66, 1.87, 11.9, 5.04, 89.74]} \ No newline at end of file diff --git a/annotations_filtered/hZ8PfLIc8MI_filtered.json b/annotations_filtered/hZ8PfLIc8MI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b65a723e2fa36beaffcbfc151e17f524312a847b --- /dev/null +++ b/annotations_filtered/hZ8PfLIc8MI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.65], [3.0, 9.32], [14.0, 15.03], [16.0, 16.31], [17.0, 18.39], [19.0, 18.77], [19.0, 21.2], [24.0, 26.77], [30.0, 33.66], [36.0, 37.29], [38.0, 54.45], [55.0, 54.67], [55.0, 54.94], [55.0, 54.99], [55.0, 56.4], [60.0, 60.39], [64.0, 65.64], [73.0, 74.34], [77.0, 79.17], [99.0, 102.76], [104.0, 105.21], [105.0, 105.51], [108.0, 108.57], [110.0, 111.45], [113.0, 113.83], [117.0, 116.61]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 33.77, 0.0, 0.0, 0.0, 0.0, 33.01, 58.72, 45.27, 0.0, 33.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.04, 43.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 12.41], ["door", 11.14], ["crushing", 9.65]], null, null, null, null, [["radio", 22.35], ["sidetone", 15.22], ["fart", 14.29]], null, [["sidetone", 82.88], ["noise", 3.03], ["speech", 2.76]], null, [["speech", 51.31], ["sidetone", 24.08], ["hum", 7.88]], null, null, null, null, null, null, null, [["speech", 22.98], ["grunt", 19.34], ["animal", 4.13]], [["burping, eructation", 16.12], ["speech", 10.9], ["throat clearing", 7.01]], null, null, null, null, null, null], "duration": [0.65, 6.32, 1.03, 0.31, 1.39, -0.23, 2.2, 2.77, 3.66, 1.29, 16.45, -0.33, -0.06, -0.01, 1.4, 0.39, 1.64, 1.34, 2.17, 3.76, 1.21, 0.51, 0.57, 1.45, 0.83, -0.39]} \ No newline at end of file diff --git a/annotations_filtered/hZPz4w3jLXI_filtered.json b/annotations_filtered/hZPz4w3jLXI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..328cf06263ae313c23e526456119047eb0231297 --- /dev/null +++ b/annotations_filtered/hZPz4w3jLXI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.83], [6.0, 6.83], [8.0, 8.65], [14.0, 21.34], [23.0, 24.17], [30.0, 35.45], [38.0, 39.7], [42.0, 42.85], [43.0, 46.89], [47.0, 49.45], [50.0, 50.84], [51.0, 52.3], [55.0, 55.66], [56.0, 56.24], [59.0, 60.03], [64.0, 64.84], [69.0, 74.98], [75.0, 75.02], [76.0, 88.6], [93.0, 93.66], [94.0, 94.31], [95.0, 96.48], [98.0, 99.52], [102.0, 104.01], [106.0, 106.19], [106.0, 114.44], [116.0, 119.03], [122.0, 123.28], [126.0, 127.52], [129.0, 130.0], [131.0, 131.99], [134.0, 135.58], [136.0, 140.09], [141.0, 142.28], [144.0, 144.41], [146.0, 150.03], [153.0, 153.12], [154.0, 154.23]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 58.3, 0.0, 63.53, 0.0, 0.0, 40.55, 40.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.92, 0.0, 36.85, 0.0, 0.0, 0.0, 0.0, 41.44, 0.0, 30.34, 97.83, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 91.13, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["cattle, bovinae", 37.56], ["moo", 21.32], ["livestock, farm animals, working animals", 14.79]], [["speech", 24.41], ["cattle, bovinae", 10.49], ["moo", 9.48]], null, null, null, null, null, null, null, null, [["music", 69.61], ["musical instrument", 5.45], ["effects unit", 2.87]], null, null, null, null, [["speech", 26.01], ["breaking", 19.97], ["smash, crash", 6.83]], null, [["whack, thwack", 10.79], ["livestock, farm animals, working animals", 8.66], ["boing", 8.31]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.83, 0.83, 0.65, 7.34, 1.17, 5.45, 1.7, 0.85, 3.89, 2.45, 0.84, 1.3, 0.66, 0.24, 1.03, 0.84, 5.98, 0.02, 12.6, 0.66, 0.31, 1.48, 1.52, 2.01, 0.19, 8.44, 3.03, 1.28, 1.52, 1.0, 0.99, 1.58, 4.09, 1.28, 0.41, 4.03, 0.12, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/hZdl2FFp0eA_filtered.json b/annotations_filtered/hZdl2FFp0eA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..260a6397a3b4dc51c61c26a93161453e334397ad --- /dev/null +++ b/annotations_filtered/hZdl2FFp0eA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.81], [13.0, 13.61], [16.0, 16.56], [18.0, 20.97], [22.0, 22.62], [25.0, 24.68], [29.0, 31.83], [33.0, 37.1], [41.0, 41.25], [43.0, 44.02], [45.0, 46.68], [52.0, 53.37], [54.0, 54.45], [58.0, 59.05], [61.0, 62.26], [64.0, 67.61], [75.0, 76.1], [81.0, 81.31], [83.0, 83.93], [85.0, 85.31], [87.0, 88.37], [89.0, 89.88], [91.0, 92.25], [95.0, 95.07], [97.0, 97.95], [99.0, 100.7], [102.0, 105.38], [109.0, 110.67], [111.0, 112.01], [113.0, 132.43], [134.0, 134.87], [136.0, 135.87], [138.0, 138.57], [144.0, 144.93], [147.0, 147.63], [149.0, 150.65], [154.0, 154.38], [158.0, 157.71], [166.0, 166.56], [168.0, 168.89], [177.0, 176.54]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 46.68, 0.0, 0.0, 53.28, 41.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.31, 0.0, 0.0, 51.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 27.41], ["synthesizer", 8.63], ["musical instrument", 4.75]], null, null, null, [["music", 31.8], ["synthesizer", 13.7], ["hum", 10.24]], null, null, null, null, null, null, null, [["music", 43.23], ["throbbing", 8.42], ["synthesizer", 6.21]], null, null, null, null, null, null, null, null, null, null, [["music", 36.51], ["hum", 20.06], ["ambient music", 6.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 0.61, 0.56, 2.97, 0.62, -0.32, 2.83, 4.1, 0.25, 1.02, 1.68, 1.37, 0.45, 1.05, 1.26, 3.61, 1.1, 0.31, 0.93, 0.31, 1.37, 0.88, 1.25, 0.07, 0.95, 1.7, 3.38, 1.67, 1.01, 19.43, 0.87, -0.13, 0.57, 0.93, 0.63, 1.65, 0.38, -0.29, 0.56, 0.89, -0.46]} \ No newline at end of file diff --git a/annotations_filtered/hZvud4MnaQ0_filtered.json b/annotations_filtered/hZvud4MnaQ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef73b3da0ce680289af3ae6d1b20e4075e25d89 --- /dev/null +++ b/annotations_filtered/hZvud4MnaQ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.4], [12.0, 11.75], [13.0, 13.19], [16.0, 17.0], [20.0, 20.46], [22.0, 22.92], [26.0, 27.75], [31.0, 33.84], [38.0, 46.9], [47.0, 48.27], [49.0, 49.62], [50.0, 51.24], [58.0, 79.17], [80.0, 82.78], [85.0, 86.12], [88.0, 88.3], [93.0, 96.03], [97.0, 98.32], [99.0, 101.58], [102.0, 102.24], [102.0, 105.56], [106.0, 108.53], [110.0, 114.45], [116.0, 124.19], [125.0, 135.99], [138.0, 143.77], [146.0, 147.16], [149.0, 150.06], [151.0, 151.93]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [29.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.33, 32.35, 0.0, 0.0, 0.0, 28.47, 35.45, 0.0, 0.0, 86.82, 0.0, 98.1, 0.0, 68.67, 87.92, 76.37, 68.02, 63.42, 46.83, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 40.31], ["rumble", 6.58], ["speech", 5.59]], null, null, null, null, null, null, null, [["speech", 70.26], ["music", 12.47], ["breaking", 5.26]], null, null, null, [["hum", 40.87], ["throbbing", 22.56], ["mains hum", 20.06]], [["music", 41.98], ["musical instrument", 8.45], ["ambient music", 6.42]], null, null, null, null, null, null, null, null, null, null, null, [["hum", 23.07], ["music", 20.1], ["speech", 15.23]], null, null, null], "duration": [4.4, -0.25, 0.19, 1.0, 0.46, 0.92, 1.75, 2.84, 8.9, 1.27, 0.62, 1.24, 21.17, 2.78, 1.12, 0.3, 3.03, 1.32, 2.58, 0.24, 3.56, 2.53, 4.45, 8.19, 10.99, 5.77, 1.16, 1.06, 0.93]} \ No newline at end of file diff --git a/annotations_filtered/h_Awe6CI91k_filtered.json b/annotations_filtered/h_Awe6CI91k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e5144ff0096a47b83209584b05c07df74d1e9b40 --- /dev/null +++ b/annotations_filtered/h_Awe6CI91k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.0], [3.0, 3.37], [3.0, 7.1], [10.0, 11.21], [12.0, 13.31], [15.0, 14.74], [15.0, 15.55], [22.0, 22.64], [34.0, 38.43], [42.0, 43.14], [45.0, 45.71], [46.0, 63.48], [70.0, 71.76], [74.0, 75.61], [85.0, 85.45], [87.0, 87.05]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.55, 0.0, 0.0, 0.0, 0.0, 0.0, 31.91, 0.0, 0.0, 34.85, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["moo", 38.14], ["livestock, farm animals, working animals", 30.6], ["cattle, bovinae", 22.66]], null, null, null, null, null, [["music", 26.06], ["cattle, bovinae", 18.28], ["livestock, farm animals, working animals", 17.5]], null, null, [["music", 61.89], ["hum", 6.88], ["theremin", 2.9]], null, null, null, null], "duration": [1.0, 0.37, 4.1, 1.21, 1.31, -0.26, 0.55, 0.64, 4.43, 1.14, 0.71, 17.48, 1.76, 1.61, 0.45, 0.05]} \ No newline at end of file diff --git a/annotations_filtered/h_JeXTLSCQk_filtered.json b/annotations_filtered/h_JeXTLSCQk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fda7d5c946e4b0afa46402afebed02b78548cbd5 --- /dev/null +++ b/annotations_filtered/h_JeXTLSCQk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.99], [10.0, 9.96], [11.0, 11.67], [13.0, 20.56], [21.0, 21.98], [23.0, 23.08], [24.0, 29.39], [30.0, 34.32], [35.0, 36.42], [38.0, 38.62], [41.0, 44.95], [46.0, 47.02], [49.0, 50.85], [55.0, 55.34], [56.0, 56.61], [59.0, 61.4], [76.0, 124.17], [125.0, 129.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 81.89, 0.0, 0.0, 77.2, 100.0, 0.0, 0.0, 97.43, 0.0, 0.0, 0.0, 0.0, 95.64, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.01, -0.04, 0.67, 7.56, 0.98, 0.08, 5.39, 4.32, 1.42, 0.62, 3.95, 1.02, 1.85, 0.34, 0.61, 2.4, 48.17, 4.64]} \ No newline at end of file diff --git a/annotations_filtered/h__j2aPe63w_filtered.json b/annotations_filtered/h__j2aPe63w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c61dcd55366e1d3a0fb499bdc10122f2bb27f9e --- /dev/null +++ b/annotations_filtered/h__j2aPe63w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.11], [5.0, 7.37], [9.0, 9.96], [12.0, 12.43], [15.0, 17.46], [18.0, 31.55], [34.0, 41.17], [42.0, 67.63], [69.0, 98.09]], "keep_status": [false, false, false, false, false, false, true, true, true], "silence_prob": [0.0, 58.3, 0.0, 0.0, 64.63, 51.94, 37.18, 31.97, 34.15], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 24.34], ["mains hum", 20.12], ["hum", 18.57]], [["gong", 34.85], ["speech", 15.37], ["music", 11.44]], [["electric shaver, electric razor", 26.35], ["whack, thwack", 17.32], ["speech", 7.41]]], "duration": [1.11, 2.37, 0.96, 0.43, 2.46, 13.55, 7.17, 25.63, 29.09]} \ No newline at end of file diff --git a/annotations_filtered/h_bUcNjmuSk_filtered.json b/annotations_filtered/h_bUcNjmuSk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..832f130a52e45041d164a0eba85f02dfc57528e6 --- /dev/null +++ b/annotations_filtered/h_bUcNjmuSk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.57], [5.0, 6.54], [8.0, 8.36], [11.0, 13.2], [15.0, 17.68], [19.0, 19.74], [21.0, 21.42], [22.0, 23.04], [25.0, 28.46], [31.0, 30.86], [41.0, 45.3], [46.0, 47.49], [49.0, 49.23], [51.0, 52.29], [59.0, 59.04], [61.0, 61.79], [63.0, 64.72], [67.0, 70.65], [71.0, 80.87], [83.0, 86.54], [88.0, 90.07], [92.0, 93.75], [96.0, 95.82], [99.0, 100.45], [110.0, 114.51], [118.0, 128.8], [129.0, 130.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [91.98, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 99.62, 0.0, 0.0, 0.0, 53.91, 47.7, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["machine gun", 32.83], ["gunshot, gunfire", 13.06], ["speech", 12.36]], null], "duration": [2.57, 1.54, 0.36, 2.2, 2.68, 0.74, 0.42, 1.04, 3.46, -0.14, 4.3, 1.49, 0.23, 1.29, 0.04, 0.79, 1.72, 3.65, 9.87, 3.54, 2.07, 1.75, -0.18, 1.45, 4.51, 10.8, 1.62]} \ No newline at end of file diff --git a/annotations_filtered/h_htCIiCXfE_filtered.json b/annotations_filtered/h_htCIiCXfE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5df03cbbec2a29cec167244de222f5c41cd2984 --- /dev/null +++ b/annotations_filtered/h_htCIiCXfE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.35], [14.0, 13.58], [19.0, 19.38], [24.0, 25.81], [29.0, 28.9], [31.0, 31.83], [35.0, 35.56], [38.0, 38.57], [39.0, 39.83], [41.0, 42.31], [44.0, 44.69], [47.0, 46.8], [50.0, 50.92], [53.0, 53.49], [57.0, 57.3], [58.0, 58.75], [65.0, 66.83], [68.0, 73.58], [76.0, 75.84], [79.0, 79.15], [81.0, 82.16], [87.0, 87.74], [107.0, 107.23], [109.0, 109.22], [112.0, 112.72], [113.0, 113.68], [116.0, 118.2], [120.0, 122.17], [125.0, 125.05], [128.0, 128.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 95.51, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.35, -0.42, 0.38, 1.81, -0.1, 0.83, 0.56, 0.57, 0.83, 1.31, 0.69, -0.2, 0.92, 0.49, 0.3, 0.75, 1.83, 5.58, -0.16, 0.15, 1.16, 0.74, 0.23, 0.22, 0.72, 0.68, 2.2, 2.17, 0.05, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/haX0ACElUQc_filtered.json b/annotations_filtered/haX0ACElUQc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49545b65ffef7d847d7fe29899b5a41a15313706 --- /dev/null +++ b/annotations_filtered/haX0ACElUQc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.22], [16.0, 22.37], [32.0, 33.54], [38.0, 38.1], [39.0, 39.73], [40.0, 40.14], [42.0, 46.43], [50.0, 50.18], [54.0, 54.77], [61.0, 68.35], [71.0, 71.66], [72.0, 73.09], [73.0, 74.49], [75.0, 76.37], [77.0, 84.1], [86.0, 86.86], [88.0, 98.07], [102.0, 103.23]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.44, 0.0, 0.0, 0.0, 0.0, 63.53, 0.0, 0.0, 55.46, 0.0, 0.0, 0.0, 0.0, 38.68, 0.0, 32.37, 0.0], "audiomae_on_audioset": [null, [["speech", 35.92], ["tap", 15.64], ["clapping", 9.87]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.8], ["hum", 30.96], ["mains hum", 15.32]], null, [["hum", 39.68], ["mains hum", 36.23], ["white noise", 3.05]], null], "duration": [0.22, 6.37, 1.54, 0.1, 0.73, 0.14, 4.43, 0.18, 0.77, 7.35, 0.66, 1.09, 1.49, 1.37, 7.1, 0.86, 10.07, 1.23]} \ No newline at end of file diff --git a/annotations_filtered/hajGYP3CLKo_filtered.json b/annotations_filtered/hajGYP3CLKo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..587228439f2a05c9b384a2af9eafeef329490192 --- /dev/null +++ b/annotations_filtered/hajGYP3CLKo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.3], [3.0, 3.35], [4.0, 4.78], [12.0, 12.72], [13.0, 55.93], [60.0, 63.95], [64.0, 64.3], [64.0, 64.34], [64.0, 82.31], [89.0, 92.94], [93.0, 93.11]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 50.02, 0.0, 0.0, 57.4, 36.67, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 34.05], ["speech", 22.69], ["mains hum", 4.68]], null], "duration": [0.3, 0.35, 0.78, 0.72, 42.93, 3.95, 0.3, 0.34, 18.31, 3.94, 0.11]} \ No newline at end of file diff --git a/annotations_filtered/hbDdiPNS3ck_filtered.json b/annotations_filtered/hbDdiPNS3ck_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa4a606c51e3a2f4494e1a3ce782f0bac85aa3c7 --- /dev/null +++ b/annotations_filtered/hbDdiPNS3ck_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.93], [21.0, 28.48], [33.0, 33.42], [36.0, 36.42], [38.0, 38.33], [42.0, 41.96], [46.0, 45.96], [48.0, 49.03], [54.0, 54.6], [56.0, 57.01], [61.0, 60.76]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["whack, thwack", 13.14], ["throbbing", 11.0], ["breaking", 10.86]], null, null, null, null, null, null, null, null, null], "duration": [0.93, 7.48, 0.42, 0.42, 0.33, -0.04, -0.04, 1.03, 0.6, 1.01, -0.24]} \ No newline at end of file diff --git a/annotations_filtered/hc0o1zXNHAg_filtered.json b/annotations_filtered/hc0o1zXNHAg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d49335d1967e48f56b5dd58a9860cbe24b5c583 --- /dev/null +++ b/annotations_filtered/hc0o1zXNHAg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.46], [6.0, 7.48], [9.0, 16.19], [19.0, 21.15], [22.0, 23.08], [24.0, 24.39], [32.0, 32.78], [35.0, 36.61], [37.0, 39.66], [41.0, 44.05], [49.0, 49.1], [51.0, 55.44], [56.0, 58.58], [66.0, 67.34], [70.0, 71.93], [79.0, 80.45], [82.0, 82.31], [88.0, 88.62], [93.0, 94.68], [120.0, 121.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.99, 99.99, 0.0, 0.0, 0.0, 0.0, 100.0, 89.54, 0.0, 96.29, 99.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.46, 1.48, 7.19, 2.15, 1.08, 0.39, 0.78, 1.61, 2.66, 3.05, 0.1, 4.44, 2.58, 1.34, 1.93, 1.45, 0.31, 0.62, 1.68, 1.74]} \ No newline at end of file diff --git a/annotations_filtered/hc51ExPQJcQ_filtered.json b/annotations_filtered/hc51ExPQJcQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e64e09a28002f57b25f942c88075e53f274b8d29 --- /dev/null +++ b/annotations_filtered/hc51ExPQJcQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 23.3], [25.0, 30.96], [31.0, 34.47], [36.0, 38.8]], "keep_status": [false, true, false, false], "silence_prob": [42.76, 32.23, 40.31, 34.1], "audiomae_on_audioset": [[["music", 59.35], ["throbbing", 8.42], ["ambient music", 7.19]], [["music", 50.84], ["hum", 9.0], ["throbbing", 5.72]], [["music", 46.5], ["throbbing", 23.02], ["hum", 15.44]], [["music", 43.7], ["throbbing", 28.16], ["hum", 12.72]]], "duration": [20.3, 5.96, 3.47, 2.8]} \ No newline at end of file diff --git a/annotations_filtered/hcBF8zYH0s0_filtered.json b/annotations_filtered/hcBF8zYH0s0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43d50d562948366898ce37f72a3b0295cd0e9193 --- /dev/null +++ b/annotations_filtered/hcBF8zYH0s0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.73], [6.0, 27.55], [29.0, 30.05], [31.0, 32.17], [33.0, 34.1], [36.0, 35.92], [37.0, 43.87], [48.0, 62.72], [68.0, 67.8], [70.0, 70.34], [76.0, 93.6], [97.0, 112.7], [114.0, 114.52], [116.0, 116.58], [121.0, 124.78]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [50.86, 44.87, 0.0, 0.0, 0.0, 0.0, 36.71, 39.98, 0.0, 0.0, 33.45, 33.05, 0.0, 0.0, 93.13], "audiomae_on_audioset": [null, [["hum", 55.88], ["mains hum", 20.59], ["music", 7.26]], null, null, null, null, [["music", 60.35], ["speech", 9.14], ["hum", 3.23]], [["hum", 27.87], ["music", 25.6], ["mains hum", 14.45]], null, null, [["music", 41.06], ["animal", 6.21], ["hum", 4.43]], [["moo", 30.13], ["cattle, bovinae", 28.24], ["livestock, farm animals, working animals", 26.25]], null, null, null], "duration": [2.73, 21.55, 1.05, 1.17, 1.1, -0.08, 6.87, 14.72, -0.2, 0.34, 17.6, 15.7, 0.52, 0.58, 3.78]} \ No newline at end of file diff --git a/annotations_filtered/hcUVOlbNb30_filtered.json b/annotations_filtered/hcUVOlbNb30_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..433f48d7870854ff5c334f631ee84a4996546e17 --- /dev/null +++ b/annotations_filtered/hcUVOlbNb30_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 14.61], [15.0, 15.74], [18.0, 26.69], [28.0, 39.77], [41.0, 85.45], [86.0, 87.4]], "keep_status": [true, false, true, false, false, false], "silence_prob": [34.18, 0.0, 39.08, 37.21, 0.0, 0.0], "audiomae_on_audioset": [[["music", 23.06], ["whale vocalization", 18.47], ["livestock, farm animals, working animals", 7.74]], null, [["music", 31.83], ["throbbing", 13.8], ["hum", 12.86]], [["music", 34.72], ["speech", 31.14], ["hum", 4.66]], null, null], "duration": [12.61, 0.74, 8.69, 11.77, 44.45, 1.4]} \ No newline at end of file diff --git a/annotations_filtered/hcWY1CYRCsw_filtered.json b/annotations_filtered/hcWY1CYRCsw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37045782e42e9921f4742dab20efd3c717f1cbba --- /dev/null +++ b/annotations_filtered/hcWY1CYRCsw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 37.49], [42.0, 43.09], [48.0, 48.66], [52.0, 68.28], [72.0, 92.25], [94.0, 100.38]], "keep_status": [true, false, false, false, false, false], "silence_prob": [29.41, 0.0, 0.0, 28.87, 31.65, 52.92], "audiomae_on_audioset": [[["music", 42.77], ["synthesizer", 9.65], ["hum", 8.61]], null, null, [["music", 36.64], ["speech", 34.95], ["fart", 2.1]], [["music", 48.54], ["sonar", 17.59], ["synthesizer", 4.04]], null], "duration": [14.49, 1.09, 0.66, 16.28, 20.25, 6.38]} \ No newline at end of file diff --git a/annotations_filtered/hcWo8KXmhLs_filtered.json b/annotations_filtered/hcWo8KXmhLs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d149e0c753d0c80e133b9a773c4dd94e3436e20 --- /dev/null +++ b/annotations_filtered/hcWo8KXmhLs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.53], [6.0, 7.06], [8.0, 8.65], [11.0, 12.16], [13.0, 14.47], [15.0, 17.47], [19.0, 30.84], [38.0, 41.99], [42.0, 42.04], [48.0, 48.29], [49.0, 49.1], [51.0, 51.7], [62.0, 63.66], [66.0, 65.72], [70.0, 69.99], [74.0, 74.31], [90.0, 90.27], [97.0, 97.17], [100.0, 100.52], [104.0, 104.62], [105.0, 105.39], [107.0, 114.86], [120.0, 121.12], [123.0, 123.72], [136.0, 136.48], [138.0, 138.13], [150.0, 151.21], [167.0, 167.7]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 54.83, 33.27, 44.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 35.15], ["speech", 10.56], ["theremin", 10.0]], [["music", 33.99], ["speech", 23.23], ["hum", 6.8]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 1.06, 0.65, 1.16, 1.47, 2.47, 11.84, 3.99, 0.04, 0.29, 0.1, 0.7, 1.66, -0.28, -0.01, 0.31, 0.27, 0.17, 0.52, 0.62, 0.39, 7.86, 1.12, 0.72, 0.48, 0.13, 1.21, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/hcb0vROvmWk_filtered.json b/annotations_filtered/hcb0vROvmWk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e09e8d286fb55c7bf396154fb20c58a128d36d74 --- /dev/null +++ b/annotations_filtered/hcb0vROvmWk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 45.55], [49.0, 50.28], [52.0, 90.44], [92.0, 106.52], [107.0, 107.59]], "keep_status": [false, false, false, true, false], "silence_prob": [30.53, 0.0, 0.0, 38.88, 0.0], "audiomae_on_audioset": [[["music", 56.92], ["boing", 30.71], ["echo", 1.58]], null, null, [["hum", 18.19], ["music", 15.01], ["fly, housefly", 12.62]], null], "duration": [9.55, 1.28, 38.44, 14.52, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/hck3C2VMRzk_filtered.json b/annotations_filtered/hck3C2VMRzk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4aac57e2c000d1a2c4424163fc6b6b5e51917c3 --- /dev/null +++ b/annotations_filtered/hck3C2VMRzk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.13], [10.0, 14.35], [24.0, 25.03], [28.0, 33.27], [41.0, 46.53], [51.0, 57.3], [58.0, 58.75], [71.0, 77.38], [81.0, 81.97], [89.0, 89.11], [99.0, 102.69], [107.0, 121.81], [124.0, 126.66], [127.0, 131.11]], "keep_status": [true, true, false, true, true, true, false, true, false, false, false, true, true, false], "silence_prob": [35.57, 35.16, 0.0, 31.04, 31.02, 30.4, 0.0, 33.14, 0.0, 0.0, 30.53, 30.3, 31.33, 31.06], "audiomae_on_audioset": [[["creak", 25.05], ["music", 9.17], ["smash, crash", 7.1]], [["music", 23.96], ["fly, housefly", 19.43], ["insect", 19.27]], null, [["music", 35.78], ["speech", 30.37], ["fart", 3.27]], [["music", 33.65], ["speech", 20.78], ["throbbing", 10.83]], [["speech", 37.93], ["music", 13.98], ["hum", 9.87]], null, [["music", 43.38], ["fly, housefly", 11.53], ["speech", 4.51]], null, null, [["music", 71.43], ["speech", 12.51], ["scratching (performance technique)", 3.31]], [["music", 48.52], ["tabla", 9.35], ["percussion", 5.9]], [["music", 22.19], ["fly, housefly", 13.33], ["boing", 12.65]], [["music", 58.17], ["thunk", 8.43], ["speech", 5.9]]], "duration": [3.13, 4.35, 1.03, 5.27, 5.53, 6.3, 0.75, 6.38, 0.97, 0.11, 3.69, 14.81, 2.66, 4.11]} \ No newline at end of file diff --git a/annotations_filtered/hcvAwHA7usc_filtered.json b/annotations_filtered/hcvAwHA7usc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7bfc5c9360ff46c3d474a6de6f4e96c9e53795e --- /dev/null +++ b/annotations_filtered/hcvAwHA7usc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.28], [4.0, 5.12], [6.0, 6.0], [7.0, 7.15], [8.0, 8.21], [9.0, 9.34], [11.0, 11.33], [18.0, 18.2], [29.0, 29.0], [31.0, 31.78], [37.0, 39.85], [42.0, 42.3], [48.0, 48.9], [50.0, 52.81], [54.0, 57.47], [61.0, 61.01], [62.0, 62.75], [64.0, 64.61], [73.0, 73.57], [75.0, 75.32], [79.0, 78.98], [80.0, 84.2], [85.0, 85.92], [104.0, 105.02], [106.0, 106.34], [111.0, 110.81], [112.0, 113.05], [114.0, 114.79], [117.0, 117.69], [120.0, 121.15], [124.0, 124.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.28, 0.0, 0.0, 70.58, 94.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.28, 1.12, 0.0, 0.15, 0.21, 0.34, 0.33, 0.2, 0.0, 0.78, 2.85, 0.3, 0.9, 2.81, 3.47, 0.01, 0.75, 0.61, 0.57, 0.32, -0.02, 4.2, 0.92, 1.02, 0.34, -0.19, 1.05, 0.79, 0.69, 1.15, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/hd521kE7f0A_filtered.json b/annotations_filtered/hd521kE7f0A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00aa4a4bbd70d4de051022435163dcab25619213 --- /dev/null +++ b/annotations_filtered/hd521kE7f0A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[75.0, 131.67]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [56.67]} \ No newline at end of file diff --git a/annotations_filtered/hdIXrF34Bz0_filtered.json b/annotations_filtered/hdIXrF34Bz0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..453734dbc0a7d4e4b03c9d53d465c9763bce2d6e --- /dev/null +++ b/annotations_filtered/hdIXrF34Bz0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.48], [10.0, 11.85], [14.0, 14.0], [15.0, 15.7], [19.0, 19.89], [23.0, 23.21], [27.0, 27.14], [33.0, 33.24], [37.0, 36.9], [43.0, 44.04], [45.0, 45.76], [48.0, 48.63], [50.0, 49.99], [52.0, 51.83], [53.0, 53.62], [56.0, 56.64], [58.0, 57.99], [62.0, 61.82], [65.0, 65.72], [68.0, 68.35], [71.0, 71.09], [72.0, 72.84], [82.0, 82.02], [84.0, 84.42], [87.0, 89.24], [91.0, 91.2], [95.0, 95.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.1, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 26.75], ["insect", 20.85], ["mosquito", 9.02]], null, null], "duration": [0.48, 1.85, 0.0, 0.7, 0.89, 0.21, 0.14, 0.24, -0.1, 1.04, 0.76, 0.63, -0.01, -0.17, 0.62, 0.64, -0.01, -0.18, 0.72, 0.35, 0.09, 0.84, 0.02, 0.42, 2.24, 0.2, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/hdQOL2aFufE_filtered.json b/annotations_filtered/hdQOL2aFufE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fdceb9e607de23aa08f9a6d226edc6752af1ab0 --- /dev/null +++ b/annotations_filtered/hdQOL2aFufE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.24], [6.0, 6.99], [12.0, 12.43], [16.0, 16.12], [38.0, 38.42], [54.0, 54.53], [55.0, 55.78], [58.0, 58.82], [63.0, 64.35], [67.0, 67.41], [69.0, 69.2], [71.0, 71.73], [73.0, 73.77], [74.0, 76.4], [78.0, 78.48], [88.0, 88.48], [91.0, 91.57], [98.0, 98.25], [102.0, 102.96], [104.0, 103.87], [105.0, 105.29], [109.0, 109.32], [110.0, 110.98], [113.0, 113.95], [116.0, 115.96], [117.0, 118.62], [122.0, 122.17], [123.0, 124.61], [127.0, 127.92], [132.0, 133.27], [135.0, 136.16], [138.0, 140.78], [143.0, 144.48], [146.0, 147.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, 0.99, 0.43, 0.12, 0.42, 0.53, 0.78, 0.82, 1.35, 0.41, 0.2, 0.73, 0.77, 2.4, 0.48, 0.48, 0.57, 0.25, 0.96, -0.13, 0.29, 0.32, 0.98, 0.95, -0.04, 1.62, 0.17, 1.61, 0.92, 1.27, 1.16, 2.78, 1.48, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/hdVQlYgFRuM_filtered.json b/annotations_filtered/hdVQlYgFRuM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d02b991c500c141af9162168db99e60feeb3073 --- /dev/null +++ b/annotations_filtered/hdVQlYgFRuM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.38], [9.0, 10.89], [18.0, 21.71], [25.0, 25.62], [27.0, 27.63], [29.0, 30.32], [31.0, 32.17], [35.0, 35.19], [37.0, 39.72], [45.0, 46.82], [61.0, 61.79], [64.0, 72.57], [74.0, 91.5], [92.0, 94.93], [100.0, 100.58], [101.0, 101.88], [103.0, 113.27], [114.0, 115.99], [117.0, 118.08], [119.0, 120.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 65.55, 0.0, 0.0, 0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 41.83, 31.86, 56.1, 0.0, 0.0, 34.82, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 79.08], ["musical instrument", 4.51], ["speech", 2.96]], [["music", 71.18], ["didgeridoo", 3.56], ["drum", 2.73]], null, null, null, [["music", 69.83], ["speech", 20.43], ["sidetone", 0.81]], null, null, null], "duration": [0.38, 1.89, 3.71, 0.62, 0.63, 1.32, 1.17, 0.19, 2.72, 1.82, 0.79, 8.57, 17.5, 2.93, 0.58, 0.88, 10.27, 1.99, 1.08, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/hdW1BlDtcyU_filtered.json b/annotations_filtered/hdW1BlDtcyU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f129174cd61013222e92953a76ac73a84c069bfc --- /dev/null +++ b/annotations_filtered/hdW1BlDtcyU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 28.65], [29.0, 30.69], [31.0, 55.12], [67.0, 67.47], [71.0, 79.47], [81.0, 81.63], [83.0, 83.69], [86.0, 87.76], [94.0, 94.2], [97.0, 97.7], [99.0, 108.31], [109.0, 110.35]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.55, 0.0, 36.5, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0], "audiomae_on_audioset": [null, null, [["music", 45.21], ["hum", 10.94], ["speech", 6.7]], null, [["speech", 74.25], ["mains hum", 7.65], ["hum", 2.69]], null, null, null, null, null, null, null], "duration": [0.65, 1.69, 24.12, 0.47, 8.47, 0.63, 0.69, 1.76, 0.2, 0.7, 9.31, 1.35]} \ No newline at end of file diff --git a/annotations_filtered/hdaAD9fxKXA_filtered.json b/annotations_filtered/hdaAD9fxKXA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43f0fb5bf5e640499987e1deafc2336caeb938bf --- /dev/null +++ b/annotations_filtered/hdaAD9fxKXA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 43.26], [63.0, 65.16], [80.0, 80.77], [91.0, 94.29], [100.0, 100.65], [101.0, 102.15], [108.0, 108.43], [110.0, 110.44], [114.0, 115.21]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.6, 0.0, 32.58, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 78.1], ["guitar", 3.66], ["musical instrument", 3.65]], null, [["music", 75.24], ["guitar", 7.63], ["musical instrument", 7.06]], null, null, null, null, null], "duration": [0.26, 2.16, 0.77, 3.29, 0.65, 1.15, 0.43, 0.44, 1.21]} \ No newline at end of file diff --git a/annotations_filtered/hdhW0bChQwg_filtered.json b/annotations_filtered/hdhW0bChQwg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f92e72d8e40be1d1bbbe485a75e8bb321d61d44e --- /dev/null +++ b/annotations_filtered/hdhW0bChQwg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.98], [4.0, 4.89], [6.0, 7.26], [9.0, 9.05], [11.0, 11.28], [14.0, 16.46], [19.0, 20.31], [23.0, 23.31], [25.0, 25.79], [27.0, 27.51], [31.0, 32.76], [34.0, 34.59], [36.0, 37.32], [38.0, 39.78], [41.0, 42.57], [43.0, 44.02], [45.0, 46.16], [47.0, 48.69], [50.0, 51.48], [53.0, 55.32], [59.0, 77.95], [80.0, 103.89], [107.0, 112.8], [115.0, 138.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.07, 39.12, 48.52, 100.0, 99.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.31], ["animal", 12.6], ["cattle, bovinae", 7.81]], [["cattle, bovinae", 16.22], ["speech", 12.79], ["moo", 12.12]], null, null], "duration": [0.98, 0.89, 1.26, 0.05, 0.28, 2.46, 1.31, 0.31, 0.79, 0.51, 1.76, 0.59, 1.32, 1.78, 1.57, 1.02, 1.16, 1.69, 1.48, 2.32, 18.95, 23.89, 5.8, 23.5]} \ No newline at end of file diff --git a/annotations_filtered/hdnrorjl0WM_filtered.json b/annotations_filtered/hdnrorjl0WM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5858776ba293db95241a421df92462f3475a8b13 --- /dev/null +++ b/annotations_filtered/hdnrorjl0WM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 21.68], [23.0, 24.78], [31.0, 32.12], [37.0, 37.94], [42.0, 42.9], [44.0, 47.29], [49.0, 53.05], [54.0, 55.97], [57.0, 57.15], [58.0, 59.88], [61.0, 60.59], [61.0, 60.79], [62.0, 64.12], [65.0, 65.35], [68.0, 69.92], [71.0, 72.45], [77.0, 77.48], [79.0, 84.99], [89.0, 92.06], [95.0, 95.27], [96.0, 96.75], [99.0, 101.31], [105.0, 106.66], [114.0, 115.6], [117.0, 118.79], [121.0, 121.41], [127.0, 130.13], [132.0, 132.71], [137.0, 136.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.8, 0.0, 0.0, 0.0, 0.0, 100.0, 90.25, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.91, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 72.6, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.68, 1.78, 1.12, 0.94, 0.9, 3.29, 4.05, 1.97, 0.15, 1.88, -0.41, -0.21, 2.12, 0.35, 1.92, 1.45, 0.48, 5.99, 3.06, 0.27, 0.75, 2.31, 1.66, 1.6, 1.79, 0.41, 3.13, 0.71, -0.08]} \ No newline at end of file diff --git a/annotations_filtered/hdrvg0jmL8s_filtered.json b/annotations_filtered/hdrvg0jmL8s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f24c2572af69da127ed38b26fe5b1f631f1afd2d --- /dev/null +++ b/annotations_filtered/hdrvg0jmL8s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.79], [13.0, 14.91], [18.0, 21.96], [22.0, 23.3], [24.0, 24.88], [26.0, 27.33], [30.0, 30.77], [33.0, 33.78], [35.0, 36.49], [38.0, 38.5], [40.0, 41.37], [44.0, 44.47], [46.0, 47.06], [47.0, 48.02], [50.0, 50.45], [52.0, 53.03], [55.0, 56.03], [58.0, 61.52], [64.0, 65.08], [68.0, 68.3], [70.0, 71.39], [75.0, 75.36], [76.0, 82.19], [83.0, 84.18], [85.0, 86.0], [87.0, 90.68], [92.0, 100.21], [102.0, 104.38], [105.0, 105.88], [107.0, 108.06], [109.0, 110.46], [112.0, 113.21], [116.0, 117.12], [120.0, 122.45], [124.0, 126.25], [129.0, 129.71], [130.0, 130.08], [132.0, 132.39], [133.0, 133.95], [135.0, 136.8], [139.0, 139.58], [141.0, 141.93], [144.0, 146.06], [151.0, 151.17], [153.0, 153.5], [158.0, 158.92]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 45.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.25, 0.0, 0.0, 0.0, 0.0, 35.8, 0.0, 0.0, 50.41, 41.81, 49.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.94, 37.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.93, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["fly, housefly", 20.07], ["bee, wasp, etc.", 14.59], ["hum", 9.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 25.88], ["applause", 14.8], ["radio", 9.02]], null, null, null, [["hum", 23.93], ["music", 20.48], ["speech", 14.57]], [["music", 51.32], ["didgeridoo", 6.98], ["speech", 6.79]], null, null, null, null, null, [["music", 53.32], ["speech", 19.97], ["hum", 2.44]], [["music", 32.92], ["speech", 25.16], ["musical instrument", 3.21]], null, null, null, null, null, null, null, [["music", 32.13], ["didgeridoo", 28.07], ["fly, housefly", 8.72]], null, null, null], "duration": [0.79, 1.91, 3.96, 1.3, 0.88, 1.33, 0.77, 0.78, 1.49, 0.5, 1.37, 0.47, 1.06, 1.02, 0.45, 1.03, 1.03, 3.52, 1.08, 0.3, 1.39, 0.36, 6.19, 1.18, 1.0, 3.68, 8.21, 2.38, 0.88, 1.06, 1.46, 1.21, 1.12, 2.45, 2.25, 0.71, 0.08, 0.39, 0.95, 1.8, 0.58, 0.93, 2.06, 0.17, 0.5, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/hdt5QAIC81Q_filtered.json b/annotations_filtered/hdt5QAIC81Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5bf6f339693debbfb94c414de1934adbd13724fe --- /dev/null +++ b/annotations_filtered/hdt5QAIC81Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.17], [9.0, 11.84], [14.0, 14.45], [17.0, 17.54], [18.0, 18.52], [20.0, 21.02], [30.0, 38.03], [39.0, 42.03], [44.0, 43.88], [45.0, 47.11], [48.0, 49.62], [51.0, 52.07], [54.0, 54.58], [56.0, 57.92], [60.0, 61.18], [69.0, 70.36], [72.0, 74.65], [76.0, 80.11], [81.0, 82.31], [84.0, 85.55], [89.0, 90.48], [92.0, 93.46], [95.0, 95.17], [97.0, 98.39], [100.0, 101.56], [108.0, 109.63], [111.0, 112.99], [116.0, 118.1], [119.0, 119.69], [123.0, 124.04], [129.0, 133.27], [133.0, 133.3], [133.0, 133.44], [134.0, 133.61], [135.0, 142.92], [144.0, 144.8], [147.0, 149.01], [151.0, 153.42], [155.0, 155.22], [157.0, 158.4], [160.0, 161.3], [163.0, 165.82]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.33, 0.0, 0.0, 0.0, 0.0, 78.89, 81.35, 0.0, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.38, 93.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.52, 0.0, 0.0, 37.74, 0.0, 0.0, 0.0, 88.64, 0.0, 95.91, 99.92, 0.0, 0.0, 0.0, 57.32], "audiomae_on_audioset": [null, [["whip", 20.67], ["whale vocalization", 10.83], ["speech", 5.28]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 10.48], ["crushing", 9.12], ["whack, thwack", 8.44]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.17, 2.84, 0.45, 0.54, 0.52, 1.02, 8.03, 3.03, -0.12, 2.11, 1.62, 1.07, 0.58, 1.92, 1.18, 1.36, 2.65, 4.11, 1.31, 1.55, 1.48, 1.46, 0.17, 1.39, 1.56, 1.63, 1.99, 2.1, 0.69, 1.04, 4.27, 0.3, 0.44, -0.39, 7.92, 0.8, 2.01, 2.42, 0.22, 1.4, 1.3, 2.82]} \ No newline at end of file diff --git a/annotations_filtered/heeS8J_KFt4_filtered.json b/annotations_filtered/heeS8J_KFt4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c06740686c15e33c913619ebf7d4d91a0799612f --- /dev/null +++ b/annotations_filtered/heeS8J_KFt4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.03], [11.0, 11.85], [12.0, 13.39], [20.0, 21.02], [32.0, 31.99], [33.0, 35.09], [44.0, 44.46], [46.0, 58.4], [59.0, 61.53], [62.0, 63.61], [70.0, 70.88], [72.0, 72.47], [73.0, 73.58], [76.0, 76.65], [82.0, 81.94], [82.0, 83.71], [86.0, 86.7], [88.0, 88.62], [90.0, 92.06], [93.0, 94.56], [95.0, 96.28], [98.0, 98.96], [114.0, 115.55], [116.0, 118.79], [121.0, 121.24], [123.0, 124.24], [126.0, 129.64], [130.0, 136.27], [137.0, 139.41], [140.0, 141.51], [144.0, 144.98], [145.0, 146.26], [147.0, 153.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 40.9, 0.0, 57.48, 68.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.34, 0.0, 0.0, 0.0, 0.0, 79.76, 0.0, 0.0, 92.48, 99.21, 97.83, 0.0, 0.0, 0.0, 76.7], "audiomae_on_audioset": [null, null, null, null, null, [["music", 55.13], ["speech", 24.32], ["electronic music", 2.83]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.03, 0.85, 1.39, 1.02, -0.01, 2.09, 0.46, 12.4, 2.53, 1.61, 0.88, 0.47, 0.58, 0.65, -0.06, 1.71, 0.7, 0.62, 2.06, 1.56, 1.28, 0.96, 1.55, 2.79, 0.24, 1.24, 3.64, 6.27, 2.41, 1.51, 0.98, 1.26, 6.42]} \ No newline at end of file diff --git a/annotations_filtered/hf1wQVWs0DA_filtered.json b/annotations_filtered/hf1wQVWs0DA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7d1fd5f0c5c0eac33b5ca51fd1239ba8683aafb --- /dev/null +++ b/annotations_filtered/hf1wQVWs0DA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.59], [4.0, 4.63], [8.0, 8.83], [15.0, 15.13], [18.0, 18.23], [19.0, 20.39], [21.0, 21.17], [23.0, 23.87], [25.0, 25.78], [28.0, 29.79], [31.0, 31.36], [33.0, 33.88], [34.0, 35.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.59, 0.63, 0.83, 0.13, 0.23, 1.39, 0.17, 0.87, 0.78, 1.79, 0.36, 0.88, 1.75]} \ No newline at end of file diff --git a/annotations_filtered/hfKhRRdMrVc_filtered.json b/annotations_filtered/hfKhRRdMrVc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea49870ce8b88c1eaf4b05cf9983ae26271c31a8 --- /dev/null +++ b/annotations_filtered/hfKhRRdMrVc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.64], [10.0, 11.04], [14.0, 19.94], [23.0, 23.73], [25.0, 28.36], [30.0, 32.31], [35.0, 36.53], [38.0, 38.31], [40.0, 42.25], [46.0, 50.23], [53.0, 54.45], [61.0, 62.34], [73.0, 73.21], [75.0, 75.05], [87.0, 87.56], [95.0, 97.51], [98.0, 106.44], [106.0, 106.62], [107.0, 106.91], [108.0, 113.58], [124.0, 124.56], [127.0, 128.73], [130.0, 129.9], [132.0, 132.09], [143.0, 143.45], [144.0, 146.57], [153.0, 153.62], [155.0, 155.46], [157.0, 157.72], [158.0, 158.97], [163.0, 165.79], [175.0, 175.69], [177.0, 178.29], [182.0, 187.22]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.94, 0.0, 100.0, 0.0, 44.18, 75.23, 0.0, 0.0, 49.31, 36.9, 0.0, 0.0, 0.0, 0.0, 0.0, 74.92, 31.16, 0.0, 0.0, 36.77, 0.0, 0.0, 0.0, 0.0, 0.0, 54.9, 0.0, 0.0, 0.0, 0.0, 38.43, 0.0, 0.0, 57.4], "audiomae_on_audioset": [null, null, null, null, [["sine wave", 27.17], ["music", 17.07], ["chirp tone", 15.41]], null, null, null, [["speech", 76.54], ["music", 5.89], ["whale vocalization", 3.27]], [["whale vocalization", 86.23], ["music", 2.79], ["rumble", 1.66]], null, null, null, null, null, null, [["music", 29.47], ["didgeridoo", 14.82], ["sound effect", 8.49]], null, null, [["moo", 22.74], ["livestock, farm animals, working animals", 22.47], ["cattle, bovinae", 20.67]], null, null, null, null, null, null, null, null, null, null, [["speech", 58.27], ["radio", 11.73], ["animal", 5.44]], null, null, null], "duration": [4.64, 1.04, 5.94, 0.73, 3.36, 2.31, 1.53, 0.31, 2.25, 4.23, 1.45, 1.34, 0.21, 0.05, 0.56, 2.51, 8.44, 0.62, -0.09, 5.58, 0.56, 1.73, -0.1, 0.09, 0.45, 2.57, 0.62, 0.46, 0.72, 0.97, 2.79, 0.69, 1.29, 5.22]} \ No newline at end of file diff --git a/annotations_filtered/hfNlv4HLZ5k_filtered.json b/annotations_filtered/hfNlv4HLZ5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1696f38f44983753c248e21a3b1bd5e7b6e6c28e --- /dev/null +++ b/annotations_filtered/hfNlv4HLZ5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.05], [14.0, 15.35], [17.0, 17.88], [19.0, 20.38], [21.0, 22.99], [23.0, 24.21], [28.0, 29.98], [32.0, 33.29], [34.0, 37.71], [38.0, 47.48], [49.0, 51.29], [53.0, 55.09], [56.0, 56.13], [57.0, 57.87], [59.0, 60.35], [63.0, 64.02], [66.0, 67.07], [68.0, 68.86], [70.0, 70.33], [71.0, 72.18], [74.0, 76.03], [77.0, 80.1], [82.0, 83.27], [85.0, 86.9], [87.0, 93.6], [95.0, 96.01]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.95, 50.02, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 98.19, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["dial tone", 44.93], ["busy signal", 9.39], ["speech", 6.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.05, 1.35, 0.88, 1.38, 1.99, 1.21, 1.98, 1.29, 3.71, 9.48, 2.29, 2.09, 0.13, 0.87, 1.35, 1.02, 1.07, 0.86, 0.33, 1.18, 2.03, 3.1, 1.27, 1.9, 6.6, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/hfNvGT9X-7Q_filtered.json b/annotations_filtered/hfNvGT9X-7Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c06e15fa70a84d1786d5831215be2c0e66a702d --- /dev/null +++ b/annotations_filtered/hfNvGT9X-7Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 92.53]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [49.53]} \ No newline at end of file diff --git a/annotations_filtered/hfOL-PefOz4_filtered.json b/annotations_filtered/hfOL-PefOz4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b41a24f66c70636405db53217941d83513b99b3 --- /dev/null +++ b/annotations_filtered/hfOL-PefOz4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.18], [15.0, 15.28], [19.0, 21.03], [23.0, 26.43], [31.0, 33.67], [34.0, 35.45], [36.0, 37.54], [41.0, 56.89], [57.0, 58.26], [60.0, 61.13], [61.0, 61.84], [62.0, 65.99], [67.0, 68.22], [69.0, 70.77], [76.0, 84.59], [87.0, 88.94], [92.0, 93.82], [96.0, 97.51], [101.0, 101.43], [103.0, 102.69], [108.0, 108.63], [112.0, 112.45], [113.0, 172.39], [173.0, 173.15], [173.0, 173.28], [173.0, 178.68]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 86.27, 66.76, 82.61, 0.0, 0.0, 36.07, 0.0, 0.0, 0.0, 40.28, 0.0, 0.0, 30.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 29.37], ["hum", 15.76], ["music", 13.63]], null, null, null, [["speech", 28.33], ["hum", 25.42], ["rumble", 13.24]], null, null, [["music", 35.71], ["speech", 30.95], ["explosion", 6.72]], null, null, null, null, null, null, null, null, null, null, [["mains hum", 25.52], ["hum", 23.33], ["music", 13.34]]], "duration": [0.18, 0.28, 2.03, 3.43, 2.67, 1.45, 1.54, 15.89, 1.26, 1.13, 0.84, 3.99, 1.22, 1.77, 8.59, 1.94, 1.82, 1.51, 0.43, -0.31, 0.63, 0.45, 59.39, 0.15, 0.28, 5.68]} \ No newline at end of file diff --git a/annotations_filtered/hfW-fzTbpRg_filtered.json b/annotations_filtered/hfW-fzTbpRg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..618968d15a4364f11349b75866ba7a985716079f --- /dev/null +++ b/annotations_filtered/hfW-fzTbpRg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 14.28], [15.0, 14.94], [20.0, 40.9], [45.0, 49.42], [52.0, 54.45], [56.0, 59.93], [69.0, 70.63], [72.0, 72.49], [79.0, 81.08], [82.0, 84.74], [90.0, 90.86], [95.0, 107.3], [108.0, 108.45]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [47.43, 0.0, 37.33, 37.82, 52.86, 51.5, 0.0, 0.0, 66.63, 88.64, 0.0, 41.3, 0.0], "audiomae_on_audioset": [[["music", 40.81], ["wind instrument, woodwind instrument", 15.97], ["musical instrument", 9.84]], null, [["music", 68.41], ["theremin", 10.09], ["didgeridoo", 5.03]], [["music", 30.22], ["trombone", 12.56], ["theremin", 11.25]], null, null, null, null, null, null, null, [["speech", 67.94], ["music", 9.69], ["breaking", 3.26]], null], "duration": [6.28, -0.06, 20.9, 4.42, 2.45, 3.93, 1.63, 0.49, 2.08, 2.74, 0.86, 12.3, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/hfufT3MZQm8_filtered.json b/annotations_filtered/hfufT3MZQm8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49723bfaf613f68acd26c10f1fe19fc3d8e57a90 --- /dev/null +++ b/annotations_filtered/hfufT3MZQm8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.26], [17.0, 16.8], [21.0, 24.88], [31.0, 35.18], [37.0, 37.79], [38.0, 39.16], [43.0, 44.34], [46.0, 47.78], [49.0, 49.5], [51.0, 51.75], [66.0, 70.38], [71.0, 73.38], [78.0, 78.44], [80.0, 80.54], [83.0, 84.94], [90.0, 90.1], [92.0, 93.28], [94.0, 95.25], [96.0, 98.17], [101.0, 100.97], [104.0, 105.04], [107.0, 107.57], [108.0, 111.86], [114.0, 115.25], [117.0, 117.31], [120.0, 121.24], [124.0, 125.58], [128.0, 128.7], [132.0, 133.25], [141.0, 146.01], [147.0, 147.82], [149.0, 151.56], [153.0, 153.12], [155.0, 156.76], [158.0, 159.78], [166.0, 169.99], [178.0, 178.07]], "keep_status": [true, false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [32.13, 0.0, 31.94, 32.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.9, 34.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.78, 0.0, 0.0, 0.0, 32.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.53, 0.0, 38.55, 0.0, 0.0, 0.0, 31.94, 0.0], "audiomae_on_audioset": [[["harmonica", 25.59], ["wind instrument, woodwind instrument", 13.59], ["music", 10.97]], null, [["music", 56.67], ["musical instrument", 4.27], ["didgeridoo", 3.06]], [["music", 45.34], ["didgeridoo", 9.46], ["musical instrument", 6.26]], null, null, null, null, null, null, [["sidetone", 38.8], ["music", 24.23], ["speech", 7.27]], [["didgeridoo", 29.2], ["music", 15.33], ["fly, housefly", 9.31]], null, null, null, null, null, null, [["music", 12.2], ["sidetone", 9.26], ["noise", 6.02]], null, null, null, [["music", 49.32], ["boing", 16.32], ["speech", 6.01]], null, null, null, null, null, null, [["speech", 40.82], ["stomach rumble", 8.6], ["fart", 4.72]], null, [["speech", 32.14], ["radio", 13.13], ["frog", 3.32]], null, null, null, [["music", 62.36], ["sidetone", 14.12], ["speech", 2.44]], null], "duration": [3.26, -0.2, 3.88, 4.18, 0.79, 1.16, 1.34, 1.78, 0.5, 0.75, 4.38, 2.38, 0.44, 0.54, 1.94, 0.1, 1.28, 1.25, 2.17, -0.03, 1.04, 0.57, 3.86, 1.25, 0.31, 1.24, 1.58, 0.7, 1.25, 5.01, 0.82, 2.56, 0.12, 1.76, 1.78, 3.99, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/hfzsR-3PLcg_filtered.json b/annotations_filtered/hfzsR-3PLcg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73caf0da8920f660d32f7904eef9886b2a01a46b --- /dev/null +++ b/annotations_filtered/hfzsR-3PLcg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.38], [9.0, 10.03], [12.0, 12.29], [13.0, 14.22], [17.0, 18.84], [20.0, 20.92], [27.0, 33.29], [34.0, 33.88], [35.0, 35.14], [44.0, 45.81], [50.0, 55.0], [60.0, 60.4], [61.0, 63.53], [64.0, 84.65]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.24, 0.0, 0.0, 0.0, 60.51, 0.0, 34.93, 33.36], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 23.62], ["speech", 19.08], ["hum", 11.88]], null, null, null, null, null, [["fart", 80.08], ["music", 6.38], ["musical instrument", 0.97]], [["music", 59.13], ["speech", 19.56], ["musical instrument", 3.1]]], "duration": [0.38, 1.03, 0.29, 1.22, 1.84, 0.92, 6.29, -0.12, 0.14, 1.81, 5.0, 0.4, 2.53, 20.65]} \ No newline at end of file diff --git a/annotations_filtered/hgCr8TOxcCo_filtered.json b/annotations_filtered/hgCr8TOxcCo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e16d0aa10e440d4979f3a958ab2a5223b1d0a6b --- /dev/null +++ b/annotations_filtered/hgCr8TOxcCo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[52.0, 88.94]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [36.94]} \ No newline at end of file diff --git a/annotations_filtered/hgFClV33aH0_filtered.json b/annotations_filtered/hgFClV33aH0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a8e49977d8609db7ab24bbc9b2a5b0bf33aef33 --- /dev/null +++ b/annotations_filtered/hgFClV33aH0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.29], [29.0, 36.0], [37.0, 41.1], [41.0, 44.09], [46.0, 46.63], [49.0, 51.75], [53.0, 53.49], [54.0, 54.77], [56.0, 56.05], [57.0, 57.38], [59.0, 59.85], [60.0, 60.69], [63.0, 64.57], [73.0, 74.01], [79.0, 86.63], [88.0, 90.34]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.8, 81.53, 49.13, 0.0, 37.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 39.98], "audiomae_on_audioset": [null, [["music", 61.84], ["speech", 19.22], ["drum machine", 2.11]], null, [["speech", 55.56], ["sidetone", 16.87], ["music", 6.57]], null, [["speech", 41.27], ["frog", 12.13], ["croak", 9.91]], null, null, null, null, null, null, null, null, null, [["speech", 36.44], ["sidetone", 19.12], ["music", 18.06]]], "duration": [0.29, 7.0, 4.1, 3.09, 0.63, 2.75, 0.49, 0.77, 0.05, 0.38, 0.85, 0.69, 1.57, 1.01, 7.63, 2.34]} \ No newline at end of file diff --git a/annotations_filtered/hgGi1ODlBBo_filtered.json b/annotations_filtered/hgGi1ODlBBo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd74cedc989df879e73ec6e71e88822fcbaf935c --- /dev/null +++ b/annotations_filtered/hgGi1ODlBBo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.5], [12.0, 13.0], [15.0, 16.29], [19.0, 21.56], [23.0, 24.58], [26.0, 27.97], [30.0, 32.71], [34.0, 34.65], [39.0, 43.97], [47.0, 48.78], [51.0, 61.28], [63.0, 67.37], [68.0, 87.76], [88.0, 95.44], [98.0, 144.51]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, true, false, true, false], "silence_prob": [40.28, 0.0, 0.0, 35.35, 0.0, 0.0, 55.6, 0.0, 29.69, 0.0, 28.47, 29.16, 29.05, 28.62, 0.0], "audiomae_on_audioset": [[["coin (dropping)", 67.94], ["music", 12.48], ["breaking", 6.62]], null, null, [["music", 32.63], ["mains hum", 22.35], ["hum", 20.51]], null, null, null, null, [["music", 41.23], ["didgeridoo", 13.99], ["speech", 6.05]], null, [["music", 28.9], ["mains hum", 13.7], ["hum", 12.8]], [["music", 28.97], ["mains hum", 16.52], ["hum", 15.36]], [["music", 52.31], ["speech", 22.87], ["throbbing", 5.77]], [["music", 52.24], ["hum", 6.2], ["mains hum", 5.89]], null], "duration": [5.5, 1.0, 1.29, 2.56, 1.58, 1.97, 2.71, 0.65, 4.97, 1.78, 10.28, 4.37, 19.76, 7.44, 46.51]} \ No newline at end of file diff --git a/annotations_filtered/hgLkypdC6wo_filtered.json b/annotations_filtered/hgLkypdC6wo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca2cccc736f739b937a226b768c7bde417482f2a --- /dev/null +++ b/annotations_filtered/hgLkypdC6wo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 22.57], [23.0, 24.75], [26.0, 38.48], [43.0, 44.58], [45.0, 85.83], [88.0, 91.17], [93.0, 97.44], [98.0, 98.96], [100.0, 100.33], [102.0, 103.57], [107.0, 107.18], [110.0, 109.85], [112.0, 112.77], [113.0, 113.81]], "keep_status": [false, false, true, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [37.74, 0.0, 36.02, 0.0, 0.0, 38.32, 39.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 53.96], ["speech", 19.98], ["sidetone", 4.09]], null, [["music", 46.35], ["speech", 8.35], ["radio", 4.48]], null, null, [["music", 37.33], ["whip", 5.23], ["rattle (instrument)", 5.18]], [["music", 49.94], ["synthesizer", 6.3], ["hum", 5.12]], null, null, null, null, null, null, null], "duration": [16.57, 1.75, 12.48, 1.58, 40.83, 3.17, 4.44, 0.96, 0.33, 1.57, 0.18, -0.15, 0.77, 0.81]} \ No newline at end of file diff --git a/annotations_filtered/hghczTVgav0_filtered.json b/annotations_filtered/hghczTVgav0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..898155b20dcd9808aa35e75a9955173cccf356cb --- /dev/null +++ b/annotations_filtered/hghczTVgav0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.04], [8.0, 10.23], [13.0, 14.52], [15.0, 16.43], [18.0, 19.21], [21.0, 20.95], [21.0, 22.44], [25.0, 25.73], [29.0, 29.08], [33.0, 34.55], [38.0, 39.65], [42.0, 42.8], [45.0, 45.5], [46.0, 47.04], [48.0, 48.14], [53.0, 54.08], [55.0, 56.67], [58.0, 59.31], [61.0, 63.05], [64.0, 65.69], [66.0, 67.0], [68.0, 68.55], [70.0, 69.87], [73.0, 85.53], [86.0, 93.39], [94.0, 94.51], [96.0, 98.44], [101.0, 103.69], [105.0, 105.26], [108.0, 108.62], [109.0, 109.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, true, false, false, false], "silence_prob": [0.0, 72.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.37, 0.0, 0.0, 0.0, 0.0, 39.64, 37.95, 0.0, 44.49, 36.27, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 35.09], ["sidetone", 22.1], ["speech", 8.58]], [["speech", 42.35], ["music", 6.57], ["beatboxing", 4.14]], null, [["chirp tone", 12.19], ["noise", 10.38], ["hum", 9.77]], [["whip", 16.02], ["explosion", 15.01], ["hum", 6.87]], null, null, null], "duration": [1.04, 2.23, 1.52, 1.43, 1.21, -0.05, 1.44, 0.73, 0.08, 1.55, 1.65, 0.8, 0.5, 1.04, 0.14, 1.08, 1.67, 1.31, 2.05, 1.69, 1.0, 0.55, -0.13, 12.53, 7.39, 0.51, 2.44, 2.69, 0.26, 0.62, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/hgqJjr7pBa0_filtered.json b/annotations_filtered/hgqJjr7pBa0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1f2bd388d8350c01e91e2bf983aa09dcaaf2574 --- /dev/null +++ b/annotations_filtered/hgqJjr7pBa0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.56], [8.0, 7.57], [11.0, 11.04], [16.0, 16.06], [27.0, 30.97], [31.0, 33.79], [35.0, 39.56], [40.0, 41.64], [42.0, 43.92], [46.0, 46.04], [48.0, 48.69], [50.0, 53.5], [55.0, 55.41], [56.0, 66.97], [69.0, 70.68], [71.0, 72.01], [73.0, 74.22], [77.0, 78.43], [84.0, 84.99], [86.0, 87.69], [88.0, 89.04], [97.0, 97.55], [99.0, 110.02], [111.0, 111.16], [112.0, 129.05], [130.0, 131.53]], "keep_status": [true, false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [32.23, 0.0, 0.0, 0.0, 32.81, 36.18, 36.77, 0.0, 0.0, 0.0, 0.0, 43.05, 0.0, 32.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.1, 0.0, 29.65, 0.0], "audiomae_on_audioset": [[["speech", 20.83], ["music", 16.84], ["didgeridoo", 13.91]], null, null, null, [["hum", 28.64], ["mains hum", 15.4], ["speech", 14.98]], [["speech", 64.93], ["mains hum", 8.5], ["hum", 6.86]], [["speech", 17.91], ["hum", 11.94], ["mains hum", 11.26]], null, null, null, null, [["music", 43.62], ["didgeridoo", 13.7], ["musical instrument", 5.44]], null, [["speech", 37.34], ["music", 35.46], ["electronic music", 2.31]], null, null, null, null, null, null, null, null, [["music", 47.06], ["scary music", 13.23], ["ambient music", 9.0]], null, [["hum", 38.96], ["throbbing", 35.1], ["mains hum", 9.27]], null], "duration": [2.56, -0.43, 0.04, 0.06, 3.97, 2.79, 4.56, 1.64, 1.92, 0.04, 0.69, 3.5, 0.41, 10.97, 1.68, 1.01, 1.22, 1.43, 0.99, 1.69, 1.04, 0.55, 11.02, 0.16, 17.05, 1.53]} \ No newline at end of file diff --git a/annotations_filtered/hgzSTQiMxj4_filtered.json b/annotations_filtered/hgzSTQiMxj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1816883ffcad42e6bf9b9c5b0d74043eae261918 --- /dev/null +++ b/annotations_filtered/hgzSTQiMxj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.5], [14.0, 15.11], [17.0, 17.19], [22.0, 24.85], [28.0, 27.94], [30.0, 31.4], [34.0, 34.25], [38.0, 38.82], [43.0, 44.58], [70.0, 73.95], [74.0, 82.24], [83.0, 85.48], [87.0, 89.94], [90.0, 91.34], [92.0, 92.2], [99.0, 103.57]], "keep_status": [true, false, false, true, false, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [32.48, 0.0, 0.0, 44.29, 0.0, 0.0, 0.0, 0.0, 0.0, 31.6, 33.53, 77.03, 85.35, 0.0, 0.0, 74.6], "audiomae_on_audioset": [[["mains hum", 31.01], ["speech", 21.08], ["hum", 15.64]], null, null, [["electric shaver, electric razor", 36.25], ["speech", 14.97], ["noise", 9.51]], null, null, null, null, null, [["livestock, farm animals, working animals", 25.89], ["animal", 20.52], ["domestic animals, pets", 14.15]], [["speech", 23.25], ["insect", 18.6], ["fly, housefly", 14.29]], null, null, null, null, null], "duration": [5.5, 1.11, 0.19, 2.85, -0.06, 1.4, 0.25, 0.82, 1.58, 3.95, 8.24, 2.48, 2.94, 1.34, 0.2, 4.57]} \ No newline at end of file diff --git a/annotations_filtered/hh5iOitreQ8_filtered.json b/annotations_filtered/hh5iOitreQ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b61da0b5ac2f70aea3ad6828c33492b372b4703 --- /dev/null +++ b/annotations_filtered/hh5iOitreQ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 24.33], [35.0, 35.9], [40.0, 47.16], [48.0, 50.03], [54.0, 81.13], [82.0, 82.49], [85.0, 84.96], [87.0, 87.51], [90.0, 90.46], [95.0, 97.87], [99.0, 100.38], [101.0, 103.89], [108.0, 108.53], [109.0, 110.03], [113.0, 113.59], [114.0, 114.47], [118.0, 133.69], [134.0, 142.06]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [31.74, 0.0, 31.24, 34.68, 31.15, 0.0, 0.0, 0.0, 0.0, 31.5, 0.0, 30.22, 0.0, 0.0, 0.0, 0.0, 31.04, 31.18], "audiomae_on_audioset": [[["music", 59.1], ["musical instrument", 14.44], ["didgeridoo", 8.28]], null, [["music", 72.05], ["musical instrument", 6.71], ["theremin", 4.35]], [["music", 78.48], ["didgeridoo", 6.8], ["musical instrument", 5.03]], [["music", 39.92], ["trombone", 24.58], ["brass instrument", 17.01]], null, null, null, null, [["music", 46.24], ["theremin", 9.29], ["musical instrument", 4.41]], null, [["theremin", 62.59], ["music", 28.46], ["musical instrument", 1.58]], null, null, null, null, [["music", 55.85], ["noise", 6.57], ["musical instrument", 5.62]], [["music", 42.5], ["didgeridoo", 23.36], ["trombone", 4.68]]], "duration": [20.33, 0.9, 7.16, 2.03, 27.13, 0.49, -0.04, 0.51, 0.46, 2.87, 1.38, 2.89, 0.53, 1.03, 0.59, 0.47, 15.69, 8.06]} \ No newline at end of file diff --git a/annotations_filtered/hhGWxqj_bC0_filtered.json b/annotations_filtered/hhGWxqj_bC0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38c2668f19d377421d8c5383e3042035726d6704 --- /dev/null +++ b/annotations_filtered/hhGWxqj_bC0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.45], [17.0, 25.12], [27.0, 27.65], [31.0, 33.47], [34.0, 35.38], [36.0, 38.45], [40.0, 40.69], [44.0, 64.67], [66.0, 105.02]], "keep_status": [false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 61.27, 0.0, 97.54, 0.0, 99.71, 0.0, 30.22, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 13.88], ["mains hum", 8.55], ["vehicle", 8.48]], null], "duration": [0.45, 8.12, 0.65, 2.47, 1.38, 2.45, 0.69, 20.67, 39.02]} \ No newline at end of file diff --git a/annotations_filtered/hhRIhD6BvMo_filtered.json b/annotations_filtered/hhRIhD6BvMo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94ed24f7a07577925032c5d410cd53e8a29fbe1d --- /dev/null +++ b/annotations_filtered/hhRIhD6BvMo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.1], [3.0, 4.72], [6.0, 8.01], [13.0, 13.41], [20.0, 21.81], [25.0, 25.91], [29.0, 30.82], [31.0, 31.06], [31.0, 33.52], [38.0, 38.8], [44.0, 43.73], [47.0, 48.24], [60.0, 60.45], [61.0, 64.74], [65.0, 64.84], [65.0, 64.88], [65.0, 65.01], [65.0, 65.04], [65.0, 65.08], [66.0, 69.5], [73.0, 74.33], [79.0, 79.54], [80.0, 80.15], [87.0, 87.1], [87.0, 87.69], [91.0, 94.04], [96.0, 96.31], [97.0, 98.66], [105.0, 106.14], [108.0, 110.57], [112.0, 113.7], [117.0, 119.6], [122.0, 124.34], [125.0, 128.06], [132.0, 132.76], [133.0, 139.75], [143.0, 144.22], [146.0, 150.38], [151.0, 151.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 52.74, 0.0, 0.0, 0.0, 0.0, 0.0, 59.68, 0.0, 0.0, 0.0, 0.0, 58.89, 0.0, 0.0, 0.0, 0.0, 0.0, 72.01, 0.0, 0.0, 0.0, 0.0, 0.0, 64.63, 0.0, 0.0, 0.0, 52.39, 0.0, 83.7, 73.36, 71.87, 0.0, 31.99, 0.0, 34.06, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.85], ["double bass", 21.23], ["cello", 16.04]], null, [["music", 32.41], ["bee, wasp, etc.", 10.7], ["fly, housefly", 9.25]], null], "duration": [1.1, 1.72, 2.01, 0.41, 1.81, 0.91, 1.82, 0.06, 2.52, 0.8, -0.27, 1.24, 0.45, 3.74, -0.16, -0.12, 0.01, 0.04, 0.08, 3.5, 1.33, 0.54, 0.15, 0.1, 0.69, 3.04, 0.31, 1.66, 1.14, 2.57, 1.7, 2.6, 2.34, 3.06, 0.76, 6.75, 1.22, 4.38, 0.06]} \ No newline at end of file diff --git a/annotations_filtered/hhmPqQpJWks_filtered.json b/annotations_filtered/hhmPqQpJWks_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70ccd3dfd76ca89cbbbdaaaef910f5eb1fd13c7d --- /dev/null +++ b/annotations_filtered/hhmPqQpJWks_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.26], [20.0, 20.43], [23.0, 23.36], [25.0, 25.39], [29.0, 36.1], [41.0, 41.93], [45.0, 45.03], [45.0, 47.63], [55.0, 55.81], [60.0, 60.57], [67.0, 68.96], [73.0, 73.38], [74.0, 75.39], [78.0, 78.88], [80.0, 80.86], [108.0, 112.04], [112.0, 113.1], [119.0, 120.56], [122.0, 123.09], [123.0, 124.98], [125.0, 127.94], [128.0, 130.5]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 37.17, 0.0, 0.0, 49.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.09, 0.0, 0.0, 0.0, 0.0, 84.43, 57.72], "audiomae_on_audioset": [null, null, null, null, [["thump, thud", 23.04], ["throbbing", 14.0], ["whack, thwack", 10.4]], null, null, [["speech", 27.38], ["bee, wasp, etc.", 8.44], ["fly, housefly", 7.5]], null, null, null, null, null, null, null, [["speech", 66.53], ["noise", 7.52], ["sidetone", 4.39]], null, null, null, null, null, null], "duration": [0.26, 0.43, 0.36, 0.39, 7.1, 0.93, 0.03, 2.63, 0.81, 0.57, 1.96, 0.38, 1.39, 0.88, 0.86, 4.04, 1.1, 1.56, 1.09, 1.98, 2.94, 2.5]} \ No newline at end of file diff --git a/annotations_filtered/hiHZWeeoEUg_filtered.json b/annotations_filtered/hiHZWeeoEUg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5d5429b81d508df3abb2da83069f57cd899196a --- /dev/null +++ b/annotations_filtered/hiHZWeeoEUg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.56], [7.0, 13.71], [15.0, 15.16], [15.0, 18.45], [20.0, 20.58], [23.0, 23.04], [30.0, 29.94], [33.0, 33.57], [38.0, 38.62], [42.0, 43.24], [46.0, 46.84], [48.0, 48.14], [53.0, 54.65], [56.0, 56.37], [59.0, 59.76], [63.0, 64.25], [67.0, 67.85], [70.0, 85.82], [87.0, 96.28], [103.0, 107.57], [110.0, 111.01], [112.0, 117.48], [118.0, 118.03], [120.0, 140.14], [144.0, 146.48]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 34.02, 0.0, 38.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.26, 31.86, 31.39, 0.0, 31.62, 0.0, 28.52, 28.52], "audiomae_on_audioset": [null, [["sidetone", 34.47], ["music", 14.29], ["hum", 13.17]], null, [["music", 52.98], ["speech", 6.35], ["theremin", 5.34]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.3], ["speech", 20.75], ["throbbing", 13.5]], [["music", 28.63], ["livestock, farm animals, working animals", 13.43], ["cattle, bovinae", 13.02]], [["theremin", 46.47], ["music", 25.9], ["musical instrument", 5.41]], null, [["music", 63.94], ["trombone", 8.36], ["brass instrument", 6.84]], null, [["speech", 38.16], ["music", 33.42], ["explosion", 6.41]], [["speech", 31.49], ["music", 25.87], ["sound effect", 4.72]]], "duration": [0.56, 6.71, 0.16, 3.45, 0.58, 0.04, -0.06, 0.57, 0.62, 1.24, 0.84, 0.14, 1.65, 0.37, 0.76, 1.25, 0.85, 15.82, 9.28, 4.57, 1.01, 5.48, 0.03, 20.14, 2.48]} \ No newline at end of file diff --git a/annotations_filtered/hiREoiox0Tw_filtered.json b/annotations_filtered/hiREoiox0Tw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..385fddd93041be124207a89a7250d102ab73a478 --- /dev/null +++ b/annotations_filtered/hiREoiox0Tw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.75], [4.0, 4.6], [9.0, 11.7], [18.0, 19.6], [22.0, 25.0], [26.0, 27.01], [38.0, 47.06], [48.0, 50.06], [51.0, 59.19], [60.0, 93.93], [95.0, 97.01], [104.0, 105.44], [106.0, 107.47], [109.0, 109.9], [111.0, 111.94], [113.0, 117.02], [122.0, 122.96], [124.0, 125.93], [127.0, 128.09], [128.0, 129.17], [130.0, 130.44], [131.0, 133.56], [135.0, 135.99], [138.0, 144.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 56.03, 0.0, 79.07, 0.0, 85.72, 99.73, 95.37, 0.0, 99.82, 0.0, 0.0, 0.0, 0.0, 87.74, 0.0, 0.0, 0.0, 0.0, 0.0, 52.1, 0.0, 98.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.75, 0.6, 2.7, 1.6, 3.0, 1.01, 9.06, 2.06, 8.19, 33.93, 2.01, 1.44, 1.47, 0.9, 0.94, 4.02, 0.96, 1.93, 1.09, 1.17, 0.44, 2.56, 0.99, 6.39]} \ No newline at end of file diff --git a/annotations_filtered/hiq_FE5dmWI_filtered.json b/annotations_filtered/hiq_FE5dmWI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd9f5e13667734b35205aedffff2196fb75de0ed --- /dev/null +++ b/annotations_filtered/hiq_FE5dmWI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 78.07], [81.0, 81.46], [83.0, 83.15], [85.0, 84.79]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [30.07, 0.46, 0.15, -0.21]} \ No newline at end of file diff --git a/annotations_filtered/hjhBzRH-plo_filtered.json b/annotations_filtered/hjhBzRH-plo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1406b20e0476b73406b0e3b883202235c5379de --- /dev/null +++ b/annotations_filtered/hjhBzRH-plo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.19], [12.0, 13.31], [15.0, 15.08], [15.0, 15.67], [17.0, 18.39], [19.0, 22.98], [27.0, 27.23], [42.0, 42.01], [45.0, 45.47], [51.0, 53.86], [54.0, 54.7], [56.0, 56.76], [58.0, 58.85], [60.0, 60.29], [63.0, 64.0], [70.0, 72.42], [74.0, 74.34], [76.0, 75.59], [80.0, 81.08], [83.0, 83.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 61.67, 0.0, 0.0, 0.0, 35.62, 0.0, 0.0, 0.0, 0.0, 0.0, 33.38, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["boing", 44.36], ["animal", 19.35], ["grunt", 7.32]], null, null, null, null, null, [["wail, moan", 9.35], ["groan", 6.78], ["honk", 6.53]], null, null, null, null], "duration": [0.19, 1.31, 0.08, 0.67, 1.39, 3.98, 0.23, 0.01, 0.47, 2.86, 0.7, 0.76, 0.85, 0.29, 1.0, 2.42, 0.34, -0.41, 1.08, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/hjuYfeA2prM_filtered.json b/annotations_filtered/hjuYfeA2prM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41eba648742f20b055a982140e46f1287cd0d44f --- /dev/null +++ b/annotations_filtered/hjuYfeA2prM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.79], [7.0, 7.48], [15.0, 15.26], [21.0, 21.73], [23.0, 23.92], [30.0, 31.01], [44.0, 44.44], [46.0, 46.23], [49.0, 49.17], [56.0, 56.49], [58.0, 58.58], [61.0, 61.11], [65.0, 65.62], [70.0, 71.1], [73.0, 72.82], [75.0, 75.1], [79.0, 80.96], [81.0, 82.21], [83.0, 83.42], [88.0, 88.4], [95.0, 96.99], [98.0, 98.46], [101.0, 102.42], [103.0, 104.26], [106.0, 106.14], [108.0, 109.36], [111.0, 111.81], [112.0, 112.82], [113.0, 113.7], [115.0, 116.18], [118.0, 118.12], [121.0, 122.0], [124.0, 124.9], [127.0, 127.62], [128.0, 129.05], [130.0, 131.63], [132.0, 133.17], [137.0, 140.78], [141.0, 141.69], [144.0, 144.61], [146.0, 146.45], [148.0, 148.95], [150.0, 150.62], [151.0, 151.9], [152.0, 154.25], [158.0, 160.44], [161.0, 161.92], [163.0, 163.54], [166.0, 167.53], [168.0, 169.21], [169.0, 171.96], [173.0, 172.79], [173.0, 173.69], [176.0, 176.47], [178.0, 178.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.37, 45.18, 0.0, 0.0, 0.0, 0.0, 73.67, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 20.65], ["moo", 18.41], ["livestock, farm animals, working animals", 15.55]], [["stomach rumble", 73.33], ["hum", 5.94], ["throbbing", 4.1]], null, null, null, null, null, null, null, null, null], "duration": [1.79, 0.48, 0.26, 0.73, 0.92, 1.01, 0.44, 0.23, 0.17, 0.49, 0.58, 0.11, 0.62, 1.1, -0.18, 0.1, 1.96, 1.21, 0.42, 0.4, 1.99, 0.46, 1.42, 1.26, 0.14, 1.36, 0.81, 0.82, 0.7, 1.18, 0.12, 1.0, 0.9, 0.62, 1.05, 1.63, 1.17, 3.78, 0.69, 0.61, 0.45, 0.95, 0.62, 0.9, 2.25, 2.44, 0.92, 0.54, 1.53, 1.21, 2.96, -0.21, 0.69, 0.47, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/hjuvr5uGA4s_filtered.json b/annotations_filtered/hjuvr5uGA4s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f38dd0034648164fa9aab52214585dd606147ba --- /dev/null +++ b/annotations_filtered/hjuvr5uGA4s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.79], [5.0, 5.85], [6.0, 8.38], [9.0, 9.61], [10.0, 10.77], [11.0, 12.29], [13.0, 15.42], [16.0, 16.93], [17.0, 18.44], [19.0, 19.7], [21.0, 21.51], [22.0, 22.76], [29.0, 29.17], [31.0, 31.35], [35.0, 36.48], [37.0, 37.59], [39.0, 40.37], [41.0, 42.01], [42.0, 43.11], [44.0, 44.25], [47.0, 47.28], [49.0, 49.71], [51.0, 51.51], [52.0, 52.83], [55.0, 55.59], [56.0, 56.74], [57.0, 58.35], [59.0, 59.66], [62.0, 61.72], [62.0, 62.36], [63.0, 66.75], [68.0, 68.34], [70.0, 70.38], [72.0, 85.41], [86.0, 87.15], [88.0, 88.45], [91.0, 99.13], [100.0, 101.61], [102.0, 104.13], [105.0, 105.97], [110.0, 110.69], [126.0, 126.67], [129.0, 128.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 76.37, 0.0, 0.0, 0.0, 79.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.58, 0.0, 0.0, 34.98, 0.0, 0.0, 99.97, 0.0, 99.88, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.78], ["dial tone", 21.87], ["sidetone", 15.0]], null, null, [["animal", 26.66], ["cattle, bovinae", 8.6], ["dog", 7.09]], null, null, null, null, null, null, null, null, null], "duration": [-0.21, 0.85, 2.38, 0.61, 0.77, 1.29, 2.42, 0.93, 1.44, 0.7, 0.51, 0.76, 0.17, 0.35, 1.48, 0.59, 1.37, 1.01, 1.11, 0.25, 0.28, 0.71, 0.51, 0.83, 0.59, 0.74, 1.35, 0.66, -0.28, 0.36, 3.75, 0.34, 0.38, 13.41, 1.15, 0.45, 8.13, 1.61, 2.13, 0.97, 0.69, 0.67, -0.02]} \ No newline at end of file diff --git a/annotations_filtered/hjyWtmbAyco_filtered.json b/annotations_filtered/hjyWtmbAyco_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19ad8c7eb63cd565d88286e708745835efe4763b --- /dev/null +++ b/annotations_filtered/hjyWtmbAyco_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.89], [6.0, 7.05], [10.0, 11.23], [12.0, 13.24], [14.0, 15.99], [17.0, 18.35], [20.0, 24.46], [27.0, 28.71], [30.0, 34.48], [35.0, 41.5], [43.0, 44.17], [45.0, 48.14], [50.0, 50.8], [54.0, 55.04], [59.0, 64.25], [68.0, 67.73], [69.0, 70.12], [71.0, 73.06], [82.0, 82.51], [85.0, 86.8], [88.0, 88.62], [95.0, 96.16], [97.0, 100.77], [104.0, 104.48], [105.0, 106.39], [115.0, 115.59], [120.0, 126.66], [140.0, 147.87]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.95, 0.0, 44.87, 39.54, 0.0, 46.4, 0.0, 0.0, 46.22, 0.0, 0.0, 40.12, 0.0, 0.0, 0.0, 0.0, 46.05, 0.0, 0.0, 0.0, 33.28, 32.66], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 47.53], ["speech", 22.73], ["bass guitar", 2.24]], null, [["music", 35.66], ["hum", 11.73], ["mains hum", 10.32]], [["music", 51.08], ["speech", 10.51], ["didgeridoo", 5.88]], null, [["mains hum", 42.71], ["hum", 33.65], ["throbbing", 5.72]], null, null, [["music", 71.41], ["didgeridoo", 4.03], ["hum", 3.0]], null, null, [["music", 30.33], ["hum", 13.23], ["throbbing", 11.69]], null, null, null, null, [["music", 40.87], ["hum", 10.22], ["throbbing", 9.74]], null, null, null, [["music", 31.04], ["speech", 23.39], ["boing", 9.39]], [["music", 27.77], ["throbbing", 23.08], ["hum", 17.82]]], "duration": [-0.11, 1.05, 1.23, 1.24, 1.99, 1.35, 4.46, 1.71, 4.48, 6.5, 1.17, 3.14, 0.8, 1.04, 5.25, -0.27, 1.12, 2.06, 0.51, 1.8, 0.62, 1.16, 3.77, 0.48, 1.39, 0.59, 6.66, 7.87]} \ No newline at end of file diff --git a/annotations_filtered/hk6Vxhx28bo_filtered.json b/annotations_filtered/hk6Vxhx28bo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3355c86a859ce2f85370a52d6fdf610fae108d8c --- /dev/null +++ b/annotations_filtered/hk6Vxhx28bo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.27], [14.0, 15.01], [16.0, 19.75], [29.0, 29.62], [33.0, 33.74], [38.0, 53.13], [57.0, 64.23], [66.0, 67.63], [76.0, 88.3], [93.0, 115.37], [119.0, 123.94]], "keep_status": [false, false, true, false, false, true, false, false, false, true, true], "silence_prob": [33.49, 0.0, 32.33, 0.0, 0.0, 31.1, 31.57, 0.0, 31.55, 30.6, 30.81], "audiomae_on_audioset": [[["music", 71.83], ["speech", 9.92], ["moo", 2.17]], null, [["music", 30.87], ["sidetone", 19.15], ["speech", 17.8]], null, null, [["music", 32.83], ["speech", 10.37], ["moo", 6.29]], [["music", 59.16], ["speech", 7.99], ["boing", 5.0]], null, [["music", 71.34], ["boing", 2.36], ["speech", 1.73]], [["music", 53.11], ["moo", 5.98], ["fly, housefly", 5.72]], [["music", 40.56], ["crowd", 19.07], ["speech", 4.86]]], "duration": [2.27, 1.01, 3.75, 0.62, 0.74, 15.13, 7.23, 1.63, 12.3, 22.37, 4.94]} \ No newline at end of file diff --git a/annotations_filtered/hkEXnpQ_c5I_filtered.json b/annotations_filtered/hkEXnpQ_c5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edc72c07cfe57781981dadbaeb997734a7a27843 --- /dev/null +++ b/annotations_filtered/hkEXnpQ_c5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.81], [12.0, 13.04], [28.0, 40.51], [47.0, 90.22], [94.0, 97.28], [102.0, 102.42], [104.0, 104.7], [107.0, 106.98], [107.0, 113.05], [114.0, 115.55], [122.0, 122.5], [124.0, 124.78], [128.0, 130.4], [131.0, 133.02], [138.0, 138.1]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [52.27, 0.0, 30.67, 0.0, 37.27, 0.0, 0.0, 0.0, 59.96, 0.0, 0.0, 0.0, 78.55, 59.42, 0.0], "audiomae_on_audioset": [null, null, [["throbbing", 42.8], ["hum", 27.6], ["music", 17.17]], null, [["moo", 20.99], ["music", 17.45], ["cattle, bovinae", 15.9]], null, null, null, null, null, null, null, null, null, null], "duration": [2.81, 1.04, 12.51, 43.22, 3.28, 0.42, 0.7, -0.02, 6.05, 1.55, 0.5, 0.78, 2.4, 2.02, 0.1]} \ No newline at end of file diff --git a/annotations_filtered/hkFSMV93VeA_filtered.json b/annotations_filtered/hkFSMV93VeA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01759a490c04379bb5b987e2b78fd9697b887da5 --- /dev/null +++ b/annotations_filtered/hkFSMV93VeA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.15], [7.0, 9.17], [14.0, 15.72], [17.0, 17.14], [18.0, 19.43], [20.0, 21.12], [27.0, 50.19], [54.0, 58.29], [61.0, 61.57], [62.0, 61.74], [62.0, 71.63], [78.0, 81.9], [82.0, 114.05], [120.0, 121.46], [123.0, 124.28], [127.0, 129.36], [140.0, 140.68]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 39.89, 33.44, 0.0, 0.0, 39.14, 32.2, 0.0, 0.0, 0.0, 40.7, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 54.27], ["livestock, farm animals, working animals", 8.21], ["cattle, bovinae", 5.34]], [["music", 25.77], ["speech", 22.26], ["explosion", 4.07]], null, null, [["cattle, bovinae", 40.96], ["livestock, farm animals, working animals", 36.45], ["moo", 21.06]], [["music", 43.23], ["synthesizer", 8.21], ["musical instrument", 5.19]], null, null, null, [["sidetone", 47.36], ["speech", 6.66], ["moo", 6.09]], null], "duration": [0.15, 2.17, 1.72, 0.14, 1.43, 1.12, 23.19, 4.29, 0.57, -0.26, 9.63, 3.9, 32.05, 1.46, 1.28, 2.36, 0.68]} \ No newline at end of file diff --git a/annotations_filtered/hktlkG0QuKY_filtered.json b/annotations_filtered/hktlkG0QuKY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a512e3fad5fe530b9cc69a83da2c1acf6ae14182 --- /dev/null +++ b/annotations_filtered/hktlkG0QuKY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 25.71], [29.0, 42.75], [45.0, 51.54], [54.0, 61.74], [64.0, 75.74], [77.0, 77.92], [83.0, 84.21], [85.0, 85.68], [90.0, 91.64], [93.0, 94.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.66, 31.2, 31.99, 41.76, 38.97, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 74.83], ["throbbing", 7.52], ["hum", 4.07]], [["music", 61.98], ["speech", 14.5], ["didgeridoo", 7.3]], [["speech", 58.02], ["music", 20.88], ["hum", 4.5]], [["fly, housefly", 38.63], ["bee, wasp, etc.", 20.81], ["insect", 19.16]], [["music", 50.09], ["hum", 20.9], ["throbbing", 5.5]], null, null, null, null, null], "duration": [2.71, 13.75, 6.54, 7.74, 11.74, 0.92, 1.21, 0.68, 1.64, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/hl1z_vp3kXg_filtered.json b/annotations_filtered/hl1z_vp3kXg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4665ce593e12741b239830311168566ccf4cd36 --- /dev/null +++ b/annotations_filtered/hl1z_vp3kXg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.66], [9.0, 9.85], [23.0, 37.32], [45.0, 46.67], [48.0, 48.37], [53.0, 54.57], [62.0, 61.77], [74.0, 76.4], [79.0, 99.18]], "keep_status": [false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.24, 0.0, 0.0, 0.0, 0.0, 92.8, 32.54], "audiomae_on_audioset": [null, null, [["music", 21.88], ["livestock, farm animals, working animals", 14.01], ["cattle, bovinae", 11.97]], null, null, null, null, null, [["music", 47.35], ["didgeridoo", 17.23], ["theremin", 14.69]]], "duration": [1.66, 0.85, 14.32, 1.67, 0.37, 1.57, -0.23, 2.4, 20.18]} \ No newline at end of file diff --git a/annotations_filtered/hl31RQCC_Bc_filtered.json b/annotations_filtered/hl31RQCC_Bc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c74c07ea9953852da0d63d146bf6579c0dad9b2 --- /dev/null +++ b/annotations_filtered/hl31RQCC_Bc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.71], [19.0, 20.11], [20.0, 22.84], [24.0, 26.45], [28.0, 41.28], [42.0, 58.95], [60.0, 60.71], [62.0, 63.02], [65.0, 66.24], [69.0, 69.21], [71.0, 71.51], [72.0, 73.01], [74.0, 74.58], [76.0, 76.47], [78.0, 93.68], [97.0, 101.29], [108.0, 108.84], [110.0, 110.49], [111.0, 111.52], [116.0, 117.41], [118.0, 119.48], [120.0, 122.81], [124.0, 124.55], [126.0, 126.5], [131.0, 130.91], [135.0, 135.73], [138.0, 138.27], [141.0, 141.94], [145.0, 145.57], [147.0, 149.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.78, 99.87, 70.16, 78.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.76, 99.84, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.71, 1.11, 2.84, 2.45, 13.28, 16.95, 0.71, 1.02, 1.24, 0.21, 0.51, 1.01, 0.58, 0.47, 15.68, 4.29, 0.84, 0.49, 0.52, 1.41, 1.48, 2.81, 0.55, 0.5, -0.09, 0.73, 0.27, 0.94, 0.57, 2.59]} \ No newline at end of file diff --git a/annotations_filtered/hl8e9i6YiA8_filtered.json b/annotations_filtered/hl8e9i6YiA8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3202c9f6b2e33168e8354f714b1ded816baede6a --- /dev/null +++ b/annotations_filtered/hl8e9i6YiA8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 18.99], [20.0, 22.18], [25.0, 34.25], [38.0, 55.75], [57.0, 64.5], [66.0, 106.68], [108.0, 109.95], [110.0, 114.24], [115.0, 116.34], [117.0, 118.0], [119.0, 120.29]], "keep_status": [false, true, false, false, true, false, false, true, false, false, false], "silence_prob": [31.28, 29.33, 29.37, 31.7, 29.52, 0.0, 0.0, 42.74, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 63.09], ["speech", 4.76], ["musical instrument", 3.02]], [["music", 49.15], ["speech", 13.96], ["cacophony", 6.72]], [["music", 52.82], ["speech", 14.55], ["hum", 4.59]], [["music", 46.86], ["speech", 33.3], ["musical instrument", 1.68]], [["music", 28.53], ["speech", 20.12], ["whack, thwack", 11.22]], null, null, [["hum", 25.85], ["music", 24.64], ["throbbing", 12.13]], null, null, null], "duration": [12.99, 2.18, 9.25, 17.75, 7.5, 40.68, 1.95, 4.24, 1.34, 1.0, 1.29]} \ No newline at end of file diff --git a/annotations_filtered/hlKMLkrSrDo_filtered.json b/annotations_filtered/hlKMLkrSrDo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1408029ec37dcb2d2257499dac8703938351e2df --- /dev/null +++ b/annotations_filtered/hlKMLkrSrDo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.18], [4.0, 4.82], [7.0, 7.7], [11.0, 12.02], [13.0, 14.77], [16.0, 17.98], [19.0, 20.55], [24.0, 25.56], [27.0, 27.73], [32.0, 32.24], [34.0, 34.55], [36.0, 38.38], [39.0, 39.46], [40.0, 41.57], [44.0, 45.01], [52.0, 56.29], [58.0, 59.46], [60.0, 60.78], [62.0, 62.36], [62.0, 64.0], [65.0, 65.03], [71.0, 72.03], [73.0, 73.04], [75.0, 75.88], [77.0, 77.85], [80.0, 80.72], [82.0, 83.0], [84.0, 85.4], [87.0, 87.79], [89.0, 89.56], [92.0, 92.96], [94.0, 95.45], [96.0, 97.87], [99.0, 99.66], [106.0, 106.84], [108.0, 108.8], [110.0, 114.34], [116.0, 117.27], [120.0, 126.84], [127.0, 128.73], [131.0, 131.65], [136.0, 136.85], [145.0, 145.86], [152.0, 152.41], [157.0, 158.06], [158.0, 159.02], [165.0, 171.24], [172.0, 172.79], [175.0, 175.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.84, 0.0, 0.0, 0.0, 98.66, 0.0, 0.0, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.77, 0.0, 76.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.2, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["throbbing", 39.89], ["music", 39.0], ["hum", 6.56]], null, null], "duration": [1.18, 0.82, 0.7, 1.02, 1.77, 1.98, 1.55, 1.56, 0.73, 0.24, 0.55, 2.38, 0.46, 1.57, 1.01, 4.29, 1.46, 0.78, 0.36, 2.0, 0.03, 1.03, 0.04, 0.88, 0.85, 0.72, 1.0, 1.4, 0.79, 0.56, 0.96, 1.45, 1.87, 0.66, 0.84, 0.8, 4.34, 1.27, 6.84, 1.73, 0.65, 0.85, 0.86, 0.41, 1.06, 1.02, 6.24, 0.79, 0.86]} \ No newline at end of file diff --git a/annotations_filtered/hlNvdfv76WA_filtered.json b/annotations_filtered/hlNvdfv76WA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..113443b7b2aefa71e1b22e13cba40989c17dd70c --- /dev/null +++ b/annotations_filtered/hlNvdfv76WA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[58.0, 58.46], [58.0, 65.6], [67.0, 90.69], [91.0, 98.14], [101.0, 111.97], [113.0, 124.98], [128.0, 138.1], [139.0, 143.85], [147.0, 151.07], [154.0, 154.85], [160.0, 163.73], [170.0, 177.15], [179.0, 179.58], [181.0, 188.3]], "keep_status": [false, true, false, false, true, false, true, false, true, false, false, true, false, true], "silence_prob": [0.0, 33.72, 33.26, 62.47, 38.12, 31.88, 47.62, 45.18, 46.94, 0.0, 77.03, 35.74, 0.0, 38.1], "audiomae_on_audioset": [null, [["music", 60.57], ["musical instrument", 3.88], ["whale vocalization", 3.51]], [["music", 47.13], ["theremin", 30.14], ["wind instrument, woodwind instrument", 6.2]], null, [["speech", 33.37], ["music", 23.52], ["whip", 5.12]], [["music", 40.06], ["theremin", 20.72], ["whale vocalization", 11.54]], [["buzz", 24.79], ["music", 15.39], ["bee, wasp, etc.", 6.06]], [["fly, housefly", 43.94], ["insect", 37.43], ["bee, wasp, etc.", 11.79]], [["fly, housefly", 33.83], ["insect", 14.08], ["music", 12.53]], null, null, [["music", 49.08], ["speech", 6.88], ["livestock, farm animals, working animals", 4.8]], null, [["music", 46.8], ["hum", 11.55], ["throbbing", 6.76]]], "duration": [0.46, 7.6, 23.69, 7.14, 10.97, 11.98, 10.1, 4.85, 4.07, 0.85, 3.73, 7.15, 0.58, 7.3]} \ No newline at end of file diff --git a/annotations_filtered/hlWL5Az4pow_filtered.json b/annotations_filtered/hlWL5Az4pow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76bbcbc2113417d8f05ddb1b710ecfbd2bd68c63 --- /dev/null +++ b/annotations_filtered/hlWL5Az4pow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.12], [9.0, 14.22], [16.0, 23.31], [27.0, 30.94], [34.0, 35.5], [38.0, 38.3], [40.0, 43.01], [57.0, 58.63], [61.0, 67.27], [72.0, 72.55], [74.0, 73.99], [83.0, 83.69], [89.0, 99.32], [102.0, 103.65], [105.0, 106.81], [108.0, 110.27], [125.0, 126.93], [129.0, 133.79], [136.0, 136.65], [175.0, 175.59], [178.0, 183.34], [185.0, 195.3], [198.0, 199.62]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false], "silence_prob": [98.01, 53.91, 40.29, 33.31, 0.0, 0.0, 34.6, 0.0, 33.3, 0.0, 0.0, 0.0, 33.23, 0.0, 0.0, 36.82, 0.0, 34.89, 0.0, 0.0, 33.02, 33.26, 0.0], "audiomae_on_audioset": [null, null, [["music", 26.27], ["speech", 24.59], ["fly, housefly", 7.96]], [["music", 77.08], ["throbbing", 3.55], ["cacophony", 2.18]], null, null, [["music", 83.62], ["musical instrument", 1.91], ["guitar", 1.5]], null, [["music", 72.31], ["didgeridoo", 2.96], ["funny music", 1.83]], null, null, null, [["music", 42.78], ["livestock, farm animals, working animals", 7.34], ["speech", 7.25]], null, null, [["music", 68.83], ["video game music", 3.06], ["throbbing", 2.8]], null, [["music", 78.65], ["reggae", 2.54], ["electronic music", 1.33]], null, null, [["music", 71.09], ["throbbing", 8.48], ["hum", 3.32]], [["music", 40.68], ["animal", 6.72], ["speech", 5.22]], null], "duration": [2.12, 5.22, 7.31, 3.94, 1.5, 0.3, 3.01, 1.63, 6.27, 0.55, -0.01, 0.69, 10.32, 1.65, 1.81, 2.27, 1.93, 4.79, 0.65, 0.59, 5.34, 10.3, 1.62]} \ No newline at end of file diff --git a/annotations_filtered/hlx-FULnwJs_filtered.json b/annotations_filtered/hlx-FULnwJs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f6fec46e1a81f83cae49ffce322c3581c300980 --- /dev/null +++ b/annotations_filtered/hlx-FULnwJs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.38], [5.0, 5.48], [8.0, 25.84], [27.0, 31.4], [35.0, 53.45], [57.0, 61.59], [65.0, 65.87], [72.0, 83.71], [85.0, 88.48], [90.0, 91.23], [93.0, 96.6], [100.0, 101.11], [103.0, 103.47], [105.0, 105.48]], "keep_status": [false, false, false, true, false, true, false, true, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 31.92, 34.01, 31.54, 33.61, 0.0, 35.99, 38.5, 0.0, 36.09, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 59.53], ["throbbing", 25.65], ["hum", 5.93]], [["music", 32.41], ["speech", 16.16], ["didgeridoo", 13.58]], [["music", 39.18], ["throbbing", 20.59], ["hum", 10.81]], [["hum", 22.3], ["music", 21.13], ["throbbing", 20.42]], null, [["music", 22.48], ["speech", 7.79], ["hum", 7.79]], [["music", 48.79], ["speech", 5.87], ["didgeridoo", 3.83]], null, [["music", 37.98], ["speech", 16.4], ["boing", 10.9]], null, null, null], "duration": [0.38, 0.48, 17.84, 4.4, 18.45, 4.59, 0.87, 11.71, 3.48, 1.23, 3.6, 1.11, 0.47, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/hlzm7-gvTRg_filtered.json b/annotations_filtered/hlzm7-gvTRg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea0e38b041913d6845235dcadb31a140a94fcdc3 --- /dev/null +++ b/annotations_filtered/hlzm7-gvTRg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.65], [5.0, 5.88], [7.0, 8.09], [12.0, 13.8], [25.0, 27.01], [28.0, 29.37], [31.0, 31.13], [36.0, 48.41], [52.0, 53.49], [54.0, 55.26], [56.0, 56.81], [59.0, 60.81], [65.0, 67.31], [73.0, 72.69], [74.0, 74.12], [75.0, 75.24], [77.0, 78.53], [86.0, 86.34], [87.0, 89.28], [90.0, 91.0], [95.0, 95.4], [96.0, 97.28], [98.0, 98.78], [99.0, 100.11], [104.0, 107.27], [113.0, 114.4], [115.0, 121.47], [123.0, 123.23], [124.0, 123.77], [124.0, 133.76], [134.0, 134.92], [135.0, 135.8], [138.0, 138.54], [140.0, 141.03], [142.0, 143.31], [146.0, 146.79], [154.0, 155.12], [156.0, 155.83], [157.0, 157.86], [160.0, 160.84], [165.0, 171.34], [174.0, 177.72], [180.0, 184.28], [186.0, 189.08], [190.0, 192.94], [195.0, 197.67], [200.0, 207.32], [209.0, 210.19], [211.0, 211.76], [215.0, 215.69], [216.0, 219.0], [222.0, 223.74], [226.0, 227.94], [229.0, 230.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.93, 0.0, 0.0, 88.46, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.53, 0.0, 100.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 96.77, 100.0, 47.39, 99.99, 100.0, 94.37, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 13.87], ["noise", 11.62], ["music", 11.61]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 72.34], ["busy signal", 3.9], ["telephone", 3.57]], null, null, null, null, null, null, null, null, null, null], "duration": [0.65, 0.88, 1.09, 1.8, 2.01, 1.37, 0.13, 12.41, 1.49, 1.26, 0.81, 1.81, 2.31, -0.31, 0.12, 0.24, 1.53, 0.34, 2.28, 1.0, 0.4, 1.28, 0.78, 1.11, 3.27, 1.4, 6.47, 0.23, -0.23, 9.76, 0.92, 0.8, 0.54, 1.03, 1.31, 0.79, 1.12, -0.17, 0.86, 0.84, 6.34, 3.72, 4.28, 3.08, 2.94, 2.67, 7.32, 1.19, 0.76, 0.69, 3.0, 1.74, 1.94, 1.72]} \ No newline at end of file diff --git a/annotations_filtered/hm9ZzMSoPB4_filtered.json b/annotations_filtered/hm9ZzMSoPB4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e6fb49cbd538e043639a954eb88673a0cd33b38 --- /dev/null +++ b/annotations_filtered/hm9ZzMSoPB4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.16], [11.0, 16.87], [20.0, 20.04], [21.0, 23.25], [25.0, 26.05], [26.0, 28.58], [29.0, 29.57], [32.0, 44.64], [46.0, 46.55], [49.0, 52.2], [54.0, 54.99], [56.0, 57.35], [59.0, 63.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.8, 0.0, 49.31, 0.0, 50.02, 0.0, 55.89, 0.0, 63.64, 0.0, 0.0, 95.09], "audiomae_on_audioset": [null, [["thunk", 43.96], ["music", 27.87], ["speech", 12.83]], null, [["music", 51.37], ["speech", 15.32], ["foghorn", 11.1]], null, null, null, null, null, null, null, null, null], "duration": [1.16, 5.87, 0.04, 2.25, 1.05, 2.58, 0.57, 12.64, 0.55, 3.2, 0.99, 1.35, 4.71]} \ No newline at end of file diff --git a/annotations_filtered/hmF_IO6Aiag_filtered.json b/annotations_filtered/hmF_IO6Aiag_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65561b4d27a7cdf762f01e3e0bf65bdeb081a2a0 --- /dev/null +++ b/annotations_filtered/hmF_IO6Aiag_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 75.73], [78.0, 78.65], [81.0, 83.4], [89.0, 89.46]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 76.53, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [72.73, 0.65, 2.4, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/hmYIR6v-oVE_filtered.json b/annotations_filtered/hmYIR6v-oVE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26acfb271e311558d9d4f34f5d1f0c1ef387608a --- /dev/null +++ b/annotations_filtered/hmYIR6v-oVE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.4], [5.0, 6.2], [7.0, 8.56], [12.0, 12.11], [13.0, 12.9], [14.0, 14.45], [16.0, 16.65], [19.0, 19.57], [21.0, 21.3], [23.0, 23.62], [25.0, 26.35], [29.0, 29.96], [31.0, 32.97], [34.0, 35.56], [37.0, 38.13], [39.0, 39.23], [41.0, 41.4], [42.0, 45.69], [49.0, 50.33], [62.0, 62.5], [69.0, 94.76], [96.0, 98.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 37.66, 99.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 58.34], ["mains hum", 17.61], ["speech", 5.23]], null], "duration": [1.4, 1.2, 1.56, 0.11, -0.1, 0.45, 0.65, 0.57, 0.3, 0.62, 1.35, 0.96, 1.97, 1.56, 1.13, 0.23, 0.4, 3.69, 1.33, 0.5, 25.76, 2.12]} \ No newline at end of file diff --git a/annotations_filtered/hn09SKCZgtI_filtered.json b/annotations_filtered/hn09SKCZgtI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e42af96019c0c4561a537652fe6c7cd3a4d9490 --- /dev/null +++ b/annotations_filtered/hn09SKCZgtI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 3.06], [5.0, 6.3], [8.0, 12.73], [15.0, 20.12], [21.0, 22.6], [26.0, 50.8]], "keep_status": [false, false, true, false, false, false], "silence_prob": [49.22, 0.0, 44.87, 46.75, 0.0, 86.45], "audiomae_on_audioset": [[["telephone dialing, dtmf", 67.76], ["dial tone", 6.99], ["hum", 5.58]], null, [["hum", 33.9], ["mains hum", 12.32], ["speech", 7.2]], [["hum", 28.51], ["mains hum", 28.16], ["telephone dialing, dtmf", 18.88]], null, null], "duration": [3.06, 1.3, 4.73, 5.12, 1.6, 24.8]} \ No newline at end of file diff --git a/annotations_filtered/hn3XR4o8M4c_filtered.json b/annotations_filtered/hn3XR4o8M4c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73744fed5d2f6944728e0293f4b4ad3326b528e3 --- /dev/null +++ b/annotations_filtered/hn3XR4o8M4c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.41], [12.0, 12.21], [14.0, 14.4], [17.0, 18.87], [24.0, 28.58], [36.0, 36.8], [38.0, 38.91], [43.0, 45.47], [48.0, 50.92], [52.0, 53.7], [56.0, 57.15], [58.0, 58.53], [59.0, 59.61], [61.0, 61.1], [64.0, 64.84], [65.0, 66.36], [68.0, 68.59], [74.0, 74.39], [77.0, 78.75], [85.0, 93.48], [100.0, 100.5], [103.0, 102.88], [105.0, 132.44], [137.0, 145.15], [145.0, 149.76], [150.0, 150.74], [170.0, 170.83], [172.0, 172.13], [172.0, 176.18]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.31, 0.0, 0.0, 31.81, 62.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.83, 0.0, 0.0, 41.1, 61.97, 41.07, 0.0, 0.0, 0.0, 37.33], "audiomae_on_audioset": [null, null, null, null, [["speech", 38.6], ["music", 34.15], ["hum", 3.72]], null, null, [["speech", 9.58], ["whack, thwack", 8.24], ["squeak", 7.47]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.68], ["music", 27.89], ["whack, thwack", 6.34]], null, null, [["music", 50.21], ["hum", 7.33], ["mains hum", 6.64]], null, [["cattle, bovinae", 23.86], ["music", 18.21], ["livestock, farm animals, working animals", 16.8]], null, null, null, [["music", 37.54], ["speech", 24.96], ["didgeridoo", 9.38]]], "duration": [1.41, 0.21, 0.4, 1.87, 4.58, 0.8, 0.91, 2.47, 2.92, 1.7, 1.15, 0.53, 0.61, 0.1, 0.84, 1.36, 0.59, 0.39, 1.75, 8.48, 0.5, -0.12, 27.44, 8.15, 4.76, 0.74, 0.83, 0.13, 4.18]} \ No newline at end of file diff --git a/annotations_filtered/hnCQCX3AHzY_filtered.json b/annotations_filtered/hnCQCX3AHzY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c62ce1d8ffd323816c957b9dbd3b4b6b65fdd8a8 --- /dev/null +++ b/annotations_filtered/hnCQCX3AHzY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.31], [25.0, 25.49], [32.0, 32.81], [36.0, 36.49], [54.0, 55.41], [64.0, 64.0], [64.0, 72.01], [74.0, 75.39], [76.0, 78.06], [79.0, 80.1], [81.0, 81.5], [84.0, 85.46], [86.0, 86.34], [87.0, 88.5], [89.0, 90.42], [92.0, 92.8], [105.0, 106.79], [108.0, 111.32], [124.0, 124.46], [127.0, 128.8], [144.0, 146.96], [154.0, 155.61], [162.0, 162.03], [167.0, 167.27], [168.0, 168.61], [170.0, 169.86], [177.0, 182.29], [184.0, 184.98], [186.0, 186.09], [193.0, 193.11], [195.0, 195.35], [202.0, 202.91], [207.0, 207.03], [211.0, 217.83]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.36, 0.0, 68.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.16, 0.0, 0.0, 42.15, 0.0, 0.0, 0.0, 0.0, 0.0, 29.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.29], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 53.58], ["electric shaver, electric razor", 7.17], ["hum", 6.36]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 29.41], ["fly, housefly", 27.38], ["insect", 7.4]], null, null, null, null, null, [["speech", 40.26], ["vehicle", 20.63], ["outside, rural or natural", 4.02]], null, null, null, null, null, null, [["fly, housefly", 33.31], ["speech", 9.9], ["insect", 9.86]]], "duration": [0.31, 0.49, 0.81, 0.49, 1.41, 0.0, 8.01, 1.39, 2.06, 1.1, 0.5, 1.46, 0.34, 1.5, 1.42, 0.8, 1.79, 3.32, 0.46, 1.8, 2.96, 1.61, 0.03, 0.27, 0.61, -0.14, 5.29, 0.98, 0.09, 0.11, 0.35, 0.91, 0.03, 6.83]} \ No newline at end of file diff --git a/annotations_filtered/hnNXvk6sLvw_filtered.json b/annotations_filtered/hnNXvk6sLvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a4e9cf98133c759978ccc7aacc4fc767f597ba1 --- /dev/null +++ b/annotations_filtered/hnNXvk6sLvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.34], [10.0, 10.22], [13.0, 13.86], [14.0, 15.57], [18.0, 17.68], [34.0, 34.45], [39.0, 39.51], [42.0, 42.36], [44.0, 46.89], [49.0, 49.92], [51.0, 50.92], [53.0, 53.47], [54.0, 54.58], [59.0, 60.66], [63.0, 64.2], [66.0, 69.84], [71.0, 74.24], [77.0, 77.89], [81.0, 82.05], [89.0, 88.99], [95.0, 96.04], [97.0, 97.83], [110.0, 112.35], [115.0, 114.94], [121.0, 127.09], [130.0, 131.21], [132.0, 156.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [76.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.07, 86.64, 0.0, 0.0, 0.0, 0.0, 0.0, 73.36, 0.0, 52.39, 0.0, 30.04], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 50.5], ["insect", 17.33], ["mosquito", 16.79]]], "duration": [2.34, 0.22, 0.86, 1.57, -0.32, 0.45, 0.51, 0.36, 2.89, 0.92, -0.08, 0.47, 0.58, 1.66, 1.2, 3.84, 3.24, 0.89, 1.05, -0.01, 1.04, 0.83, 2.35, -0.06, 6.09, 1.21, 24.1]} \ No newline at end of file diff --git a/annotations_filtered/hnXqavr1ZMQ_filtered.json b/annotations_filtered/hnXqavr1ZMQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c0f75ad60d8f0b1f432077568a33feec05c35c2 --- /dev/null +++ b/annotations_filtered/hnXqavr1ZMQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.27], [20.0, 20.87], [25.0, 25.42], [36.0, 44.52], [45.0, 44.98], [46.0, 64.44], [85.0, 85.48], [92.0, 96.04], [102.0, 102.79]], "keep_status": [false, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.6, 0.0, 31.3, 0.0, 53.84, 0.0], "audiomae_on_audioset": [null, null, null, [["cattle, bovinae", 27.24], ["moo", 15.05], ["livestock, farm animals, working animals", 13.82]], null, [["speech", 15.48], ["music", 15.24], ["buzzer", 7.99]], null, null, null], "duration": [0.27, 0.87, 0.42, 8.52, -0.02, 18.44, 0.48, 4.04, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/hnfpujruuv4_filtered.json b/annotations_filtered/hnfpujruuv4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a8c650111b378b1c4a2ae0fe744484d85d7b9d3 --- /dev/null +++ b/annotations_filtered/hnfpujruuv4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.04], [9.0, 8.95], [9.0, 9.14], [10.0, 12.18], [13.0, 14.66], [18.0, 18.77], [23.0, 23.68], [30.0, 31.11], [39.0, 39.36], [44.0, 48.88], [51.0, 51.75], [57.0, 58.02], [59.0, 60.1], [63.0, 63.54], [64.0, 65.69], [70.0, 71.79], [73.0, 74.85], [84.0, 84.79], [85.0, 88.21], [89.0, 89.45], [101.0, 101.29], [103.0, 103.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.04, -0.05, 0.14, 2.18, 1.66, 0.77, 0.68, 1.11, 0.36, 4.88, 0.75, 1.02, 1.1, 0.54, 1.69, 1.79, 1.85, 0.79, 3.21, 0.45, 0.29, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/hnsP1etZkr4_filtered.json b/annotations_filtered/hnsP1etZkr4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87596399f9126a5bf8226dca97cbd32eab9a08d9 --- /dev/null +++ b/annotations_filtered/hnsP1etZkr4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.37], [15.0, 82.14], [83.0, 107.28], [109.0, 109.0], [110.0, 110.98], [112.0, 112.78], [114.0, 115.2], [115.0, 116.55], [117.0, 117.75], [119.0, 119.31]], "keep_status": [false, false, true, false, false, false, false, false, false, false], "silence_prob": [56.1, 0.0, 47.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 35.2], ["moo", 18.61], ["livestock, farm animals, working animals", 15.52]], null, null, null, null, null, null, null], "duration": [8.37, 67.14, 24.28, 0.0, 0.98, 0.78, 1.2, 1.55, 0.75, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/hnum8SxuVCQ_filtered.json b/annotations_filtered/hnum8SxuVCQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1abe87dd0c5d29fadb468e5f21bb11673318abd0 --- /dev/null +++ b/annotations_filtered/hnum8SxuVCQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.89], [14.0, 16.65], [18.0, 25.96], [27.0, 30.67], [31.0, 48.32], [50.0, 50.8], [51.0, 51.78], [55.0, 56.57], [58.0, 58.82], [62.0, 64.74], [67.0, 88.6], [97.0, 100.79], [102.0, 108.75], [114.0, 114.15], [117.0, 119.58]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 64.75, 37.35, 43.38, 77.7, 0.0, 0.0, 0.0, 0.0, 67.89, 61.47, 63.53, 66.39, 0.0, 69.2], "audiomae_on_audioset": [null, null, [["hum", 25.01], ["throbbing", 18.91], ["mains hum", 14.14]], [["sidetone", 68.18], ["speech", 20.95], ["hum", 1.84]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 2.65, 7.96, 3.67, 17.32, 0.8, 0.78, 1.57, 0.82, 2.74, 21.6, 3.79, 6.75, 0.15, 2.58]} \ No newline at end of file diff --git a/annotations_filtered/hoKvbJSMShA_filtered.json b/annotations_filtered/hoKvbJSMShA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74e2d9356fa285ca884147114b004e5cfb2d929a --- /dev/null +++ b/annotations_filtered/hoKvbJSMShA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.89], [4.0, 14.05], [14.0, 15.63], [17.0, 17.14], [18.0, 17.86], [20.0, 20.21], [21.0, 22.4], [24.0, 24.54], [27.0, 27.04], [27.0, 29.83], [30.0, 30.43], [31.0, 31.77], [33.0, 35.02], [36.0, 38.06], [39.0, 42.06], [43.0, 44.39], [45.0, 46.65], [48.0, 48.56], [50.0, 50.58], [51.0, 51.29], [52.0, 52.73], [53.0, 53.45], [54.0, 56.51], [58.0, 59.54], [60.0, 62.11], [62.0, 64.18], [65.0, 72.32], [73.0, 74.93], [75.0, 76.0], [78.0, 82.38], [83.0, 83.59], [85.0, 85.58], [86.0, 86.64], [95.0, 96.62], [99.0, 99.59], [102.0, 103.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.27, 0.0, 0.0, 89.36, 74.29, 66.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.98, 0.0, 47.62, 54.36, 33.64, 0.0, 0.0, 51.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["theremin", 29.17], ["music", 27.31], ["speech", 19.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 62.21], ["vehicle", 3.86], ["cattle, bovinae", 3.77]], null, [["vehicle", 20.61], ["whale vocalization", 11.84], ["speech", 6.66]], null, null, null, null, null, null, null, null, null], "duration": [1.89, 10.05, 1.63, 0.14, -0.14, 0.21, 1.4, 0.54, 0.04, 2.83, 0.43, 0.77, 2.02, 2.06, 3.06, 1.39, 1.65, 0.56, 0.58, 0.29, 0.73, 0.45, 2.51, 1.54, 2.11, 2.18, 7.32, 1.93, 1.0, 4.38, 0.59, 0.58, 0.64, 1.62, 0.59, 1.59]} \ No newline at end of file diff --git a/annotations_filtered/hoWEYBSlctc_filtered.json b/annotations_filtered/hoWEYBSlctc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d7a459d4f38f99c2fb34e57cfbf104bf370f98b --- /dev/null +++ b/annotations_filtered/hoWEYBSlctc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 14.23], [15.0, 18.05], [19.0, 20.16], [26.0, 25.83], [28.0, 30.28], [36.0, 36.64], [38.0, 38.79], [41.0, 41.62], [48.0, 48.44], [50.0, 50.79], [52.0, 52.14], [59.0, 58.75], [61.0, 68.5], [69.0, 69.72], [83.0, 83.54], [88.0, 89.77], [92.0, 92.48], [94.0, 94.95], [96.0, 96.5], [98.0, 98.25], [106.0, 106.56], [108.0, 108.03], [114.0, 115.26], [116.0, 116.63], [120.0, 120.63], [125.0, 125.91], [126.0, 127.41], [129.0, 129.56], [134.0, 135.21], [141.0, 141.35], [145.0, 145.99], [148.0, 150.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.73, 49.54, 0.0, 0.0, 42.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.67], "audiomae_on_audioset": [[["music", 77.39], ["speech", 8.26], ["musical instrument", 3.65]], [["telephone dialing, dtmf", 37.13], ["telephone", 17.66], ["speech", 15.71]], null, null, [["music", 46.35], ["speech", 29.71], ["radio", 2.3]], null, null, null, null, null, null, null, [["sidetone", 30.4], ["music", 26.24], ["hum", 9.74]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [10.23, 3.05, 1.16, -0.17, 2.28, 0.64, 0.79, 0.62, 0.44, 0.79, 0.14, -0.25, 7.5, 0.72, 0.54, 1.77, 0.48, 0.95, 0.5, 0.25, 0.56, 0.03, 1.26, 0.63, 0.63, 0.91, 1.41, 0.56, 1.21, 0.35, 0.99, 2.55]} \ No newline at end of file diff --git a/annotations_filtered/hoe24aSvLtw_filtered.json b/annotations_filtered/hoe24aSvLtw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22f65a276191383c6c588a4400955dab08ea52ab --- /dev/null +++ b/annotations_filtered/hoe24aSvLtw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.64], [14.0, 14.44], [15.0, 15.45], [17.0, 17.9], [20.0, 20.73], [30.0, 32.32], [39.0, 38.77], [40.0, 40.07], [41.0, 41.69], [42.0, 43.17], [55.0, 55.71], [60.0, 61.16], [63.0, 63.71], [64.0, 66.5], [68.0, 68.35], [69.0, 69.87], [70.0, 72.96], [73.0, 74.7], [75.0, 75.36], [76.0, 76.55], [82.0, 85.01], [90.0, 90.22], [91.0, 91.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.97, 0.0, 0.0, 0.0, 0.0, 87.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.7, 0.0, 0.0, 73.21, 0.0, 0.0, 0.0, 93.6, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.64, 0.44, 0.45, 0.9, 0.73, 2.32, -0.23, 0.07, 0.69, 1.17, 0.71, 1.16, 0.71, 2.5, 0.35, 0.87, 2.96, 1.7, 0.36, 0.55, 3.01, 0.22, 0.4]} \ No newline at end of file diff --git a/annotations_filtered/hohZbtTAtRA_filtered.json b/annotations_filtered/hohZbtTAtRA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46f84bf981cd92247fccd3e0ecbf7079f4e8c42c --- /dev/null +++ b/annotations_filtered/hohZbtTAtRA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.03], [13.0, 14.4], [15.0, 16.21], [17.0, 17.83], [19.0, 19.2], [21.0, 21.9], [25.0, 26.45], [33.0, 33.32], [35.0, 35.73], [39.0, 40.26], [42.0, 47.29], [49.0, 49.81], [54.0, 56.05], [57.0, 58.82], [60.0, 60.49], [62.0, 62.48], [66.0, 66.36], [68.0, 70.33], [71.0, 72.71], [73.0, 76.13], [77.0, 77.36], [78.0, 79.39], [87.0, 87.49], [88.0, 89.72], [97.0, 98.54], [100.0, 99.99], [100.0, 100.82], [102.0, 102.52], [104.0, 104.55], [106.0, 106.42], [108.0, 109.68], [110.0, 115.15], [116.0, 129.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.29, 0.0, 43.98, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 58.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.72, 72.31], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 46.06], ["speech", 12.21], ["speech synthesizer", 5.74]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.03, 1.4, 1.21, 0.83, 0.2, 0.9, 1.45, 0.32, 0.73, 1.26, 5.29, 0.81, 2.05, 1.82, 0.49, 0.48, 0.36, 2.33, 1.71, 3.13, 0.36, 1.39, 0.49, 1.72, 1.54, -0.01, 0.82, 0.52, 0.55, 0.42, 1.68, 5.15, 13.56]} \ No newline at end of file diff --git a/annotations_filtered/honAzu3xOP0_filtered.json b/annotations_filtered/honAzu3xOP0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2651e170a2e608322230387840bd93a52ab71398 --- /dev/null +++ b/annotations_filtered/honAzu3xOP0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.51], [14.0, 14.82], [17.0, 18.89], [20.0, 21.22], [22.0, 23.21], [27.0, 27.31], [28.0, 28.54], [30.0, 30.21], [31.0, 34.53], [36.0, 36.29], [45.0, 49.99], [61.0, 60.86], [89.0, 91.5], [92.0, 93.78], [102.0, 104.85], [108.0, 116.21], [118.0, 118.49], [124.0, 123.99], [126.0, 126.0], [153.0, 153.79], [165.0, 165.59], [194.0, 194.04]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.22, 0.0, 43.1, 0.0, 33.88, 0.0, 39.52, 45.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 21.38], ["speech", 16.92], ["sidetone", 9.33]], null, [["music", 45.13], ["speech", 15.32], ["sidetone", 5.69]], null, [["speech", 45.37], ["radio", 10.47], ["sidetone", 7.03]], null, [["music", 45.58], ["speech", 14.73], ["sidetone", 5.19]], [["music", 67.55], ["bass guitar", 8.2], ["guitar", 4.7]], null, null, null, null, null, null], "duration": [0.51, 0.82, 1.89, 1.22, 1.21, 0.31, 0.54, 0.21, 3.53, 0.29, 4.99, -0.14, 2.5, 1.78, 2.85, 8.21, 0.49, -0.01, 0.0, 0.79, 0.59, 0.04]} \ No newline at end of file diff --git a/annotations_filtered/hopRenk1oaQ_filtered.json b/annotations_filtered/hopRenk1oaQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36cef90cbb68154110d3a7a1bd6ad53bab56083b --- /dev/null +++ b/annotations_filtered/hopRenk1oaQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.49], [11.0, 24.78], [27.0, 26.6], [29.0, 29.07], [33.0, 39.5], [45.0, 45.25], [46.0, 68.99], [73.0, 73.62]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 89.01, 0.0, 0.0, 35.5, 0.0, 39.17, 0.0], "audiomae_on_audioset": [null, null, null, null, [["hum", 30.96], ["music", 26.79], ["mains hum", 14.6]], null, [["music", 78.87], ["musical instrument", 2.44], ["throbbing", 2.36]], null], "duration": [0.49, 13.78, -0.4, 0.07, 6.5, 0.25, 22.99, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/howhfMAoEt0_filtered.json b/annotations_filtered/howhfMAoEt0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8fda3e6488a353f00c4aa190c896f68e329e0cff --- /dev/null +++ b/annotations_filtered/howhfMAoEt0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.03], [7.0, 24.16], [24.0, 26.91], [28.0, 29.0], [30.0, 31.21], [34.0, 34.53], [35.0, 48.14], [50.0, 62.56], [64.0, 65.31], [65.0, 72.72], [73.0, 73.45], [75.0, 77.9], [81.0, 93.72], [94.0, 95.86], [97.0, 99.12], [101.0, 101.98], [102.0, 103.6], [105.0, 107.86], [108.0, 108.9], [109.0, 111.06], [112.0, 116.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.97, 53.78, 97.54, 0.0, 0.0, 0.0, 100.0, 97.64, 0.0, 99.95, 0.0, 99.78, 80.64, 0.0, 97.11, 0.0, 0.0, 95.51, 0.0, 99.1, 91.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.03, 17.16, 2.91, 1.0, 1.21, 0.53, 13.14, 12.56, 1.31, 7.72, 0.45, 2.9, 12.72, 1.86, 2.12, 0.98, 1.6, 2.86, 0.9, 2.06, 4.36]} \ No newline at end of file diff --git a/annotations_filtered/hp3HX9PAkcA_filtered.json b/annotations_filtered/hp3HX9PAkcA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55544402fd2a2be5c946b03e018f8251a0ca55c5 --- /dev/null +++ b/annotations_filtered/hp3HX9PAkcA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.97], [7.0, 8.87], [9.0, 10.42], [11.0, 12.8], [13.0, 14.17], [14.0, 15.38], [23.0, 25.51], [26.0, 29.08], [29.0, 30.48], [31.0, 32.97], [34.0, 37.86], [44.0, 44.79], [48.0, 48.98], [51.0, 52.62], [54.0, 54.78], [57.0, 59.0], [60.0, 61.33], [64.0, 64.39], [70.0, 71.63], [73.0, 74.22], [79.0, 79.59], [81.0, 81.85], [85.0, 85.72], [87.0, 88.42], [99.0, 99.89], [100.0, 102.78], [111.0, 111.72], [112.0, 113.02], [116.0, 119.2], [121.0, 121.95], [125.0, 126.32], [128.0, 128.63], [130.0, 129.88], [130.0, 131.16], [135.0, 141.34], [143.0, 142.72], [145.0, 145.27], [146.0, 145.54], [146.0, 147.39], [151.0, 151.48], [168.0, 168.4], [169.0, 171.17], [174.0, 176.28], [184.0, 184.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.8, 77.87, 0.0, 0.0, 51.77, 0.0, 0.0, 0.0, 0.0, 99.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.77, 0.0, 0.0, 56.93, 0.0, 0.0, 0.0, 0.0, 0.0, 72.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.17, 52.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.97, 1.87, 1.42, 1.8, 1.17, 1.38, 2.51, 3.08, 1.48, 1.97, 3.86, 0.79, 0.98, 1.62, 0.78, 2.0, 1.33, 0.39, 1.63, 1.22, 0.59, 0.85, 0.72, 1.42, 0.89, 2.78, 0.72, 1.02, 3.2, 0.95, 1.32, 0.63, -0.12, 1.16, 6.34, -0.28, 0.27, -0.46, 1.39, 0.48, 0.4, 2.17, 2.28, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/hp3n_sA4Sqo_filtered.json b/annotations_filtered/hp3n_sA4Sqo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff75e6a8b956e9cb125e7a854dfd2a18fc0ea0c4 --- /dev/null +++ b/annotations_filtered/hp3n_sA4Sqo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 61.53], [68.0, 81.21], [86.0, 88.13], [90.0, 90.41], [92.0, 93.53], [94.0, 94.51], [102.0, 103.32], [106.0, 106.88], [108.0, 108.55], [110.0, 110.03], [112.0, 112.48], [113.0, 116.29], [119.0, 118.89], [119.0, 124.97]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.82, 31.72, 44.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.81, 0.0, 37.17], "audiomae_on_audioset": [[["music", 61.99], ["throbbing", 10.32], ["sampler", 2.88]], [["music", 79.7], ["cacophony", 2.57], ["synthesizer", 2.11]], [["music", 51.21], ["speech", 5.25], ["electronic music", 4.87]], null, null, null, null, null, null, null, null, [["music", 65.05], ["electronic music", 3.96], ["electronica", 3.26]], null, [["music", 61.09], ["speech", 9.1], ["throbbing", 4.17]]], "duration": [23.53, 13.21, 2.13, 0.41, 1.53, 0.51, 1.32, 0.88, 0.55, 0.03, 0.48, 3.29, -0.11, 5.97]} \ No newline at end of file diff --git a/annotations_filtered/hpDjzODXpBQ_filtered.json b/annotations_filtered/hpDjzODXpBQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e62a5c579bf65abe82fb62730bf2bbeffccfde1 --- /dev/null +++ b/annotations_filtered/hpDjzODXpBQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.17], [11.0, 12.41], [14.0, 14.61], [16.0, 16.19], [17.0, 17.09], [20.0, 19.8], [20.0, 21.36], [22.0, 23.33], [27.0, 27.72], [28.0, 29.64], [31.0, 31.78], [33.0, 33.4], [34.0, 37.84], [38.0, 38.45], [41.0, 41.88], [44.0, 44.46], [48.0, 48.29], [49.0, 49.05], [50.0, 50.79], [51.0, 51.11], [51.0, 55.36], [57.0, 71.64], [72.0, 72.08], [77.0, 85.75], [87.0, 94.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.32, 38.68, 0.0, 37.49, 34.34], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 76.6], ["speech", 14.97], ["guitar", 1.39]], null, [["music", 85.67], ["synthetic singing", 2.15], ["rock and roll", 1.17]], [["music", 78.08], ["didgeridoo", 2.68], ["musical instrument", 2.41]]], "duration": [0.17, 1.41, 0.61, 0.19, 0.09, -0.2, 1.36, 1.33, 0.72, 1.64, 0.78, 0.4, 3.84, 0.45, 0.88, 0.46, 0.29, 0.05, 0.79, 0.11, 4.36, 14.64, 0.08, 8.75, 7.66]} \ No newline at end of file diff --git a/annotations_filtered/hpb2-ZOzc_o_filtered.json b/annotations_filtered/hpb2-ZOzc_o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcc21097fb35f192025c4a3e750f62cde3cc9a5a --- /dev/null +++ b/annotations_filtered/hpb2-ZOzc_o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 24.31], [26.0, 73.65], [77.0, 106.89]], "keep_status": [false, false, false], "silence_prob": [81.89, 0.0, 31.32], "audiomae_on_audioset": [null, null, [["music", 39.14], ["whale vocalization", 27.15], ["cacophony", 5.49]]], "duration": [2.31, 47.65, 29.89]} \ No newline at end of file diff --git a/annotations_filtered/hpliHwPiYYU_filtered.json b/annotations_filtered/hpliHwPiYYU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a931ca415ea2813441f566190313e37e56bff460 --- /dev/null +++ b/annotations_filtered/hpliHwPiYYU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.62], [16.0, 17.41], [18.0, 18.86], [20.0, 20.93], [21.0, 23.09], [24.0, 25.14], [27.0, 27.8], [29.0, 29.79], [30.0, 32.24], [36.0, 36.9], [38.0, 39.72], [44.0, 46.03], [47.0, 48.52], [51.0, 53.23], [54.0, 55.63], [58.0, 68.27], [68.0, 69.82], [73.0, 73.95], [79.0, 79.24], [80.0, 82.38], [84.0, 83.78], [85.0, 85.89], [95.0, 96.67], [98.0, 99.62], [107.0, 109.93], [112.0, 113.17], [115.0, 117.64], [118.0, 119.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 89.54, 0.0, 0.0, 98.73, 0.0, 98.36, 0.0, 50.51, 0.0, 0.0, 0.0, 98.1, 0.0, 0.0, 0.0, 0.0, 84.8, 0.0, 76.53, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.62, 1.41, 0.86, 0.93, 2.09, 1.14, 0.8, 0.79, 2.24, 0.9, 1.72, 2.03, 1.52, 2.23, 1.63, 10.27, 1.82, 0.95, 0.24, 2.38, -0.22, 0.89, 1.67, 1.62, 2.93, 1.17, 2.64, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/hplpQt424Ls_filtered.json b/annotations_filtered/hplpQt424Ls_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ded7c58c24743547c28c8ead4b108dd7505c12bd --- /dev/null +++ b/annotations_filtered/hplpQt424Ls_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.17], [9.0, 9.32], [11.0, 11.33], [14.0, 16.02], [17.0, 122.49], [125.0, 170.8]], "keep_status": [false, false, false, true, false, false], "silence_prob": [100.0, 0.0, 0.0, 48.02, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["whale vocalization", 20.43], ["fart", 10.43], ["effects unit", 9.69]], null, null], "duration": [4.17, 0.32, 0.33, 2.02, 105.49, 45.8]} \ No newline at end of file diff --git a/annotations_filtered/hprw4GtCu1w_filtered.json b/annotations_filtered/hprw4GtCu1w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..603244ddec9ac3323c25bee9b4e34aa2a897c7e6 --- /dev/null +++ b/annotations_filtered/hprw4GtCu1w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.49], [11.0, 19.03], [19.0, 19.09], [19.0, 19.47], [19.0, 25.59], [26.0, 26.54], [31.0, 31.18], [35.0, 35.24], [36.0, 36.27], [39.0, 40.12], [43.0, 52.66], [53.0, 53.72], [54.0, 55.04], [56.0, 56.86], [58.0, 58.21], [59.0, 60.93], [61.0, 61.33], [65.0, 65.16], [65.0, 66.55], [68.0, 68.32], [73.0, 74.66], [76.0, 79.49], [80.0, 82.05], [83.0, 83.22], [84.0, 93.63], [97.0, 97.41], [100.0, 103.03], [104.0, 106.17], [107.0, 108.8], [112.0, 113.78], [116.0, 116.67], [119.0, 120.61], [123.0, 125.46], [130.0, 139.58], [142.0, 147.26], [149.0, 153.94], [158.0, 162.7]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [37.67, 32.89, 0.0, 0.0, 33.73, 0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.92, 62.27, 0.0, 37.02, 0.0, 55.67, 98.1, 0.0, 0.0, 0.0, 0.0, 98.51, 42.79, 39.07, 56.86, 36.39], "audiomae_on_audioset": [[["music", 37.8], ["synthesizer", 10.64], ["effects unit", 8.49]], [["music", 51.15], ["didgeridoo", 18.71], ["speech", 12.67]], null, null, [["didgeridoo", 52.26], ["music", 11.12], ["mantra", 8.04]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 25.83], ["speech", 17.17], ["telephone", 13.85]], null, null, [["music", 66.98], ["speech", 6.82], ["timpani", 3.54]], null, null, null, null, null, null, null, null, [["music", 55.16], ["theremin", 25.86], ["singing bowl", 2.89]], [["music", 66.56], ["theremin", 5.96], ["musical instrument", 4.09]], null, [["music", 25.21], ["throbbing", 14.93], ["hum", 14.09]]], "duration": [2.49, 8.03, 0.09, 0.47, 6.59, 0.54, 0.18, 0.24, 0.27, 1.12, 9.66, 0.72, 1.04, 0.86, 0.21, 1.93, 0.33, 0.16, 1.55, 0.32, 1.66, 3.49, 2.05, 0.22, 9.63, 0.41, 3.03, 2.17, 1.8, 1.78, 0.67, 1.61, 2.46, 9.58, 5.26, 4.94, 4.7]} \ No newline at end of file diff --git a/annotations_filtered/hq-vTEalnj0_filtered.json b/annotations_filtered/hq-vTEalnj0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8c0f0a14c445aa0598406524c265723d64a4707 --- /dev/null +++ b/annotations_filtered/hq-vTEalnj0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.17], [3.0, 3.52], [5.0, 6.15], [6.0, 7.74], [12.0, 13.17], [15.0, 18.57], [20.0, 34.33], [35.0, 36.96], [38.0, 41.34], [43.0, 46.4], [49.0, 49.05], [50.0, 50.7], [56.0, 56.52], [58.0, 59.17], [61.0, 61.96], [65.0, 67.54], [68.0, 69.52], [71.0, 71.95], [74.0, 74.78], [76.0, 77.18], [83.0, 86.14], [90.0, 91.74], [95.0, 96.72], [97.0, 101.33], [103.0, 104.11], [107.0, 107.81], [109.0, 112.13], [113.0, 114.71], [117.0, 117.12], [120.0, 121.64], [123.0, 124.01], [126.0, 126.39], [128.0, 128.66], [131.0, 133.66], [134.0, 135.35], [138.0, 140.21], [141.0, 142.18], [143.0, 144.63], [146.0, 149.17], [151.0, 151.88], [154.0, 154.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.99, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 95.64, 0.0, 0.0, 98.93, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 99.96, 0.0, 0.0, 99.98, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.17, 0.52, 1.15, 1.74, 1.17, 3.57, 14.33, 1.96, 3.34, 3.4, 0.05, 0.7, 0.52, 1.17, 0.96, 2.54, 1.52, 0.95, 0.78, 1.18, 3.14, 1.74, 1.72, 4.33, 1.11, 0.81, 3.13, 1.71, 0.12, 1.64, 1.01, 0.39, 0.66, 2.66, 1.35, 2.21, 1.18, 1.63, 3.17, 0.88, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/hq4lKhTXzXQ_filtered.json b/annotations_filtered/hq4lKhTXzXQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..948c005ff8f0aee70b9ba04083b548af59a22a97 --- /dev/null +++ b/annotations_filtered/hq4lKhTXzXQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.74], [11.0, 19.84], [20.0, 20.48], [23.0, 23.48], [25.0, 25.03], [27.0, 43.33], [46.0, 46.72], [52.0, 52.46], [57.0, 57.91], [60.0, 60.03], [61.0, 74.53], [78.0, 85.09], [85.0, 85.14], [87.0, 87.49], [90.0, 98.76]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [31.23, 31.24, 0.0, 0.0, 0.0, 29.07, 0.0, 0.0, 0.0, 0.0, 30.53, 30.65, 0.0, 0.0, 29.9], "audiomae_on_audioset": [[["music", 39.32], ["didgeridoo", 23.37], ["electric shaver, electric razor", 6.98]], [["music", 50.42], ["didgeridoo", 33.23], ["musical instrument", 6.93]], null, null, null, [["music", 34.21], ["noise", 21.54], ["didgeridoo", 7.99]], null, null, null, null, [["throbbing", 55.92], ["hum", 25.01], ["music", 12.0]], [["throbbing", 57.02], ["hum", 37.74], ["mains hum", 2.48]], null, null, [["hum", 33.77], ["throbbing", 17.19], ["speech", 10.4]]], "duration": [4.74, 8.84, 0.48, 0.48, 0.03, 16.33, 0.72, 0.46, 0.91, 0.03, 13.53, 7.09, 0.14, 0.49, 8.76]} \ No newline at end of file diff --git a/annotations_filtered/hqJxDiGXTWc_filtered.json b/annotations_filtered/hqJxDiGXTWc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a2609b98138ed9af79ce2c968b5b1b2fb21ffe38 --- /dev/null +++ b/annotations_filtered/hqJxDiGXTWc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 22.28], [23.0, 24.29], [29.0, 31.01], [33.0, 34.37], [38.0, 41.28], [44.0, 45.76], [50.0, 51.76], [53.0, 55.8], [60.0, 60.84], [62.0, 64.69], [70.0, 72.1], [77.0, 78.07], [81.0, 81.46], [82.0, 83.56], [85.0, 86.43], [87.0, 89.14], [90.0, 123.16], [125.0, 129.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [58.55, 0.0, 44.72, 0.0, 54.9, 0.0, 0.0, 35.28, 0.0, 36.68, 40.24, 0.0, 0.0, 0.0, 0.0, 39.96, 0.0, 66.76], "audiomae_on_audioset": [null, null, [["music", 59.79], ["ambient music", 6.9], ["singing bowl", 3.59]], null, null, null, null, [["music", 33.52], ["gong", 30.51], ["electronic music", 6.62]], null, [["music", 30.99], ["singing bowl", 25.34], ["gong", 15.41]], [["music", 56.72], ["singing bowl", 10.22], ["ambient music", 5.55]], null, null, null, null, [["music", 54.89], ["ambient music", 12.84], ["gong", 6.15]], null, null], "duration": [19.28, 1.29, 2.01, 1.37, 3.28, 1.76, 1.76, 2.8, 0.84, 2.69, 2.1, 1.07, 0.46, 1.56, 1.43, 2.14, 33.16, 4.86]} \ No newline at end of file diff --git a/annotations_filtered/hqqlSTB5CfU_filtered.json b/annotations_filtered/hqqlSTB5CfU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3606ddf89e94962f9b4f4c22c2412db6bdde15ec --- /dev/null +++ b/annotations_filtered/hqqlSTB5CfU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.0], [7.0, 7.52], [9.0, 9.24], [11.0, 11.82], [13.0, 13.51], [14.0, 15.69], [22.0, 23.63], [26.0, 26.27], [28.0, 28.92], [30.0, 30.2], [31.0, 32.24], [33.0, 34.28], [36.0, 36.66], [40.0, 41.47], [42.0, 42.6], [43.0, 44.32], [45.0, 45.37], [46.0, 49.47], [50.0, 51.14], [53.0, 54.03], [57.0, 58.06], [60.0, 62.55], [63.0, 63.69], [65.0, 66.24], [68.0, 69.58], [71.0, 72.13], [72.0, 72.72], [74.0, 74.63], [76.0, 77.16], [78.0, 78.61], [79.0, 80.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.13, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 0.52, 0.24, 0.82, 0.51, 1.69, 1.63, 0.27, 0.92, 0.2, 1.24, 1.28, 0.66, 1.47, 0.6, 1.32, 0.37, 3.47, 1.14, 1.03, 1.06, 2.55, 0.69, 1.24, 1.58, 1.13, 0.72, 0.63, 1.16, 0.61, 1.7]} \ No newline at end of file diff --git a/annotations_filtered/hqslb1FVoQQ_filtered.json b/annotations_filtered/hqslb1FVoQQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d66d3c31b3cf276b167fd02289e792c48bf1ad7 --- /dev/null +++ b/annotations_filtered/hqslb1FVoQQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 21.46], [25.0, 33.44], [37.0, 37.54], [43.0, 46.01], [49.0, 49.22], [58.0, 59.59], [66.0, 66.82], [70.0, 72.39], [82.0, 86.68], [89.0, 92.1], [112.0, 113.17], [114.0, 115.6]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [34.56, 35.2, 0.0, 93.6, 0.0, 0.0, 0.0, 77.2, 39.54, 33.88, 0.0, 0.0], "audiomae_on_audioset": [[["music", 46.06], ["hum", 11.87], ["synthesizer", 10.76]], [["hum", 46.12], ["music", 17.15], ["mains hum", 13.87]], null, null, null, null, null, null, [["speech", 42.78], ["music", 37.77], ["timpani", 2.78]], [["music", 47.61], ["speech", 10.72], ["drum", 2.66]], null, null], "duration": [13.46, 8.44, 0.54, 3.01, 0.22, 1.59, 0.82, 2.39, 4.68, 3.1, 1.17, 1.6]} \ No newline at end of file diff --git a/annotations_filtered/hrZxBMTQO0c_filtered.json b/annotations_filtered/hrZxBMTQO0c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5eda6b0af1dfc0a69f34f67bbfdaaa86de25aa1e --- /dev/null +++ b/annotations_filtered/hrZxBMTQO0c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 42.8], [47.0, 61.3], [65.0, 73.03]], "keep_status": [false, false, true], "silence_prob": [0.0, 31.19, 33.34], "audiomae_on_audioset": [null, [["machine gun", 67.28], ["gunshot, gunfire", 24.17], ["speech", 1.54]], [["music", 34.79], ["speech", 15.8], ["throbbing", 7.5]]], "duration": [32.8, 14.3, 8.03]} \ No newline at end of file diff --git a/annotations_filtered/hrcFkSMZBng_filtered.json b/annotations_filtered/hrcFkSMZBng_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b89b0c99971622064d8951a0fb0039bcabb2655 --- /dev/null +++ b/annotations_filtered/hrcFkSMZBng_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.53], [6.0, 11.92], [13.0, 14.77], [16.0, 17.04], [17.0, 17.42], [18.0, 21.0], [23.0, 24.39], [25.0, 29.67], [33.0, 42.77], [44.0, 44.83], [46.0, 47.33], [52.0, 55.73], [57.0, 59.26], [61.0, 64.02], [68.0, 68.08], [71.0, 75.15], [77.0, 82.51], [85.0, 86.32], [88.0, 88.72], [94.0, 96.82], [99.0, 99.18], [105.0, 117.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 61.57, 0.0, 0.0, 0.0, 77.87, 0.0, 76.7, 60.32, 0.0, 0.0, 96.89, 39.78, 99.78, 0.0, 94.22, 81.53, 0.0, 0.0, 58.81, 0.0, 95.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 61.59], ["breaking", 14.8], ["music", 4.93]], null, null, null, null, null, null, null, null, null], "duration": [1.53, 5.92, 1.77, 1.04, 0.42, 3.0, 1.39, 4.67, 9.77, 0.83, 1.33, 3.73, 2.26, 3.02, 0.08, 4.15, 5.51, 1.32, 0.72, 2.82, 0.18, 12.24]} \ No newline at end of file diff --git a/annotations_filtered/hsBtuhWw7RM_filtered.json b/annotations_filtered/hsBtuhWw7RM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97c29d15210ea29858356197a01e2e362f49e970 --- /dev/null +++ b/annotations_filtered/hsBtuhWw7RM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.6], [23.0, 23.85], [37.0, 39.48], [41.0, 43.34], [47.0, 47.9], [51.0, 52.96], [54.0, 62.29], [66.0, 65.89], [67.0, 66.85], [68.0, 69.13], [70.0, 72.13], [77.0, 78.11], [81.0, 80.91], [82.0, 83.19], [85.0, 85.85], [99.0, 100.53], [105.0, 105.0], [119.0, 119.08], [124.0, 136.29]], "keep_status": [false, false, true, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 36.34, 55.39, 0.0, 0.0, 37.81, 0.0, 0.0, 0.0, 38.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.15], "audiomae_on_audioset": [null, null, [["music", 33.18], ["singing", 4.45], ["meow", 4.17]], null, null, null, [["hum", 23.06], ["mains hum", 16.55], ["music", 11.49]], null, null, null, [["sidetone", 16.56], ["whale vocalization", 16.32], ["music", 12.26]], null, null, null, null, null, null, null, [["music", 38.53], ["synthesizer", 16.25], ["theremin", 7.26]]], "duration": [0.6, 0.85, 2.48, 2.34, 0.9, 1.96, 8.29, -0.11, -0.15, 1.13, 2.13, 1.11, -0.09, 1.19, 0.85, 1.53, 0.0, 0.08, 12.29]} \ No newline at end of file diff --git a/annotations_filtered/hsE1N5mfvmA_filtered.json b/annotations_filtered/hsE1N5mfvmA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a59cda83ae259e957992a27e6532435d9aeb34c8 --- /dev/null +++ b/annotations_filtered/hsE1N5mfvmA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.06], [14.0, 29.98], [31.0, 32.56], [37.0, 52.76], [58.0, 84.91], [87.0, 87.72], [91.0, 94.56], [99.0, 101.98], [102.0, 102.02], [103.0, 108.99], [110.0, 111.96], [115.0, 115.37], [117.0, 118.2], [122.0, 122.69], [123.0, 124.01]], "keep_status": [false, false, false, false, true, false, true, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 92.97, 0.0, 34.82, 39.49, 0.0, 29.73, 30.55, 0.0, 41.54, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 59.77], ["musical instrument", 6.39], ["synthesizer", 5.88]], [["music", 53.93], ["musical instrument", 6.5], ["theremin", 6.19]], null, [["music", 33.65], ["noise", 12.58], ["synthesizer", 4.73]], [["sine wave", 36.66], ["noise", 9.0], ["explosion", 8.67]], null, [["music", 28.05], ["speech", 18.94], ["hum", 11.58]], null, null, null, null, null], "duration": [0.06, 15.98, 1.56, 15.76, 26.91, 0.72, 3.56, 2.98, 0.02, 5.99, 1.96, 0.37, 1.2, 0.69, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/hsIdl6x2Lck_filtered.json b/annotations_filtered/hsIdl6x2Lck_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f24eefc91e8d07e34f89c014b66fb5432d1378d --- /dev/null +++ b/annotations_filtered/hsIdl6x2Lck_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.45], [3.0, 5.56], [6.0, 17.71], [19.0, 28.24], [29.0, 33.44], [34.0, 35.8], [36.0, 39.36], [41.0, 45.67], [47.0, 69.62], [71.0, 71.95], [73.0, 78.7], [81.0, 97.44], [99.0, 99.52], [100.0, 99.55], [100.0, 99.96], [100.0, 99.99], [100.0, 100.33], [100.0, 100.6], [101.0, 103.64], [104.0, 105.87], [106.0, 106.25], [114.0, 117.54], [121.0, 127.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 65.79, 58.3, 71.43, 43.87, 0.0, 75.39, 77.36, 33.33, 0.0, 59.59, 31.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.43, 0.0, 0.0, 32.25, 51.28], "audiomae_on_audioset": [null, null, null, null, [["speech", 64.01], ["sonar", 6.88], ["hum", 3.72]], null, null, null, [["music", 65.85], ["mechanisms", 7.95], ["mains hum", 4.66]], null, null, [["hum", 25.17], ["speech", 18.59], ["music", 17.54]], null, null, null, null, null, null, [["mains hum", 22.92], ["music", 21.28], ["hum", 19.93]], null, null, [["music", 31.29], ["cattle, bovinae", 14.75], ["moo", 14.19]], null], "duration": [0.45, 2.56, 11.71, 9.24, 4.44, 1.8, 3.36, 4.67, 22.62, 0.95, 5.7, 16.44, 0.52, -0.45, -0.04, -0.01, 0.33, 0.6, 2.64, 1.87, 0.25, 3.54, 6.65]} \ No newline at end of file diff --git a/annotations_filtered/hsxRROsF4D0_filtered.json b/annotations_filtered/hsxRROsF4D0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0b1c802d8993941a3538d8c7f6674acb5c44faa --- /dev/null +++ b/annotations_filtered/hsxRROsF4D0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.85], [19.0, 46.52], [49.0, 49.65], [51.0, 54.38], [55.0, 57.16], [60.0, 60.37], [62.0, 63.91], [67.0, 71.51], [72.0, 73.33], [74.0, 76.05], [78.0, 78.12], [80.0, 80.3], [84.0, 84.05], [95.0, 99.22], [100.0, 100.67], [121.0, 121.44], [135.0, 136.09], [137.0, 138.01], [140.0, 139.94], [141.0, 146.15], [149.0, 150.09], [164.0, 165.2], [169.0, 170.31]], "keep_status": [false, false, false, true, true, false, false, true, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 35.69, 0.0, 38.94, 39.11, 0.0, 0.0, 46.5, 0.0, 54.83, 0.0, 0.0, 0.0, 31.31, 0.0, 0.0, 0.0, 0.0, 0.0, 39.18, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 47.15], ["mains hum", 38.68], ["music", 5.58]], null, [["speech", 44.61], ["hum", 6.57], ["radio", 6.48]], [["speech", 27.83], ["hum", 20.76], ["mains hum", 10.55]], null, null, [["mains hum", 18.47], ["speech", 16.79], ["hum", 16.68]], null, null, null, null, null, [["music", 11.71], ["whack, thwack", 7.96], ["hum", 6.77]], null, null, null, null, null, [["fly, housefly", 21.55], ["hum", 16.59], ["mosquito", 11.76]], null, null, null], "duration": [1.85, 27.52, 0.65, 3.38, 2.16, 0.37, 1.91, 4.51, 1.33, 2.05, 0.12, 0.3, 0.05, 4.22, 0.67, 0.44, 1.09, 1.01, -0.06, 5.15, 1.09, 1.2, 1.31]} \ No newline at end of file diff --git a/annotations_filtered/htCHOTJBiSc_filtered.json b/annotations_filtered/htCHOTJBiSc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1f0539035515874bf1cc0481cb8e116a064218d --- /dev/null +++ b/annotations_filtered/htCHOTJBiSc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.48], [11.0, 11.43], [14.0, 15.03], [23.0, 23.31], [26.0, 27.13], [28.0, 29.15], [31.0, 32.48], [33.0, 34.1], [35.0, 36.05], [46.0, 46.38], [49.0, 49.25], [50.0, 52.66], [53.0, 53.96], [60.0, 60.44], [66.0, 65.91], [71.0, 72.32], [73.0, 75.0], [76.0, 76.32], [77.0, 77.99], [84.0, 83.94], [86.0, 87.07], [88.0, 91.76], [93.0, 93.87], [96.0, 96.35], [97.0, 97.71], [100.0, 100.53], [104.0, 104.5], [107.0, 107.52], [111.0, 111.28], [114.0, 114.57], [117.0, 117.64], [124.0, 128.78], [130.0, 130.08], [133.0, 135.01], [139.0, 139.94], [141.0, 140.64], [143.0, 142.97], [146.0, 147.24], [158.0, 158.77], [159.0, 161.3], [166.0, 166.41], [173.0, 175.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.01, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 0.43, 1.03, 0.31, 1.13, 1.15, 1.48, 1.1, 1.05, 0.38, 0.25, 2.66, 0.96, 0.44, -0.09, 1.32, 2.0, 0.32, 0.99, -0.06, 1.07, 3.76, 0.87, 0.35, 0.71, 0.53, 0.5, 0.52, 0.28, 0.57, 0.64, 4.78, 0.08, 2.01, 0.94, -0.36, -0.03, 1.24, 0.77, 2.3, 0.41, 2.02]} \ No newline at end of file diff --git a/annotations_filtered/htHKbsUKDDw_filtered.json b/annotations_filtered/htHKbsUKDDw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca486ccdf7f9a280d82dfe65fd73ad1042bc5036 --- /dev/null +++ b/annotations_filtered/htHKbsUKDDw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.42], [13.0, 13.93], [17.0, 17.27], [21.0, 20.75], [23.0, 24.76], [30.0, 31.06], [36.0, 36.32], [39.0, 41.86], [50.0, 52.64], [53.0, 53.81], [58.0, 58.4], [63.0, 67.8], [77.0, 77.16], [83.0, 83.13], [86.0, 86.85], [88.0, 88.62], [91.0, 96.58], [99.0, 105.87], [107.0, 108.31], [115.0, 115.69], [120.0, 121.31], [127.0, 127.58], [133.0, 133.12], [141.0, 143.65], [147.0, 148.47], [154.0, 155.12], [158.0, 159.44], [172.0, 173.03], [175.0, 175.56], [178.0, 178.75], [184.0, 184.37], [187.0, 187.83], [191.0, 191.39], [194.0, 195.76], [196.0, 197.5], [200.0, 200.3], [204.0, 204.15], [212.0, 212.21], [215.0, 232.61], [237.0, 241.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.26, 49.0, 0.0, 0.0, 36.29, 0.0, 0.0, 0.0, 0.0, 38.55, 34.83, 0.0, 0.0, 0.0, 0.0, 0.0, 30.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.91, 47.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 82.75], ["musical instrument", 1.14], ["electronic music", 1.04]], [["music", 59.66], ["throbbing", 9.77], ["hum", 5.6]], null, null, [["speech", 47.86], ["typewriter", 13.85], ["music", 13.56]], null, null, null, null, [["speech", 40.1], ["music", 15.72], ["whale vocalization", 4.06]], [["music", 59.07], ["speech", 16.17], ["musical instrument", 5.76]], null, null, null, null, null, [["coin (dropping)", 33.69], ["ding", 26.97], ["clang", 13.3]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.78], ["throbbing", 24.15], ["hum", 20.69]], [["bee, wasp, etc.", 22.17], ["fly, housefly", 13.52], ["hum", 8.62]]], "duration": [3.42, 0.93, 0.27, -0.25, 1.76, 1.06, 0.32, 2.86, 2.64, 0.81, 0.4, 4.8, 0.16, 0.13, 0.85, 0.62, 5.58, 6.87, 1.31, 0.69, 1.31, 0.58, 0.12, 2.65, 1.47, 1.12, 1.44, 1.03, 0.56, 0.75, 0.37, 0.83, 0.39, 1.76, 1.5, 0.3, 0.15, 0.21, 17.61, 4.78]} \ No newline at end of file diff --git a/annotations_filtered/hu2AlkyvIe0_filtered.json b/annotations_filtered/hu2AlkyvIe0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41e131fe2453f54d0ae3b06d190b54c7864d4e0b --- /dev/null +++ b/annotations_filtered/hu2AlkyvIe0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.37], [9.0, 10.08], [14.0, 26.96], [28.0, 28.76], [31.0, 37.47], [39.0, 48.54], [52.0, 53.55], [55.0, 55.78], [60.0, 60.79], [65.0, 65.89], [70.0, 70.39], [76.0, 76.67], [97.0, 98.93]], "keep_status": [false, false, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.74, 0.0, 32.41, 30.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 22.52], ["livestock, farm animals, working animals", 18.35], ["speech", 14.12]], null, [["speech", 34.23], ["music", 33.18], ["crowd", 4.84]], [["speech", 30.11], ["foghorn", 16.27], ["music", 15.97]], null, null, null, null, null, null, null], "duration": [0.37, 1.08, 12.96, 0.76, 6.47, 9.54, 1.55, 0.78, 0.79, 0.89, 0.39, 0.67, 1.93]} \ No newline at end of file diff --git a/annotations_filtered/huI39DZ4b44_filtered.json b/annotations_filtered/huI39DZ4b44_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dea2ff3555ce92ab4db71a7a37431f3e65698093 --- /dev/null +++ b/annotations_filtered/huI39DZ4b44_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.21], [14.0, 24.87], [26.0, 26.86], [27.0, 31.5], [34.0, 57.86], [60.0, 69.15], [72.0, 106.49], [110.0, 145.0]], "keep_status": [false, false, false, false, true, true, false, false], "silence_prob": [0.0, 29.26, 0.0, 29.29, 28.3, 28.09, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 37.34], ["hum", 23.19], ["mains hum", 12.32]], null, [["music", 60.83], ["speech", 10.32], ["throbbing", 7.72]], [["livestock, farm animals, working animals", 19.92], ["cattle, bovinae", 7.44], ["vehicle", 7.21]], [["speech", 32.05], ["eruption", 13.15], ["explosion", 12.63]], null, null], "duration": [0.21, 10.87, 0.86, 4.5, 23.86, 9.15, 34.49, 35.0]} \ No newline at end of file diff --git a/annotations_filtered/huOZPQ6Hl2c_filtered.json b/annotations_filtered/huOZPQ6Hl2c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4836b29a8f1d5f302f83ac9ee1853ea373103fd --- /dev/null +++ b/annotations_filtered/huOZPQ6Hl2c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.9], [10.0, 34.94], [43.0, 43.14], [45.0, 45.57], [47.0, 47.56], [49.0, 49.17], [50.0, 54.08], [54.0, 56.17], [57.0, 57.43], [63.0, 75.37], [77.0, 77.36], [79.0, 85.28], [87.0, 95.44], [96.0, 96.65]], "keep_status": [false, true, false, false, false, false, true, true, false, false, false, true, false, false], "silence_prob": [0.0, 36.28, 0.0, 0.0, 0.0, 0.0, 33.83, 40.77, 0.0, 35.78, 0.0, 32.02, 31.75, 0.0], "audiomae_on_audioset": [null, [["music", 46.58], ["sidetone", 11.76], ["speech", 5.27]], null, null, null, null, [["music", 22.76], ["whack, thwack", 9.81], ["thunk", 9.32]], [["livestock, farm animals, working animals", 17.73], ["cattle, bovinae", 16.23], ["moo", 9.31]], null, [["speech", 70.76], ["whack, thwack", 5.1], ["fly, housefly", 1.9]], null, [["fly, housefly", 20.32], ["speech", 15.81], ["mains hum", 11.35]], [["speech", 77.65], ["explosion", 8.68], ["burst, pop", 1.78]], null], "duration": [-0.1, 24.94, 0.14, 0.57, 0.56, 0.17, 4.08, 2.17, 0.43, 12.37, 0.36, 6.28, 8.44, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/hudgzkYfSvU_filtered.json b/annotations_filtered/hudgzkYfSvU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97803a59c4c655345609a148dbac5b8090fd56ad --- /dev/null +++ b/annotations_filtered/hudgzkYfSvU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 12.38], [14.0, 15.69], [21.0, 23.75], [32.0, 31.92], [35.0, 38.33], [41.0, 41.81], [47.0, 48.37], [57.0, 57.18], [59.0, 59.37], [76.0, 76.72], [79.0, 81.77], [84.0, 85.23], [94.0, 94.14], [104.0, 104.75], [106.0, 107.08], [109.0, 111.57], [114.0, 115.5], [124.0, 124.56], [128.0, 129.22]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [54.43, 0.0, 38.36, 0.0, 70.44, 0.0, 0.0, 0.0, 0.0, 0.0, 33.88, 0.0, 0.0, 0.0, 0.0, 33.94, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 23.12], ["mains hum", 18.41], ["didgeridoo", 17.61]], null, null, null, null, null, null, null, [["speech", 23.63], ["music", 19.0], ["hum", 6.01]], null, null, null, null, [["speech", 32.8], ["civil defense siren", 27.92], ["siren", 12.17]], null, null, null], "duration": [7.38, 1.69, 2.75, -0.08, 3.33, 0.81, 1.37, 0.18, 0.37, 0.72, 2.77, 1.23, 0.14, 0.75, 1.08, 2.57, 1.5, 0.56, 1.22]} \ No newline at end of file diff --git a/annotations_filtered/huvEARIzQNc_filtered.json b/annotations_filtered/huvEARIzQNc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5d79ac8b86051d75b079cc4b683568984e24b9c --- /dev/null +++ b/annotations_filtered/huvEARIzQNc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.35], [7.0, 6.78], [8.0, 7.92], [9.0, 9.85], [13.0, 13.85], [16.0, 15.65], [17.0, 18.76], [19.0, 20.38], [21.0, 26.33], [28.0, 30.25], [37.0, 37.59], [43.0, 43.75], [46.0, 47.19], [51.0, 51.19], [58.0, 58.35], [62.0, 63.0], [68.0, 71.88], [72.0, 73.16], [74.0, 77.9], [78.0, 80.33], [81.0, 92.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.77, 98.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.64, 0.0, 89.54, 70.86, 57.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.35, -0.22, -0.08, 0.85, 0.85, -0.35, 1.76, 1.38, 5.33, 2.25, 0.59, 0.75, 1.19, 0.19, 0.35, 1.0, 3.88, 1.16, 3.9, 2.33, 11.65]} \ No newline at end of file diff --git a/annotations_filtered/huxXgcGvTPk_filtered.json b/annotations_filtered/huxXgcGvTPk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e900fb3b3da6d40a23527704808fea4f3dbdef7 --- /dev/null +++ b/annotations_filtered/huxXgcGvTPk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 19.48], [21.0, 21.1], [22.0, 40.1], [41.0, 51.95], [54.0, 60.56], [66.0, 66.46], [79.0, 79.27], [81.0, 81.7], [85.0, 85.26], [87.0, 88.03], [97.0, 97.75], [107.0, 107.35], [108.0, 108.65], [110.0, 110.89], [120.0, 120.9], [122.0, 123.67], [124.0, 125.19], [127.0, 127.57], [129.0, 130.0], [133.0, 134.81], [136.0, 139.24], [139.0, 139.48], [139.0, 139.51], [140.0, 141.05], [146.0, 145.79], [146.0, 148.07], [151.0, 160.19], [165.0, 165.42], [166.0, 166.95], [169.0, 169.13]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [54.04, 0.0, 68.15, 41.1, 39.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.63, 0.0, 0.0, 0.0, 0.0, 40.36, 30.27, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 59.2], ["hum", 6.35], ["mains hum", 2.32]], [["hum", 40.69], ["music", 25.37], ["throbbing", 9.74]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 49.57], ["throbbing", 11.19], ["hum", 10.15]], null, null, null, null, [["music", 54.5], ["speech", 8.66], ["hum", 6.43]], [["music", 52.22], ["hum", 11.03], ["mains hum", 8.05]], null, null, null], "duration": [8.48, 0.1, 18.1, 10.95, 6.56, 0.46, 0.27, 0.7, 0.26, 1.03, 0.75, 0.35, 0.65, 0.89, 0.9, 1.67, 1.19, 0.57, 1.0, 1.81, 3.24, 0.48, 0.51, 1.05, -0.21, 2.07, 9.19, 0.42, 0.95, 0.13]} \ No newline at end of file diff --git a/annotations_filtered/hvACHvnVCbw_filtered.json b/annotations_filtered/hvACHvnVCbw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6ef97b3a1ebd3bf033786c9f81ab2fc54f987e7 --- /dev/null +++ b/annotations_filtered/hvACHvnVCbw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 39.46], [46.0, 46.08], [47.0, 47.71], [48.0, 49.98], [51.0, 52.78], [53.0, 58.53], [59.0, 59.8], [61.0, 63.46], [64.0, 64.69], [65.0, 73.47], [74.0, 76.23], [77.0, 77.89], [78.0, 80.69], [82.0, 82.19], [84.0, 87.84], [89.0, 98.69], [102.0, 106.56], [110.0, 111.67], [112.0, 113.27], [114.0, 114.91], [119.0, 119.16], [120.0, 123.67], [126.0, 126.17], [131.0, 154.28], [157.0, 159.58], [164.0, 172.15]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, true, false, true, true, true, false, false, false, false, true, false, true, false, false], "silence_prob": [29.42, 0.0, 0.0, 0.0, 0.0, 46.36, 0.0, 50.02, 0.0, 43.25, 43.3, 0.0, 31.72, 0.0, 29.24, 28.66, 28.97, 0.0, 0.0, 0.0, 0.0, 29.85, 0.0, 31.18, 61.77, 53.34], "audiomae_on_audioset": [[["music", 13.2], ["animal", 9.73], ["speech", 8.8]], null, null, null, null, [["hum", 19.12], ["mains hum", 10.76], ["sidetone", 10.22]], null, null, null, [["speech", 35.55], ["sidetone", 35.42], ["hum", 6.37]], [["speech", 53.75], ["sidetone", 17.19], ["radio", 8.6]], null, [["speech", 38.46], ["hum", 9.11], ["music", 7.38]], null, [["explosion", 23.5], ["boom", 20.13], ["hum", 11.37]], [["speech", 43.1], ["music", 12.22], ["whack, thwack", 5.91]], [["music", 21.19], ["rumble", 21.02], ["hum", 18.08]], null, null, null, null, [["whale vocalization", 46.24], ["music", 3.37], ["rumble", 2.87]], null, [["speech", 23.17], ["hum", 16.0], ["livestock, farm animals, working animals", 8.51]], null, null], "duration": [13.46, 0.08, 0.71, 1.98, 1.78, 5.53, 0.8, 2.46, 0.69, 8.47, 2.23, 0.89, 2.69, 0.19, 3.84, 9.69, 4.56, 1.67, 1.27, 0.91, 0.16, 3.67, 0.17, 23.28, 2.58, 8.15]} \ No newline at end of file diff --git a/annotations_filtered/hvZiZFDE3A8_filtered.json b/annotations_filtered/hvZiZFDE3A8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fb2010580854e6ff92b681305ef3c01d61bc88c --- /dev/null +++ b/annotations_filtered/hvZiZFDE3A8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[54.0, 54.72], [66.0, 67.63], [69.0, 70.36], [71.0, 75.03], [79.0, 79.34], [80.0, 80.99], [82.0, 84.03], [88.0, 88.11]], "keep_status": [false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.52, 0.0, 0.0, 35.47, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 43.52], ["speech", 15.25], ["didgeridoo", 6.13]], null, null, [["music", 68.44], ["musical instrument", 2.22], ["electronic music", 1.64]], null], "duration": [0.72, 1.63, 1.36, 4.03, 0.34, 0.99, 2.03, 0.11]} \ No newline at end of file diff --git a/annotations_filtered/hv_mYkUEGko_filtered.json b/annotations_filtered/hv_mYkUEGko_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abf7924a11a4c84d152424592bab5bb6b8055bc2 --- /dev/null +++ b/annotations_filtered/hv_mYkUEGko_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.7], [26.0, 31.38], [36.0, 36.78], [39.0, 39.11], [46.0, 49.81], [52.0, 51.87], [53.0, 53.54], [54.0, 54.82], [56.0, 56.79], [71.0, 71.02], [73.0, 73.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.61, 0.0, 0.0, 32.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 64.27], ["synthesizer", 20.27], ["musical instrument", 4.89]], null, null, [["fart", 52.4], ["speech", 14.12], ["boing", 6.9]], null, null, null, null, null, null], "duration": [0.7, 5.38, 0.78, 0.11, 3.81, -0.13, 0.54, 0.82, 0.79, 0.02, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/hvuQCnADQRM_filtered.json b/annotations_filtered/hvuQCnADQRM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edf4688ef420a5d4609c47285d5e6d73e58588d3 --- /dev/null +++ b/annotations_filtered/hvuQCnADQRM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.89], [4.0, 4.51], [7.0, 7.37], [10.0, 11.21], [14.0, 14.74], [16.0, 23.35], [26.0, 29.39], [30.0, 34.25], [36.0, 36.36], [40.0, 61.75], [62.0, 72.71], [73.0, 74.26], [77.0, 77.45], [78.0, 83.56], [84.0, 85.67], [87.0, 86.7], [87.0, 88.62], [89.0, 89.18], [93.0, 96.01]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 55.74, 35.54, 82.97, 0.0, 40.88, 30.47, 0.0, 0.0, 61.87, 0.0, 0.0, 0.0, 0.0, 36.93], "audiomae_on_audioset": [null, null, null, null, null, null, [["cattle, bovinae", 62.26], ["moo", 27.02], ["livestock, farm animals, working animals", 9.05]], null, null, [["howl", 32.86], ["animal", 9.17], ["livestock, farm animals, working animals", 7.32]], [["car", 18.59], ["vehicle", 16.72], ["skidding", 15.23]], null, null, null, null, null, null, null, [["speech", 27.0], ["snicker", 13.41], ["animal", 6.9]]], "duration": [0.89, 0.51, 0.37, 1.21, 0.74, 7.35, 3.39, 4.25, 0.36, 21.75, 10.71, 1.26, 0.45, 5.56, 1.67, -0.3, 1.62, 0.18, 3.01]} \ No newline at end of file diff --git a/annotations_filtered/hvvTxyks7L8_filtered.json b/annotations_filtered/hvvTxyks7L8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91f9b872f9eb43258638a6da7a7efb11f469bcf6 --- /dev/null +++ b/annotations_filtered/hvvTxyks7L8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.21], [8.0, 26.16], [39.0, 58.14], [61.0, 62.51], [66.0, 71.49], [73.0, 79.52], [81.0, 98.93], [99.0, 98.96]], "keep_status": [false, false, false, false, true, false, true, false], "silence_prob": [0.0, 99.99, 98.51, 0.0, 44.63, 99.95, 37.31, 0.0], "audiomae_on_audioset": [null, null, null, null, [["water", 27.0], ["liquid", 17.83], ["squish", 10.49]], null, [["music", 35.53], ["theremin", 21.8], ["speech", 10.28]], null], "duration": [0.21, 18.16, 19.14, 1.51, 5.49, 6.52, 17.93, -0.04]} \ No newline at end of file diff --git a/annotations_filtered/hw3lBV-89M0_filtered.json b/annotations_filtered/hw3lBV-89M0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0734ab3431ec925cc8e29de7c94d3d629d8243f9 --- /dev/null +++ b/annotations_filtered/hw3lBV-89M0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.53], [9.0, 9.53], [11.0, 13.54], [17.0, 17.36], [20.0, 20.7], [23.0, 23.46], [27.0, 28.7], [35.0, 35.19], [47.0, 47.39], [54.0, 56.54], [58.0, 58.5], [60.0, 60.64], [62.0, 63.05], [64.0, 64.71], [74.0, 74.85]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.47, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 34.87], ["synthesizer", 5.02], ["fart", 3.62]], null, null, null, null, null, null, [["music", 56.31], ["synthesizer", 12.79], ["sampler", 3.2]], null, null, null, null, null], "duration": [0.53, 0.53, 2.54, 0.36, 0.7, 0.46, 1.7, 0.19, 0.39, 2.54, 0.5, 0.64, 1.05, 0.71, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/hw6GwhfNl7U_filtered.json b/annotations_filtered/hw6GwhfNl7U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ac5d461d3f7707f6afbdb2a563f12d96d5f8379 --- /dev/null +++ b/annotations_filtered/hw6GwhfNl7U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.28], [8.0, 16.01], [20.0, 28.98], [30.0, 30.94], [33.0, 37.71], [44.0, 45.47], [47.0, 67.15], [69.0, 86.9], [89.0, 88.89], [90.0, 91.42], [92.0, 96.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 32.96, 32.98, 0.0, 29.83, 0.0, 32.71, 31.66, 0.0, 0.0, 43.35], "audiomae_on_audioset": [null, [["gong", 55.14], ["fly, housefly", 11.91], ["music", 5.81]], [["didgeridoo", 58.46], ["music", 19.9], ["speech", 6.97]], null, [["music", 50.99], ["hum", 13.95], ["mains hum", 5.31]], null, [["music", 48.92], ["speech", 16.55], ["groan", 7.24]], [["music", 64.18], ["scary music", 8.48], ["ambient music", 3.27]], null, null, [["music", 42.39], ["hiccup", 5.2], ["speech", 4.9]]], "duration": [1.28, 8.01, 8.98, 0.94, 4.71, 1.47, 20.15, 17.9, -0.11, 1.42, 4.52]} \ No newline at end of file diff --git a/annotations_filtered/hwTf9WurF4U_filtered.json b/annotations_filtered/hwTf9WurF4U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f2bc5b8e2636f2a00ba5c56b552f579b0b28657 --- /dev/null +++ b/annotations_filtered/hwTf9WurF4U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.31], [12.0, 14.94], [16.0, 16.73], [21.0, 29.44], [35.0, 35.61], [37.0, 37.91], [39.0, 41.44], [47.0, 47.24], [49.0, 57.45], [58.0, 83.24], [84.0, 125.91], [129.0, 131.82], [134.0, 154.36]], "keep_status": [false, true, false, false, false, false, true, false, true, true, false, true, false], "silence_prob": [51.99, 38.8, 0.0, 30.17, 0.0, 0.0, 30.59, 0.0, 31.11, 30.25, 0.0, 28.67, 29.82], "audiomae_on_audioset": [null, [["fly, housefly", 32.96], ["mosquito", 15.18], ["insect", 14.27]], null, [["music", 63.19], ["drum", 5.72], ["theremin", 5.32]], null, null, [["music", 39.45], ["boing", 12.76], ["whip", 6.2]], null, [["speech", 25.92], ["music", 23.2], ["hum", 10.21]], [["mains hum", 29.36], ["speech", 17.18], ["hum", 14.24]], null, [["hum", 34.06], ["mains hum", 22.84], ["throbbing", 6.99]], [["music", 63.3], ["buzz", 8.59], ["mains hum", 6.0]]], "duration": [4.31, 2.94, 0.73, 8.44, 0.61, 0.91, 2.44, 0.24, 8.45, 25.24, 41.91, 2.82, 20.36]} \ No newline at end of file diff --git a/annotations_filtered/hwb1MK66new_filtered.json b/annotations_filtered/hwb1MK66new_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cadd8c51a8fe2ac84a79c25f67e74e8bef07e26a --- /dev/null +++ b/annotations_filtered/hwb1MK66new_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 73.7], [81.0, 84.67], [89.0, 90.75], [93.0, 118.15]], "keep_status": [false, true, false, true], "silence_prob": [0.0, 29.05, 0.0, 31.0], "audiomae_on_audioset": [null, [["music", 12.81], ["speech", 12.64], ["fly, housefly", 12.05]], null, [["rumble", 23.2], ["speech", 14.06], ["whale vocalization", 11.04]]], "duration": [54.7, 3.67, 1.75, 25.15]} \ No newline at end of file diff --git a/annotations_filtered/hwc74Ns9EZI_filtered.json b/annotations_filtered/hwc74Ns9EZI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4c52dfc5b2bd7e126b2e6c42a6ba7b144af7127 --- /dev/null +++ b/annotations_filtered/hwc74Ns9EZI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.07], [6.0, 16.78], [24.0, 26.06], [31.0, 32.48], [34.0, 35.95], [39.0, 50.4], [52.0, 53.11], [55.0, 55.26]], "keep_status": [true, false, false, false, false, true, false, false], "silence_prob": [40.45, 54.04, 60.7, 0.0, 0.0, 30.12, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 14.59], ["music", 14.55], ["chirp tone", 12.84]], null, null, null, null, [["music", 45.6], ["cattle, bovinae", 6.37], ["speech", 6.18]], null, null], "duration": [2.07, 10.78, 2.06, 1.48, 1.95, 11.4, 1.11, 0.26]} \ No newline at end of file diff --git a/annotations_filtered/hweZTM7VPbk_filtered.json b/annotations_filtered/hweZTM7VPbk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec60131dc9da5d0be9bf4b104e35b8680d663eaa --- /dev/null +++ b/annotations_filtered/hweZTM7VPbk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.43], [5.0, 5.66], [6.0, 8.8], [9.0, 13.88], [18.0, 18.3], [25.0, 26.79], [34.0, 34.23], [38.0, 42.9], [43.0, 44.12], [44.0, 46.55], [52.0, 53.08], [54.0, 54.43], [55.0, 56.98], [58.0, 58.83], [60.0, 60.96], [62.0, 63.15], [65.0, 64.72], [66.0, 67.86], [73.0, 82.81], [84.0, 89.48], [91.0, 93.82], [96.0, 98.37], [99.0, 99.84], [109.0, 111.96], [117.0, 116.92], [124.0, 124.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 92.31, 74.6, 0.0, 0.0, 0.0, 64.63, 0.0, 69.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.89, 32.37, 41.07, 36.99, 0.0, 31.58, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 68.9], ["synthesizer", 8.07], ["didgeridoo", 5.06]], [["music", 33.63], ["speech", 8.99], ["trombone", 6.66]], [["music", 63.59], ["synthesizer", 6.59], ["speech", 4.93]], [["music", 40.72], ["speech", 24.39], ["synthesizer", 9.66]], null, [["music", 33.39], ["speech", 21.97], ["theremin", 13.82]], null, null], "duration": [1.43, 0.66, 2.8, 4.88, 0.3, 1.79, 0.23, 4.9, 1.12, 2.55, 1.08, 0.43, 1.98, 0.83, 0.96, 1.15, -0.28, 1.86, 9.81, 5.48, 2.82, 2.37, 0.84, 2.96, -0.08, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/hwevrtap9AY_filtered.json b/annotations_filtered/hwevrtap9AY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3f234356862f12ba67b6bb295598b61bd1297fc --- /dev/null +++ b/annotations_filtered/hwevrtap9AY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[72.0, 71.52], [73.0, 76.15], [80.0, 90.81]], "keep_status": [false, false, false], "silence_prob": [0.0, 31.13, 30.87], "audiomae_on_audioset": [null, [["music", 71.54], ["throbbing", 4.14], ["noise", 3.32]], [["throbbing", 39.63], ["hum", 22.6], ["music", 22.29]]], "duration": [-0.48, 3.15, 10.81]} \ No newline at end of file diff --git a/annotations_filtered/hwpHOq3Xbks_filtered.json b/annotations_filtered/hwpHOq3Xbks_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ea8bddd3209129d2e05e9bb8719fd7eac2a9f6c --- /dev/null +++ b/annotations_filtered/hwpHOq3Xbks_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.97], [4.0, 4.6], [7.0, 9.95], [12.0, 12.78], [15.0, 15.58], [17.0, 16.88], [18.0, 24.49], [31.0, 30.72], [31.0, 36.42], [39.0, 39.07], [43.0, 44.32], [48.0, 49.15], [50.0, 53.22], [54.0, 54.95], [56.0, 56.88], [59.0, 59.44], [60.0, 60.0], [63.0, 71.02], [73.0, 78.44], [80.0, 103.06], [103.0, 108.24], [112.0, 111.59], [112.0, 126.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 56.1, 0.0, 0.0, 0.0, 61.67, 0.0, 41.16, 0.0, 0.0, 0.0, 76.2, 0.0, 0.0, 0.0, 0.0, 42.88, 41.48, 31.73, 30.11, 0.0, 32.71], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 56.66], ["speech", 22.97], ["theremin", 4.42]], null, null, null, null, null, null, null, null, [["music", 60.24], ["throbbing", 21.72], ["electronic music", 4.89]], [["throbbing", 49.54], ["music", 23.14], ["hum", 20.05]], [["music", 64.57], ["speech", 8.53], ["electronic music", 3.63]], [["speech", 37.04], ["music", 24.06], ["vehicle", 11.48]], null, [["fly, housefly", 14.79], ["music", 14.02], ["insect", 11.33]]], "duration": [-0.03, 0.6, 2.95, 0.78, 0.58, -0.12, 6.49, -0.28, 5.42, 0.07, 1.32, 1.15, 3.22, 0.95, 0.88, 0.44, 0.0, 8.02, 5.44, 23.06, 5.24, -0.41, 14.93]} \ No newline at end of file diff --git a/annotations_filtered/hxi06yeErvk_filtered.json b/annotations_filtered/hxi06yeErvk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4c4c24217cbbe1c06cb9bb7824672fddacad8ac --- /dev/null +++ b/annotations_filtered/hxi06yeErvk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.63], [1.0, 0.67], [1.0, 1.97], [2.0, 2.42], [3.0, 2.86], [3.0, 4.26], [4.0, 11.91], [14.0, 14.13], [14.0, 36.27], [48.0, 48.37], [51.0, 52.68], [54.0, 57.18], [62.0, 62.63], [70.0, 73.87], [75.0, 80.11]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.18, 0.0, 35.88, 0.0, 0.0, 60.51, 0.0, 39.25, 38.36], "audiomae_on_audioset": [null, null, null, null, null, null, [["whale vocalization", 31.47], ["livestock, farm animals, working animals", 13.03], ["hum", 12.31]], null, [["music", 49.69], ["musical instrument", 13.78], ["didgeridoo", 4.93]], null, null, null, null, [["music", 71.8], ["boing", 4.84], ["musical instrument", 3.57]], [["music", 64.8], ["musical instrument", 7.16], ["brass instrument", 6.94]]], "duration": [0.63, -0.33, 0.97, 0.42, -0.14, 1.26, 7.91, 0.13, 22.27, 0.37, 1.68, 3.18, 0.63, 3.87, 5.11]} \ No newline at end of file diff --git a/annotations_filtered/hy0b9Rz31Zs_filtered.json b/annotations_filtered/hy0b9Rz31Zs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54c3fd86692fdda261796e3fcab783baa67b6af9 --- /dev/null +++ b/annotations_filtered/hy0b9Rz31Zs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.08], [5.0, 16.65], [18.0, 18.44], [20.0, 23.79], [24.0, 27.4], [28.0, 29.35], [30.0, 31.7], [33.0, 37.52], [39.0, 42.62], [43.0, 46.04], [47.0, 50.26], [51.0, 53.54], [55.0, 59.78], [61.0, 63.39], [64.0, 67.14], [68.0, 68.59], [69.0, 80.67], [82.0, 84.75], [88.0, 90.15], [91.0, 92.4], [93.0, 93.04], [94.0, 95.18], [97.0, 97.17], [98.0, 100.21], [101.0, 107.99], [116.0, 127.87]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [44.9, 87.19, 0.0, 85.72, 48.23, 0.0, 0.0, 60.23, 75.39, 36.58, 89.36, 93.6, 62.17, 81.71, 46.57, 0.0, 88.28, 87.55, 56.18, 0.0, 0.0, 0.0, 0.0, 48.48, 35.44, 30.15], "audiomae_on_audioset": [[["speech", 22.06], ["sidetone", 19.96], ["mains hum", 5.66]], null, null, null, [["tuning fork", 35.13], ["sine wave", 27.27], ["speech", 10.99]], null, null, null, null, [["speech", 55.48], ["hum", 10.69], ["sidetone", 4.19]], null, null, null, null, [["speech", 54.54], ["sine wave", 16.67], ["tuning fork", 8.64]], null, null, null, null, null, null, null, null, [["sidetone", 23.6], ["music", 18.2], ["hum", 8.15]], [["hum", 32.8], ["music", 29.34], ["theremin", 9.21]], [["theremin", 84.78], ["music", 10.93], ["synthesizer", 1.02]]], "duration": [2.08, 11.65, 0.44, 3.79, 3.4, 1.35, 1.7, 4.52, 3.62, 3.04, 3.26, 2.54, 4.78, 2.39, 3.14, 0.59, 11.67, 2.75, 2.15, 1.4, 0.04, 1.18, 0.17, 2.21, 6.99, 11.87]} \ No newline at end of file diff --git a/annotations_filtered/hyXCJXsHX3A_filtered.json b/annotations_filtered/hyXCJXsHX3A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3982f790f37ca0165e935e11b5eb7e843cdacf27 --- /dev/null +++ b/annotations_filtered/hyXCJXsHX3A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.9], [10.0, 10.29], [12.0, 12.16], [14.0, 14.28], [18.0, 18.17], [25.0, 26.79], [34.0, 35.7], [40.0, 40.27], [42.0, 42.74], [44.0, 45.1], [46.0, 46.8], [49.0, 58.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.9, 0.29, 0.16, 0.28, 0.17, 1.79, 1.7, 0.27, 0.74, 1.1, 0.8, 9.04]} \ No newline at end of file diff --git a/annotations_filtered/hzV5qSWRfKY_filtered.json b/annotations_filtered/hzV5qSWRfKY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a482e1efb9c7c7ffd1654d0df75ef640fde78ef0 --- /dev/null +++ b/annotations_filtered/hzV5qSWRfKY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 23.06], [29.0, 30.48], [31.0, 32.02], [32.0, 37.37], [39.0, 45.13], [46.0, 46.31], [48.0, 47.82], [50.0, 50.3], [52.0, 54.77], [57.0, 60.25], [61.0, 62.01], [64.0, 65.84], [66.0, 66.7], [68.0, 68.08], [68.0, 77.97], [79.0, 79.15], [80.0, 80.37], [81.0, 80.91], [89.0, 89.29], [92.0, 92.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [74.92, 0.0, 0.0, 75.88, 80.29, 0.0, 0.0, 0.0, 94.66, 86.82, 0.0, 0.0, 0.0, 0.0, 66.27, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.06, 1.48, 1.02, 5.37, 6.13, 0.31, -0.18, 0.3, 2.77, 3.25, 1.01, 1.84, 0.7, 0.08, 9.97, 0.15, 0.37, -0.09, 0.29, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/hzmZJcPlJlE_filtered.json b/annotations_filtered/hzmZJcPlJlE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c1d1ef8c8576d0bd6bc850e243b80dfe5fc52c8 --- /dev/null +++ b/annotations_filtered/hzmZJcPlJlE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.94], [12.0, 15.25], [16.0, 24.11], [25.0, 25.81], [28.0, 29.98], [32.0, 32.0], [33.0, 33.47], [34.0, 43.16], [48.0, 52.37], [55.0, 55.07], [56.0, 56.86], [58.0, 107.42], [110.0, 123.47], [127.0, 132.17], [135.0, 142.15], [144.0, 148.24], [155.0, 156.09], [158.0, 159.0], [161.0, 164.42]], "keep_status": [false, true, true, false, false, false, false, true, true, false, false, false, true, false, true, true, false, false, true], "silence_prob": [0.0, 29.61, 33.93, 0.0, 0.0, 0.0, 0.0, 28.54, 29.25, 0.0, 0.0, 0.0, 28.34, 29.25, 28.78, 28.87, 0.0, 0.0, 29.61], "audiomae_on_audioset": [null, [["sound effect", 16.12], ["speech", 10.61], ["echo", 9.85]], [["music", 29.24], ["noise", 9.61], ["buzz", 7.5]], null, null, null, null, [["music", 12.68], ["fly, housefly", 12.58], ["mosquito", 10.96]], [["foghorn", 36.99], ["theremin", 11.83], ["music", 9.95]], null, null, null, [["speech", 14.55], ["music", 13.34], ["buzz", 9.68]], [["music", 69.45], ["speech", 5.01], ["animal", 3.07]], [["music", 19.2], ["pulse", 6.21], ["sound effect", 5.88]], [["music", 39.21], ["hum", 6.98], ["musical instrument", 6.66]], null, null, [["foghorn", 24.99], ["music", 17.64], ["trombone", 16.74]]], "duration": [0.94, 3.25, 8.11, 0.81, 1.98, 0.0, 0.47, 9.16, 4.37, 0.07, 0.86, 49.42, 13.47, 5.17, 7.15, 4.24, 1.09, 1.0, 3.42]} \ No newline at end of file