diff --git a/annotations_filtered/j-47cwN0w_c_filtered.json b/annotations_filtered/j-47cwN0w_c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..158b87632a841f8e064ec3cecc6c444126e0b1ec --- /dev/null +++ b/annotations_filtered/j-47cwN0w_c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.23], [13.0, 15.7], [17.0, 19.74], [21.0, 24.26], [25.0, 30.0], [32.0, 37.56], [39.0, 80.72], [81.0, 83.93], [85.0, 84.94]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [98.59, 99.1, 99.21, 92.31, 94.37, 97.11, 0.0, 51.39, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [5.23, 2.7, 2.74, 3.26, 5.0, 5.56, 41.72, 2.93, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/j-7pVks8avo_filtered.json b/annotations_filtered/j-7pVks8avo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2639ad4e822d856c5089d1953a4e5205274ca7d7 --- /dev/null +++ b/annotations_filtered/j-7pVks8avo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.42], [16.0, 16.11], [38.0, 38.35], [41.0, 40.88], [47.0, 47.71], [51.0, 52.22], [57.0, 57.01], [63.0, 63.95], [66.0, 66.7], [67.0, 67.49], [77.0, 77.94], [84.0, 84.82], [132.0, 132.09], [133.0, 133.44], [144.0, 145.03], [146.0, 147.39], [148.0, 152.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 30.47], ["radio", 24.87], ["speech", 19.64]]], "duration": [0.42, 0.11, 0.35, -0.12, 0.71, 1.22, 0.01, 0.95, 0.7, 0.49, 0.94, 0.82, 0.09, 0.44, 1.03, 1.39, 4.31]} \ No newline at end of file diff --git a/annotations_filtered/j-OcaLECz1k_filtered.json b/annotations_filtered/j-OcaLECz1k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a884c826e45ecae9ab3e86e86da966b3bca8491 --- /dev/null +++ b/annotations_filtered/j-OcaLECz1k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [9.0, 10.47], [12.0, 12.21], [15.0, 17.39], [24.0, 26.28], [31.0, 34.38], [39.0, 40.42], [42.0, 43.31], [49.0, 50.13], [54.0, 55.63], [56.0, 57.92], [59.0, 59.86], [63.0, 66.07], [67.0, 69.36], [71.0, 72.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.97, 96.66, 85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 1.47, 0.21, 2.39, 2.28, 3.38, 1.42, 1.31, 1.13, 1.63, 1.92, 0.86, 3.07, 2.36, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/j-TPDJFWErg_filtered.json b/annotations_filtered/j-TPDJFWErg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52ce7f027cb48f9c66f689496c2ec31dc41b5765 --- /dev/null +++ b/annotations_filtered/j-TPDJFWErg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.23], [5.0, 8.53], [12.0, 12.51], [14.0, 55.49], [57.0, 62.99], [63.0, 64.15], [65.0, 70.8], [71.0, 72.03], [73.0, 74.29], [75.0, 81.58], [84.0, 92.01], [96.0, 120.68], [123.0, 136.92], [138.0, 138.38], [141.0, 141.17], [143.0, 145.2], [146.0, 146.5], [147.0, 148.44], [149.0, 151.01], [151.0, 152.79], [153.0, 160.17], [162.0, 163.51], [164.0, 167.59], [168.0, 170.78], [171.0, 172.52], [173.0, 174.04]], "keep_status": [false, false, false, false, true, false, true, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.81, 0.0, 0.0, 33.3, 0.0, 34.98, 0.0, 0.0, 34.14, 32.26, 34.07, 33.98, 0.0, 0.0, 63.1, 0.0, 0.0, 74.44, 0.0, 51.6, 0.0, 63.64, 79.24, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 58.52], ["speech", 21.63], ["animal", 1.21]], null, null, [["music", 27.81], ["noise", 14.59], ["theremin", 8.23]], null, [["speech", 22.75], ["music", 19.09], ["noise", 10.49]], null, null, [["music", 17.3], ["noise", 16.54], ["speech", 13.02]], [["music", 38.99], ["smash, crash", 14.07], ["whack, thwack", 9.83]], [["music", 54.57], ["speech", 20.23], ["throbbing", 8.14]], [["music", 41.43], ["throbbing", 11.01], ["hum", 10.99]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.23, 3.53, 0.51, 41.49, 5.99, 1.15, 5.8, 1.03, 1.29, 6.58, 8.01, 24.68, 13.92, 0.38, 0.17, 2.2, 0.5, 1.44, 2.01, 1.79, 7.17, 1.51, 3.59, 2.78, 1.52, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/j-V12tL78Mc_filtered.json b/annotations_filtered/j-V12tL78Mc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38e2d3cb7ff66854f449861187112f6606b2a154 --- /dev/null +++ b/annotations_filtered/j-V12tL78Mc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.77], [24.0, 44.98], [46.0, 68.12], [74.0, 78.36], [80.0, 82.7], [87.0, 87.27], [88.0, 89.02], [90.0, 91.44], [93.0, 93.24], [95.0, 96.33], [97.0, 100.95], [106.0, 107.7], [108.0, 109.0], [110.0, 120.06], [120.0, 120.11], [121.0, 121.42]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 66.63, 70.86, 36.02, 85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 59.33, 0.0, 0.0, 62.17, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 16.24], ["speech", 14.0], ["hum", 13.38]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.77, 20.98, 22.12, 4.36, 2.7, 0.27, 1.02, 1.44, 0.24, 1.33, 3.95, 1.7, 1.0, 10.06, 0.11, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/j-dYZPMpoqI_filtered.json b/annotations_filtered/j-dYZPMpoqI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1ab1cc052d6bbe1f6067b2337929d005d53a945 --- /dev/null +++ b/annotations_filtered/j-dYZPMpoqI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 26.45], [28.0, 32.97], [35.0, 43.11], [44.0, 43.95], [44.0, 177.79], [178.0, 184.27], [185.0, 186.19], [188.0, 188.67]], "keep_status": [false, true, true, false, false, false, false, false], "silence_prob": [28.49, 32.58, 28.54, 0.0, 0.0, 86.82, 0.0, 0.0], "audiomae_on_audioset": [[["music", 45.8], ["throbbing", 20.37], ["smash, crash", 8.71]], [["hum", 27.42], ["mains hum", 23.46], ["music", 16.45]], [["music", 58.54], ["cacophony", 5.39], ["smash, crash", 4.97]], null, null, null, null, null], "duration": [4.45, 4.97, 8.11, -0.05, 133.79, 6.27, 1.19, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/j-v6XtJFNQE_filtered.json b/annotations_filtered/j-v6XtJFNQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26d6d6519d33810ba3a8b50a49e718d05c1567a3 --- /dev/null +++ b/annotations_filtered/j-v6XtJFNQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.44], [13.0, 16.24], [18.0, 19.57], [21.0, 24.0], [27.0, 27.45], [31.0, 32.66], [35.0, 38.6], [40.0, 40.42], [42.0, 41.67], [46.0, 46.8], [50.0, 52.24], [55.0, 81.06], [82.0, 83.37], [85.0, 86.71], [87.0, 87.72], [90.0, 90.69], [91.0, 91.86], [93.0, 94.41], [99.0, 118.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 89.54, 0.0, 94.22, 0.0, 0.0, 99.1, 0.0, 0.0, 0.0, 60.32, 41.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.68], ["explosion", 14.41], ["fly, housefly", 7.36]], null, null, null, null, null, null, null], "duration": [0.44, 3.24, 1.57, 3.0, 0.45, 1.66, 3.6, 0.42, -0.33, 0.8, 2.24, 26.06, 1.37, 1.71, 0.72, 0.69, 0.86, 1.41, 19.74]} \ No newline at end of file diff --git a/annotations_filtered/j0IXQIUh3jQ_filtered.json b/annotations_filtered/j0IXQIUh3jQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/j0IXQIUh3jQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/j0c_RQDfjSM_filtered.json b/annotations_filtered/j0c_RQDfjSM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d791adac4962f9c273399a74b2152edddd6920dc --- /dev/null +++ b/annotations_filtered/j0c_RQDfjSM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.82], [6.0, 6.1], [14.0, 13.91], [18.0, 18.57], [23.0, 23.28], [24.0, 24.95], [35.0, 35.65], [38.0, 38.97], [42.0, 42.77], [46.0, 47.56], [52.0, 52.51], [57.0, 57.18], [63.0, 63.04], [63.0, 63.91], [65.0, 66.43], [68.0, 68.96], [69.0, 81.09], [82.0, 83.37], [84.0, 84.94], [88.0, 88.96], [93.0, 100.36], [102.0, 108.38], [110.0, 121.05], [121.0, 121.17], [121.0, 136.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.63, 0.0, 0.0, 0.0, 29.35, 29.12, 29.18, 0.0, 30.58], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 88.64], ["boing", 4.79], ["speech", 1.66]], null, null, null, [["music", 82.08], ["fly, housefly", 2.34], ["sidetone", 1.7]], [["music", 50.23], ["didgeridoo", 15.0], ["hum", 3.49]], [["music", 62.88], ["electric shaver, electric razor", 9.88], ["electronic music", 3.1]], null, [["music", 88.33], ["throbbing", 1.83], ["speech", 1.33]]], "duration": [1.82, 0.1, -0.09, 0.57, 0.28, 0.95, 0.65, 0.97, 0.77, 1.56, 0.51, 0.18, 0.04, 0.91, 1.43, 0.96, 12.09, 1.37, 0.94, 0.96, 7.36, 6.38, 11.05, 0.17, 15.71]} \ No newline at end of file diff --git a/annotations_filtered/j0cqqCpIZHE_filtered.json b/annotations_filtered/j0cqqCpIZHE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09f0fb70bc35010ddd106faa10b54eab7f103c3e --- /dev/null +++ b/annotations_filtered/j0cqqCpIZHE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.4], [6.0, 7.32], [11.0, 11.77], [26.0, 25.89], [26.0, 26.0], [26.0, 26.18], [26.0, 26.22], [26.0, 26.45], [26.0, 27.18], [27.0, 27.23], [28.0, 28.59], [30.0, 30.18], [32.0, 33.52], [35.0, 35.34], [40.0, 44.71], [45.0, 46.23], [48.0, 48.51], [50.0, 50.23], [54.0, 54.55], [60.0, 67.51], [69.0, 70.73], [72.0, 72.93], [75.0, 77.4], [79.0, 81.04], [88.0, 88.48], [89.0, 90.41], [97.0, 97.56], [98.0, 98.36], [99.0, 99.84], [115.0, 115.32], [118.0, 118.84], [120.0, 120.51], [122.0, 123.74], [125.0, 126.1], [127.0, 128.46], [135.0, 136.81], [138.0, 140.12], [141.0, 143.63], [144.0, 147.7], [149.0, 150.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.35, 0.0, 0.0, 0.0, 0.0, 30.6, 0.0, 0.0, 40.55, 37.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.1, 57.89, 50.21, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 56.82], ["mains hum", 8.46], ["hum", 6.42]], null, null, null, null, [["speech", 67.69], ["music", 12.28], ["breaking", 2.32]], null, null, [["music", 55.71], ["didgeridoo", 8.39], ["hum", 6.08]], [["music", 35.96], ["musical instrument", 5.33], ["vehicle", 3.29]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.76], ["speech", 24.3], ["theremin", 16.26]], null, null, null], "duration": [0.4, 1.32, 0.77, -0.11, 0.0, 0.18, 0.22, 0.45, 1.18, 0.23, 0.59, 0.18, 1.52, 0.34, 4.71, 1.23, 0.51, 0.23, 0.55, 7.51, 1.73, 0.93, 2.4, 2.04, 0.48, 1.41, 0.56, 0.36, 0.84, 0.32, 0.84, 0.51, 1.74, 1.1, 1.46, 1.81, 2.12, 2.63, 3.7, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/j0iplsU1qa4_filtered.json b/annotations_filtered/j0iplsU1qa4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3aef6da62c77721baa8e3032eb9f03575fc9bad --- /dev/null +++ b/annotations_filtered/j0iplsU1qa4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.04], [7.0, 7.25], [8.0, 8.68], [13.0, 14.0], [21.0, 21.47], [24.0, 24.54], [26.0, 30.47], [32.0, 34.74], [36.0, 45.22], [50.0, 50.35], [52.0, 53.16], [56.0, 58.01], [59.0, 60.79], [61.0, 62.68], [68.0, 68.39], [73.0, 73.41], [77.0, 80.32], [81.0, 81.19], [86.0, 86.68], [88.0, 88.57], [90.0, 97.31], [98.0, 102.96], [103.0, 104.21], [108.0, 108.87], [114.0, 114.35], [115.0, 119.45], [120.0, 120.97], [123.0, 126.47], [128.0, 129.83], [132.0, 133.69], [135.0, 137.15], [138.0, 138.97], [140.0, 141.24], [145.0, 145.94], [152.0, 153.55], [155.0, 155.88], [157.0, 157.96], [159.0, 159.92], [164.0, 164.73]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.22, 53.1, 28.98, 0.0, 0.0, 33.19, 0.0, 0.0, 0.0, 0.0, 30.42, 0.0, 0.0, 0.0, 30.69, 30.38, 0.0, 0.0, 0.0, 28.81, 0.0, 34.07, 0.0, 0.0, 31.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 32.17], ["music", 16.16], ["throbbing", 13.5]], null, [["hum", 46.09], ["mains hum", 17.32], ["whale vocalization", 8.72]], null, null, [["music", 14.26], ["hum", 13.45], ["mains hum", 9.15]], null, null, null, null, [["hum", 35.76], ["mains hum", 24.92], ["throbbing", 6.9]], null, null, null, [["hum", 29.61], ["fly, housefly", 11.37], ["bee, wasp, etc.", 10.02]], [["bee, wasp, etc.", 36.47], ["insect", 16.69], ["fly, housefly", 14.32]], null, null, null, [["speech", 63.13], ["music", 5.4], ["rumble", 3.59]], null, [["music", 18.39], ["hum", 15.08], ["speech", 11.99]], null, null, [["noise", 29.61], ["white noise", 10.44], ["hum", 8.41]], null, null, null, null, null, null, null, null], "duration": [1.04, 0.25, 0.68, 1.0, 0.47, 0.54, 4.47, 2.74, 9.22, 0.35, 1.16, 2.01, 1.79, 1.68, 0.39, 0.41, 3.32, 0.19, 0.68, 0.57, 7.31, 4.96, 1.21, 0.87, 0.35, 4.45, 0.97, 3.47, 1.83, 1.69, 2.15, 0.97, 1.24, 0.94, 1.55, 0.88, 0.96, 0.92, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/j0sbjGj7ONo_filtered.json b/annotations_filtered/j0sbjGj7ONo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0d673304810073b1a6de8728eb972ca739bd31c --- /dev/null +++ b/annotations_filtered/j0sbjGj7ONo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.62], [14.0, 20.04], [21.0, 21.88], [30.0, 38.55], [40.0, 40.37], [42.0, 51.48], [52.0, 61.67], [63.0, 63.85], [65.0, 74.12], [75.0, 76.33], [79.0, 80.82], [82.0, 83.78], [85.0, 87.49], [88.0, 88.99], [91.0, 95.59], [97.0, 98.64], [104.0, 112.02], [113.0, 115.99], [117.0, 119.45], [123.0, 127.04]], "keep_status": [false, false, false, true, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [57.72, 57.89, 0.0, 48.91, 0.0, 42.17, 39.09, 0.0, 32.96, 0.0, 0.0, 0.0, 79.76, 0.0, 69.47, 0.0, 81.17, 58.81, 70.72, 67.25], "audiomae_on_audioset": [null, null, null, [["music", 32.16], ["speech", 12.31], ["fly, housefly", 11.53]], null, [["speech", 30.92], ["music", 25.19], ["insect", 8.66]], [["music", 33.78], ["speech", 25.99], ["theremin", 11.72]], null, [["gunshot, gunfire", 12.5], ["thunk", 10.18], ["music", 8.19]], null, null, null, null, null, null, null, null, null, null, null], "duration": [8.62, 6.04, 0.88, 8.55, 0.37, 9.48, 9.67, 0.85, 9.12, 1.33, 1.82, 1.78, 2.49, 0.99, 4.59, 1.64, 8.02, 2.99, 2.45, 4.04]} \ No newline at end of file diff --git a/annotations_filtered/j0silSyYFPM_filtered.json b/annotations_filtered/j0silSyYFPM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef58175d035a3fcddcfd69368b93c8075a20eb0a --- /dev/null +++ b/annotations_filtered/j0silSyYFPM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.95], [11.0, 13.81], [17.0, 17.44], [22.0, 22.82], [26.0, 28.11], [31.0, 31.16], [34.0, 35.77], [39.0, 42.47], [43.0, 46.48], [50.0, 50.75], [53.0, 54.19], [58.0, 59.64], [63.0, 65.25], [66.0, 66.73], [70.0, 70.46], [74.0, 74.01], [75.0, 76.49], [78.0, 79.15], [82.0, 82.21], [85.0, 86.75], [92.0, 97.88], [99.0, 102.51], [104.0, 104.82], [106.0, 108.41]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [41.93, 39.27, 0.0, 0.0, 42.67, 0.0, 0.0, 44.52, 39.07, 0.0, 0.0, 0.0, 45.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.5, 43.4, 0.0, 36.77], "audiomae_on_audioset": [[["theremin", 39.84], ["music", 25.84], ["hum", 6.3]], [["music", 56.47], ["hum", 7.86], ["mains hum", 6.01]], null, null, [["hum", 14.32], ["music", 10.87], ["throbbing", 8.56]], null, null, [["music", 33.73], ["hum", 16.43], ["mains hum", 6.03]], [["hum", 44.41], ["mains hum", 28.82], ["whale vocalization", 4.04]], null, null, null, [["music", 40.12], ["hum", 10.22], ["didgeridoo", 9.89]], null, null, null, null, null, null, null, [["music", 38.09], ["singing bowl", 12.06], ["speech", 8.22]], [["theremin", 41.14], ["music", 21.26], ["hum", 7.34]], null, [["speech", 45.79], ["didgeridoo", 24.99], ["music", 8.53]]], "duration": [2.95, 2.81, 0.44, 0.82, 2.11, 0.16, 1.77, 3.47, 3.48, 0.75, 1.19, 1.64, 2.25, 0.73, 0.46, 0.01, 1.49, 1.15, 0.21, 1.75, 5.88, 3.51, 0.82, 2.41]} \ No newline at end of file diff --git a/annotations_filtered/j0z0V2JJ5II_filtered.json b/annotations_filtered/j0z0V2JJ5II_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2292ed294fb524e35f407c67c0d2c41f6f01047 --- /dev/null +++ b/annotations_filtered/j0z0V2JJ5II_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.32], [1.0, 1.36], [1.0, 1.39], [1.0, 1.43], [2.0, 1.53], [3.0, 13.76], [17.0, 18.12], [21.0, 21.32], [26.0, 44.07], [46.0, 54.48], [56.0, 70.04], [71.0, 73.8], [76.0, 79.56], [80.0, 94.05], [95.0, 101.24], [108.0, 110.78], [113.0, 121.59]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 33.76, 0.0, 0.0, 38.6, 31.11, 35.96, 40.9, 63.1, 38.49, 33.13, 30.14, 30.44], "audiomae_on_audioset": [null, null, null, null, null, [["music", 24.18], ["sidetone", 22.43], ["throbbing", 14.22]], null, null, [["hum", 27.49], ["throbbing", 16.24], ["mains hum", 11.34]], [["music", 49.98], ["noise", 20.77], ["grunt", 6.91]], [["grunt", 49.69], ["noise", 19.04], ["groan", 16.39]], [["sidetone", 49.17], ["speech", 26.68], ["radio", 6.35]], null, [["insect", 40.06], ["fly, housefly", 28.57], ["music", 9.94]], [["music", 49.71], ["theremin", 6.06], ["musical instrument", 4.44]], [["cattle, bovinae", 38.42], ["moo", 31.73], ["speech", 9.58]], [["speech", 46.58], ["electric shaver, electric razor", 10.67], ["hum", 10.19]]], "duration": [0.32, 0.36, 0.39, 0.43, -0.47, 10.76, 1.12, 0.32, 18.07, 8.48, 14.04, 2.8, 3.56, 14.05, 6.24, 2.78, 8.59]} \ No newline at end of file diff --git a/annotations_filtered/j19-hpjJ4ok_filtered.json b/annotations_filtered/j19-hpjJ4ok_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cc1567df4d9e31c30e015a12761bbaefe1586f5 --- /dev/null +++ b/annotations_filtered/j19-hpjJ4ok_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.94], [14.0, 14.77], [16.0, 17.44], [18.0, 18.3], [20.0, 20.51], [21.0, 21.81], [26.0, 27.99], [33.0, 33.18], [36.0, 36.31], [37.0, 37.72], [39.0, 40.36], [41.0, 46.63], [48.0, 50.14], [60.0, 61.75], [62.0, 63.9], [71.0, 72.13], [74.0, 77.52], [81.0, 81.23], [82.0, 82.7], [86.0, 86.49], [89.0, 89.43], [90.0, 90.8], [94.0, 95.42], [97.0, 97.77], [98.0, 99.08], [126.0, 128.22], [132.0, 132.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.99, 84.25, 0.0, 0.0, 0.0, 98.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.75, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 65.88], ["fly, housefly", 4.66], ["insect", 4.28]], null], "duration": [0.94, 0.77, 1.44, 0.3, 0.51, 0.81, 1.99, 0.18, 0.31, 0.72, 1.36, 5.63, 2.14, 1.75, 1.9, 1.13, 3.52, 0.23, 0.7, 0.49, 0.43, 0.8, 1.42, 0.77, 1.08, 2.22, 0.41]} \ No newline at end of file diff --git a/annotations_filtered/j1C0Tw80Fgk_filtered.json b/annotations_filtered/j1C0Tw80Fgk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc6cf1cf3b127c601a5ffb1d9712c247e9b800e5 --- /dev/null +++ b/annotations_filtered/j1C0Tw80Fgk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.76], [8.0, 8.34], [10.0, 10.86], [12.0, 13.39], [24.0, 25.27], [26.0, 29.61], [37.0, 39.28], [40.0, 41.96], [44.0, 44.66], [45.0, 46.35], [50.0, 50.43], [53.0, 55.73], [57.0, 58.36], [68.0, 74.83], [75.0, 75.86], [77.0, 77.89], [78.0, 83.03], [88.0, 87.98], [93.0, 92.64], [94.0, 98.49], [103.0, 104.53], [111.0, 111.4], [120.0, 120.78], [133.0, 134.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 85.9, 99.44, 0.0, 0.0, 0.0, 0.0, 42.96, 0.0, 61.67, 0.0, 0.0, 43.35, 0.0, 0.0, 64.75, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["chirp tone", 28.93], ["dial tone", 26.59], ["sine wave", 9.95]], null, null, null, null, [["speech", 83.12], ["telephone", 2.36], ["inside, small room", 2.01]], null, null, null, null, null, null, null], "duration": [-0.24, 0.34, 0.86, 1.39, 1.27, 3.61, 2.28, 1.96, 0.66, 1.35, 0.43, 2.73, 1.36, 6.83, 0.86, 0.89, 5.03, -0.02, -0.36, 4.49, 1.53, 0.4, 0.78, 1.87]} \ No newline at end of file diff --git a/annotations_filtered/j1VL-y9JHuI_filtered.json b/annotations_filtered/j1VL-y9JHuI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff0b38c126ef21260fd9754e530006ab067ee0bf --- /dev/null +++ b/annotations_filtered/j1VL-y9JHuI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.43], [23.0, 29.08], [35.0, 37.56], [43.0, 46.47], [47.0, 48.2], [57.0, 56.79], [58.0, 58.48], [64.0, 63.91], [65.0, 70.09], [74.0, 74.49], [76.0, 79.79], [84.0, 96.11], [99.0, 99.77], [105.0, 105.73], [107.0, 109.59], [110.0, 110.84], [116.0, 116.13], [117.0, 121.1], [125.0, 138.23]], "keep_status": [false, true, false, false, false, false, false, false, true, false, true, true, false, false, true, false, false, true, false], "silence_prob": [0.0, 30.96, 30.46, 30.49, 0.0, 0.0, 0.0, 0.0, 31.88, 0.0, 30.36, 29.44, 0.0, 0.0, 30.4, 0.0, 0.0, 31.08, 32.92], "audiomae_on_audioset": [null, [["music", 60.55], ["musical instrument", 4.89], ["fireworks", 3.62]], [["music", 50.83], ["musical instrument", 21.31], ["drum", 9.16]], [["music", 70.29], ["musical instrument", 2.17], ["mains hum", 1.91]], null, null, null, null, [["music", 19.08], ["fly, housefly", 17.55], ["insect", 10.62]], null, [["music", 42.99], ["synthetic singing", 4.08], ["speech", 3.75]], [["explosion", 24.34], ["burst, pop", 19.28], ["speech", 16.65]], null, null, [["music", 34.11], ["mains hum", 11.84], ["hum", 9.15]], null, null, [["music", 57.71], ["didgeridoo", 5.42], ["musical instrument", 4.01]], [["music", 70.23], ["vocal music", 5.36], ["singing", 3.98]]], "duration": [0.43, 6.08, 2.56, 3.47, 1.2, -0.21, 0.48, -0.09, 5.09, 0.49, 3.79, 12.11, 0.77, 0.73, 2.59, 0.84, 0.13, 4.1, 13.23]} \ No newline at end of file diff --git a/annotations_filtered/j1q-QWHUU0g_filtered.json b/annotations_filtered/j1q-QWHUU0g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b962ebfb4c543cda5eb8b65ed249f470acc38581 --- /dev/null +++ b/annotations_filtered/j1q-QWHUU0g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.67], [12.0, 26.25], [29.0, 33.81], [36.0, 37.39], [41.0, 44.09], [45.0, 46.13], [53.0, 52.74], [56.0, 56.59], [58.0, 58.99], [61.0, 62.72], [64.0, 64.47], [64.0, 64.57], [65.0, 64.61], [69.0, 69.6], [74.0, 74.55], [76.0, 77.57], [81.0, 80.96], [81.0, 81.75], [88.0, 88.84], [91.0, 92.58], [94.0, 95.77], [96.0, 97.26], [107.0, 107.86], [110.0, 111.15], [117.0, 118.99], [131.0, 133.05], [141.0, 141.02], [142.0, 143.33], [144.0, 146.53]], "keep_status": [false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.11, 32.04, 0.0, 32.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.41, 0.0, 0.0, 35.69], "audiomae_on_audioset": [null, [["whale vocalization", 22.81], ["music", 14.93], ["theremin", 9.51]], [["music", 43.4], ["speech", 13.54], ["crowd", 3.96]], null, [["music", 12.62], ["boat, water vehicle", 10.73], ["foghorn", 7.34]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 60.68], ["music", 22.9], ["musical instrument", 2.42]], null, null, [["music", 51.15], ["theremin", 30.79], ["musical instrument", 4.88]]], "duration": [0.67, 14.25, 4.81, 1.39, 3.09, 1.13, -0.26, 0.59, 0.99, 1.72, 0.47, 0.57, -0.39, 0.6, 0.55, 1.57, -0.04, 0.75, 0.84, 1.58, 1.77, 1.26, 0.86, 1.15, 1.99, 2.05, 0.02, 1.33, 2.53]} \ No newline at end of file diff --git a/annotations_filtered/j1tXIl0snEk_filtered.json b/annotations_filtered/j1tXIl0snEk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2c4473114cdb61fd52a020d255226838828477b --- /dev/null +++ b/annotations_filtered/j1tXIl0snEk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 25.95], [27.0, 28.29], [30.0, 30.65], [33.0, 34.35], [36.0, 36.75], [39.0, 45.69], [47.0, 48.17], [56.0, 57.4], [73.0, 77.48], [83.0, 83.83], [100.0, 101.58], [105.0, 116.6], [118.0, 121.09]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, true, true], "silence_prob": [29.46, 0.0, 0.0, 0.0, 0.0, 29.41, 0.0, 0.0, 28.69, 0.0, 0.0, 30.37, 30.08], "audiomae_on_audioset": [[["hum", 55.57], ["throbbing", 19.32], ["mains hum", 13.19]], null, null, null, null, [["hum", 28.02], ["music", 20.58], ["throbbing", 17.62]], null, null, [["hum", 35.29], ["mains hum", 22.22], ["music", 9.84]], null, null, [["music", 34.68], ["electronic music", 8.95], ["speech", 6.93]], [["hum", 36.85], ["ambient music", 17.32], ["music", 12.99]]], "duration": [5.95, 1.29, 0.65, 1.35, 0.75, 6.69, 1.17, 1.4, 4.48, 0.83, 1.58, 11.6, 3.09]} \ No newline at end of file diff --git a/annotations_filtered/j1tkwdfz7n4_filtered.json b/annotations_filtered/j1tkwdfz7n4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c499c90a3dfd300105fb7aa5a18cb043fc021965 --- /dev/null +++ b/annotations_filtered/j1tkwdfz7n4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.72], [19.0, 20.7], [25.0, 26.96], [28.0, 27.95], [29.0, 30.23], [33.0, 33.34], [34.0, 35.29], [43.0, 43.92], [44.0, 57.05], [88.0, 92.28], [95.0, 94.74], [101.0, 103.25], [114.0, 116.55], [117.0, 120.78], [121.0, 128.75]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [32.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.25, 33.58, 0.0, 38.86, 34.68, 33.83, 35.33], "audiomae_on_audioset": [[["music", 33.44], ["thunk", 16.36], ["whack, thwack", 11.28]], null, null, null, null, null, null, null, [["music", 79.11], ["speech", 7.67], ["musical instrument", 2.79]], [["music", 61.02], ["musical instrument", 8.02], ["synthesizer", 4.96]], null, [["music", 71.26], ["musical instrument", 7.49], ["didgeridoo", 3.7]], [["music", 50.37], ["didgeridoo", 5.69], ["hum", 3.72]], [["music", 73.65], ["speech", 9.2], ["musical instrument", 2.96]], [["music", 69.34], ["throbbing", 6.25], ["hum", 4.3]]], "duration": [2.72, 1.7, 1.96, -0.05, 1.23, 0.34, 1.29, 0.92, 13.05, 4.28, -0.26, 2.25, 2.55, 3.78, 7.75]} \ No newline at end of file diff --git a/annotations_filtered/j21idqW08wU_filtered.json b/annotations_filtered/j21idqW08wU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50e1c32ea39da6e66b66438c1eb6ecad62d7b2bd --- /dev/null +++ b/annotations_filtered/j21idqW08wU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 33.86], [35.0, 35.4], [40.0, 46.55], [50.0, 50.79], [52.0, 61.74], [64.0, 70.83], [73.0, 86.04], [101.0, 114.15], [115.0, 115.57], [117.0, 122.72], [128.0, 128.39], [129.0, 130.15], [134.0, 135.38], [136.0, 137.0], [141.0, 141.02], [142.0, 146.31], [152.0, 156.84], [161.0, 161.97], [167.0, 172.66], [173.0, 174.9]], "keep_status": [false, false, true, false, false, true, false, true, false, true, false, false, false, false, false, true, false, false, true, false], "silence_prob": [32.22, 0.0, 32.6, 0.0, 34.22, 33.96, 34.56, 33.99, 0.0, 34.91, 0.0, 0.0, 0.0, 0.0, 0.0, 36.75, 63.64, 0.0, 35.58, 0.0], "audiomae_on_audioset": [[["music", 44.84], ["speech", 19.84], ["throbbing", 10.25]], null, [["music", 37.8], ["speech", 26.58], ["hum", 4.77]], null, [["music", 51.83], ["speech", 21.56], ["hum", 5.21]], [["music", 37.02], ["hum", 18.68], ["mains hum", 12.15]], [["hum", 38.0], ["throbbing", 18.42], ["music", 18.25]], [["speech", 32.13], ["buzz", 25.72], ["vehicle", 9.6]], null, [["hum", 22.53], ["music", 22.48], ["mains hum", 21.9]], null, null, null, null, null, [["speech", 40.96], ["music", 17.52], ["hum", 6.61]], null, null, [["speech", 57.15], ["music", 7.3], ["rumble", 3.78]], null], "duration": [19.86, 0.4, 6.55, 0.79, 9.74, 6.83, 13.04, 13.15, 0.57, 5.72, 0.39, 1.15, 1.38, 1.0, 0.02, 4.31, 4.84, 0.97, 5.66, 1.9]} \ No newline at end of file diff --git a/annotations_filtered/j2JFTz9KQhk_filtered.json b/annotations_filtered/j2JFTz9KQhk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d64d5ff58e67ee36dff1cbc5f5dc33cacf1ad403 --- /dev/null +++ b/annotations_filtered/j2JFTz9KQhk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.85], [14.0, 32.04], [37.0, 38.26], [40.0, 47.98], [50.0, 51.44], [53.0, 63.09], [63.0, 72.32], [73.0, 73.28], [74.0, 74.26], [77.0, 83.13], [84.0, 85.21], [86.0, 88.89], [90.0, 93.21], [94.0, 94.24], [96.0, 98.51], [99.0, 99.13], [101.0, 101.21], [103.0, 102.76], [109.0, 109.29], [123.0, 124.5], [129.0, 130.23], [133.0, 132.68], [137.0, 137.13], [138.0, 139.68]], "keep_status": [false, true, false, true, false, true, true, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.72, 0.0, 34.88, 0.0, 32.09, 30.54, 0.0, 0.0, 32.85, 0.0, 30.19, 31.94, 0.0, 81.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 55.43], ["throbbing", 8.11], ["hum", 5.67]], null, [["music", 23.4], ["throbbing", 15.32], ["hum", 5.86]], null, [["fly, housefly", 29.84], ["insect", 18.46], ["mosquito", 17.36]], [["hum", 23.12], ["speech", 20.18], ["music", 19.81]], null, null, [["hum", 49.85], ["music", 19.37], ["throbbing", 17.11]], null, [["hum", 27.64], ["music", 15.93], ["throbbing", 15.17]], [["vehicle", 17.77], ["music", 16.51], ["hum", 10.52]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.85, 18.04, 1.26, 7.98, 1.44, 10.09, 9.32, 0.28, 0.26, 6.13, 1.21, 2.89, 3.21, 0.24, 2.51, 0.13, 0.21, -0.24, 0.29, 1.5, 1.23, -0.32, 0.13, 1.68]} \ No newline at end of file diff --git a/annotations_filtered/j2MbvFYy_8Y_filtered.json b/annotations_filtered/j2MbvFYy_8Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4723294235a641e7c067252076d81aa7efbe2d5 --- /dev/null +++ b/annotations_filtered/j2MbvFYy_8Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.86], [11.0, 11.23], [13.0, 13.32], [15.0, 14.91], [19.0, 22.06], [26.0, 26.81], [29.0, 29.73], [31.0, 48.03], [48.0, 48.44], [50.0, 49.92], [54.0, 58.48], [64.0, 65.43], [67.0, 67.42], [69.0, 69.74], [73.0, 75.02], [76.0, 76.79], [77.0, 78.19], [81.0, 82.22], [83.0, 83.86], [86.0, 91.67], [94.0, 98.02], [99.0, 99.57], [101.0, 101.43], [102.0, 102.41], [104.0, 105.19], [119.0, 119.31], [120.0, 121.04], [122.0, 123.08], [125.0, 141.0], [144.0, 155.76]], "keep_status": [false, false, false, false, true, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.71, 0.0, 0.0, 30.07, 0.0, 0.0, 41.62, 0.0, 0.0, 0.0, 47.12, 0.0, 0.0, 0.0, 0.0, 73.06, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.68, 32.52], "audiomae_on_audioset": [null, null, null, null, [["music", 51.0], ["musical instrument", 7.89], ["percussion", 4.2]], null, null, [["music", 27.78], ["noise", 15.02], ["mains hum", 9.2]], null, null, [["breaking", 22.9], ["crushing", 14.49], ["thunk", 12.59]], null, null, null, [["sidetone", 46.67], ["speech", 41.12], ["echo", 1.99]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 67.85], ["musical instrument", 6.8], ["effects unit", 2.0]], [["music", 62.93], ["speech", 11.34], ["guitar", 3.87]]], "duration": [0.86, 0.23, 0.32, -0.09, 3.06, 0.81, 0.73, 17.03, 0.44, -0.08, 4.48, 1.43, 0.42, 0.74, 2.02, 0.79, 1.19, 1.22, 0.86, 5.67, 4.02, 0.57, 0.43, 0.41, 1.19, 0.31, 1.04, 1.08, 16.0, 11.76]} \ No newline at end of file diff --git a/annotations_filtered/j2SPawJewxA_filtered.json b/annotations_filtered/j2SPawJewxA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcc259c278064704c00d55637518f2fc148caa14 --- /dev/null +++ b/annotations_filtered/j2SPawJewxA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[53.0, 74.93], [76.0, 115.6], [117.0, 119.15], [121.0, 120.83]], "keep_status": [false, false, true, false], "silence_prob": [38.45, 0.0, 35.93, 0.0], "audiomae_on_audioset": [[["music", 52.92], ["speech", 13.5], ["fart", 11.26]], null, [["speech", 14.62], ["music", 11.49], ["crowd", 8.18]], null], "duration": [21.93, 39.6, 2.15, -0.17]} \ No newline at end of file diff --git a/annotations_filtered/j2ZsEQ4Fr4c_filtered.json b/annotations_filtered/j2ZsEQ4Fr4c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c49880a9fad71d77fc1a6f5cd1717e22e5d7be4 --- /dev/null +++ b/annotations_filtered/j2ZsEQ4Fr4c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 8.19], [41.0, 40.78], [73.0, 73.43], [77.0, 78.02], [79.0, 80.74], [82.0, 83.66], [87.0, 87.07], [88.0, 89.29], [90.0, 92.2], [93.0, 93.02], [94.0, 95.57], [96.0, 98.54], [99.0, 100.67]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.23, 0.0, 0.0, 77.36, 0.0], "audiomae_on_audioset": [[["speech", 22.34], ["music", 17.83], ["mosquito", 11.07]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.19, -0.22, 0.43, 1.02, 1.74, 1.66, 0.07, 1.29, 2.2, 0.02, 1.57, 2.54, 1.67]} \ No newline at end of file diff --git a/annotations_filtered/j2aGGNQW_7M_filtered.json b/annotations_filtered/j2aGGNQW_7M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..408622515e7421a5aea58622e3f7bedd53983f4a --- /dev/null +++ b/annotations_filtered/j2aGGNQW_7M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.72], [9.0, 10.23], [11.0, 11.13], [12.0, 13.76], [15.0, 19.01], [23.0, 24.7], [26.0, 36.66], [37.0, 38.21], [39.0, 59.1], [59.0, 62.23], [63.0, 82.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 97.33, 0.0, 97.64, 0.0, 92.8, 99.73, 94.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.72, 1.23, 0.13, 1.76, 4.01, 1.7, 10.66, 1.21, 20.1, 3.23, 19.9]} \ No newline at end of file diff --git a/annotations_filtered/j2e41FeccuA_filtered.json b/annotations_filtered/j2e41FeccuA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b8a33c33df87c78ac6f81c06b5ad70805ef1346 --- /dev/null +++ b/annotations_filtered/j2e41FeccuA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.11], [15.0, 15.58], [17.0, 17.81], [18.0, 25.27], [26.0, 26.94], [33.0, 35.48], [40.0, 45.3], [46.0, 52.41], [53.0, 54.16], [55.0, 56.57], [64.0, 65.25], [67.0, 67.86], [68.0, 69.47], [72.0, 77.06], [78.0, 79.37], [82.0, 82.56], [84.0, 85.41], [89.0, 90.66], [92.0, 93.23], [94.0, 95.27], [97.0, 97.17], [99.0, 101.8], [103.0, 106.73], [109.0, 109.7], [111.0, 114.42], [115.0, 116.53], [120.0, 127.5]], "keep_status": [false, false, false, true, false, true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.83, 0.0, 34.62, 31.17, 29.72, 0.0, 0.0, 0.0, 0.0, 0.0, 45.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.78, 38.82, 0.0, 37.89, 0.0, 33.55], "audiomae_on_audioset": [null, null, null, [["music", 32.12], ["speech", 24.97], ["theremin", 5.18]], null, [["music", 25.81], ["noise", 9.46], ["fart", 4.69]], [["music", 27.64], ["throbbing", 22.04], ["hum", 19.6]], [["speech", 38.79], ["music", 26.93], ["fart", 9.93]], null, null, null, null, null, [["music", 54.18], ["synthesizer", 5.8], ["musical instrument", 4.04]], null, null, null, null, null, null, null, [["music", 61.7], ["musical instrument", 4.71], ["guitar", 3.5]], [["music", 66.9], ["ambient music", 6.15], ["electronic music", 5.04]], null, [["music", 44.39], ["hum", 12.9], ["speech", 6.54]], null, [["theremin", 43.09], ["music", 36.81], ["synthesizer", 6.0]]], "duration": [1.11, 0.58, 0.81, 7.27, 0.94, 2.48, 5.3, 6.41, 1.16, 1.57, 1.25, 0.86, 1.47, 5.06, 1.37, 0.56, 1.41, 1.66, 1.23, 1.27, 0.17, 2.8, 3.73, 0.7, 3.42, 1.53, 7.5]} \ No newline at end of file diff --git a/annotations_filtered/j32LbrHGak0_filtered.json b/annotations_filtered/j32LbrHGak0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..814f8e6d0f2b830b072543cb6750a0ee0be200b2 --- /dev/null +++ b/annotations_filtered/j32LbrHGak0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.53], [22.0, 26.94], [28.0, 28.11]], "keep_status": [false, false, false], "silence_prob": [0.0, 32.39, 0.0], "audiomae_on_audioset": [null, [["music", 38.57], ["hum", 17.1], ["throbbing", 16.0]], null], "duration": [1.53, 4.94, 0.11]} \ No newline at end of file diff --git a/annotations_filtered/j38t2lDi4GU_filtered.json b/annotations_filtered/j38t2lDi4GU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2dc08b43fa1228eda2fe1afe1667983b06a91533 --- /dev/null +++ b/annotations_filtered/j38t2lDi4GU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 30.01], [31.0, 32.44], [37.0, 47.31], [48.0, 47.76], [48.0, 47.8], [49.0, 53.37], [60.0, 59.76], [67.0, 69.11], [70.0, 70.95], [73.0, 78.07], [78.0, 78.12], [79.0, 82.92], [87.0, 102.24], [103.0, 136.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.18, 0.0, 0.0, 31.57, 0.0, 35.9, 0.0, 33.86, 0.0, 34.48, 33.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 61.62], ["theremin", 16.34], ["musical instrument", 4.35]], null, null, [["music", 70.21], ["theremin", 13.05], ["musical instrument", 2.06]], null, [["music", 46.78], ["theremin", 14.38], ["didgeridoo", 13.67]], null, [["music", 63.28], ["ambient music", 8.94], ["synthesizer", 3.88]], null, [["music", 69.04], ["ambient music", 4.92], ["synthesizer", 3.93]], [["music", 77.75], ["ambient music", 6.04], ["electronic music", 2.7]], null], "duration": [0.01, 1.44, 10.31, -0.24, -0.2, 4.37, -0.24, 2.11, 0.95, 5.07, 0.12, 3.92, 15.24, 33.61]} \ No newline at end of file diff --git a/annotations_filtered/j3MZdcbv-ew_filtered.json b/annotations_filtered/j3MZdcbv-ew_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45a20131fecdaeafa8cc819aa1d8481584d5cd18 --- /dev/null +++ b/annotations_filtered/j3MZdcbv-ew_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.74], [42.0, 42.69], [44.0, 44.49], [49.0, 48.93], [52.0, 52.25], [76.0, 76.92], [85.0, 85.09], [88.0, 89.04], [95.0, 95.74], [98.0, 98.54], [101.0, 101.92], [118.0, 117.98], [118.0, 118.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.74, 0.69, 0.49, -0.07, 0.25, 0.92, 0.09, 1.04, 0.74, 0.54, 0.92, -0.02, 0.1]} \ No newline at end of file diff --git a/annotations_filtered/j3d3mrWBTpM_filtered.json b/annotations_filtered/j3d3mrWBTpM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f25a08b20140f3b46b24e220dffa0ebcb8d58643 --- /dev/null +++ b/annotations_filtered/j3d3mrWBTpM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.45], [6.0, 7.05], [8.0, 8.78], [11.0, 11.43], [12.0, 13.66], [14.0, 16.12], [18.0, 19.33], [21.0, 21.95], [23.0, 24.6], [25.0, 27.73], [32.0, 33.69], [34.0, 35.51], [40.0, 40.24], [42.0, 42.72], [45.0, 46.57], [49.0, 50.89], [54.0, 54.65], [60.0, 60.32], [62.0, 61.87], [62.0, 61.97], [62.0, 62.02], [62.0, 62.09], [62.0, 62.18], [63.0, 75.24], [76.0, 77.9], [79.0, 80.13], [82.0, 82.8], [88.0, 88.8], [89.0, 90.9], [93.0, 93.46], [96.0, 98.24], [101.0, 101.36], [103.0, 103.23], [105.0, 106.69], [109.0, 110.25], [111.0, 113.64], [118.0, 118.5], [120.0, 121.68], [126.0, 125.69], [128.0, 129.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.8, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 1.05, 0.78, 0.43, 1.66, 2.12, 1.33, 0.95, 1.6, 2.73, 1.69, 1.51, 0.24, 0.72, 1.57, 1.89, 0.65, 0.32, -0.13, -0.03, 0.02, 0.09, 0.18, 12.24, 1.9, 1.13, 0.8, 0.8, 1.9, 0.46, 2.24, 0.36, 0.23, 1.69, 1.25, 2.64, 0.5, 1.68, -0.31, 1.46]} \ No newline at end of file diff --git a/annotations_filtered/j40IcG_BZuc_filtered.json b/annotations_filtered/j40IcG_BZuc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff3fdc93bbaf16123e01a8526fb2672d03a2d4b1 --- /dev/null +++ b/annotations_filtered/j40IcG_BZuc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.17], [8.0, 9.46], [15.0, 29.34], [30.0, 41.96], [45.0, 45.59], [46.0, 46.33], [47.0, 50.41], [54.0, 56.07], [56.0, 56.81], [57.0, 69.62], [81.0, 90.19], [91.0, 91.32], [94.0, 100.58], [108.0, 118.3], [119.0, 124.78], [125.0, 125.81], [127.0, 127.52], [129.0, 137.19], [137.0, 138.0], [139.0, 141.05], [142.0, 142.06], [147.0, 148.31], [149.0, 149.84], [150.0, 151.53], [152.0, 153.06], [154.0, 155.19], [156.0, 164.64]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 40.82, 47.5, 0.0, 0.0, 36.12, 64.52, 0.0, 40.88, 48.56, 0.0, 29.67, 30.03, 31.82, 0.0, 0.0, 37.24, 0.0, 46.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.67], "audiomae_on_audioset": [null, null, [["hum", 50.78], ["throbbing", 16.57], ["mains hum", 12.27]], [["hum", 30.44], ["speech", 17.26], ["mains hum", 14.99]], null, null, [["mains hum", 31.04], ["hum", 16.8], ["music", 14.31]], null, null, [["music", 55.17], ["speech", 11.98], ["theremin", 9.81]], [["mains hum", 62.29], ["hum", 23.57], ["music", 3.57]], null, [["music", 46.67], ["brass instrument", 18.33], ["musical instrument", 9.87]], [["didgeridoo", 37.11], ["music", 32.96], ["theremin", 11.93]], [["music", 61.67], ["musical instrument", 7.05], ["didgeridoo", 6.5]], null, null, [["music", 34.49], ["theremin", 33.11], ["musical instrument", 6.17]], null, [["music", 23.71], ["civil defense siren", 14.64], ["theremin", 11.9]], null, null, null, null, null, null, [["music", 56.46], ["theremin", 15.24], ["musical instrument", 3.57]]], "duration": [1.17, 1.46, 14.34, 11.96, 0.59, 0.33, 3.41, 2.07, 0.81, 12.62, 9.19, 0.32, 6.58, 10.3, 5.78, 0.81, 0.52, 8.19, 1.0, 2.05, 0.06, 1.31, 0.84, 1.53, 1.06, 1.19, 8.64]} \ No newline at end of file diff --git a/annotations_filtered/j42TrAVceCI_filtered.json b/annotations_filtered/j42TrAVceCI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/j42TrAVceCI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/j477dAxaeck_filtered.json b/annotations_filtered/j477dAxaeck_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40382801975a8716347ef09f5ae04b001e96e8d8 --- /dev/null +++ b/annotations_filtered/j477dAxaeck_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 26.05], [28.0, 30.89], [32.0, 32.85], [35.0, 35.95], [38.0, 39.01], [42.0, 41.84], [44.0, 46.89], [48.0, 48.47], [49.0, 49.06], [53.0, 54.67], [60.0, 61.2], [62.0, 62.24], [70.0, 69.94], [71.0, 72.94], [74.0, 98.59], [99.0, 102.3], [106.0, 106.35], [107.0, 107.11], [119.0, 119.3], [122.0, 122.17], [124.0, 125.85], [129.0, 130.79], [132.0, 132.53], [136.0, 137.32], [143.0, 144.81], [145.0, 145.91], [150.0, 151.04], [151.0, 152.83], [166.0, 166.55], [167.0, 168.34], [169.0, 171.54], [174.0, 177.08], [177.0, 178.34], [179.0, 179.24], [180.0, 179.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [87.19, 94.66, 0.0, 0.0, 0.0, 0.0, 95.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.43, 99.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.04, 99.84, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["thunk", 23.73], ["whack, thwack", 20.65], ["music", 8.51]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.05, 2.89, 0.85, 0.95, 1.01, -0.16, 2.89, 0.47, 0.06, 1.67, 1.2, 0.24, -0.06, 1.94, 24.59, 3.3, 0.35, 0.11, 0.3, 0.17, 1.85, 1.79, 0.53, 1.32, 1.81, 0.91, 1.04, 1.83, 0.55, 1.34, 2.54, 3.08, 1.34, 0.24, -0.02]} \ No newline at end of file diff --git a/annotations_filtered/j4onAJ-3FAM_filtered.json b/annotations_filtered/j4onAJ-3FAM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89184e3c218aaee5a07f776bcf927dd61f172acd --- /dev/null +++ b/annotations_filtered/j4onAJ-3FAM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.44], [5.0, 4.94], [5.0, 7.65], [8.0, 7.86], [8.0, 8.01], [9.0, 8.56], [10.0, 9.63], [11.0, 24.88], [28.0, 36.85], [43.0, 52.2], [52.0, 54.19], [55.0, 60.15], [61.0, 77.97], [79.0, 83.86]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, true, true], "silence_prob": [0.0, 0.0, 32.68, 0.0, 0.0, 0.0, 0.0, 31.84, 32.89, 33.3, 40.38, 30.89, 29.1, 29.22], "audiomae_on_audioset": [null, null, [["music", 59.93], ["speech", 10.05], ["electronic music", 6.49]], null, null, null, null, [["throbbing", 33.85], ["hum", 27.74], ["music", 25.22]], [["music", 39.41], ["throbbing", 18.43], ["fart", 5.85]], [["music", 46.49], ["throbbing", 23.09], ["hum", 15.45]], [["music", 74.41], ["throbbing", 11.33], ["hum", 2.95]], [["music", 49.95], ["speech", 7.65], ["electronic music", 4.5]], [["music", 44.19], ["throbbing", 13.42], ["buzz", 10.64]], [["explosion", 30.12], ["whack, thwack", 10.38], ["music", 5.6]]], "duration": [0.44, -0.06, 2.65, -0.14, 0.01, -0.44, -0.37, 13.88, 8.85, 9.2, 2.19, 5.15, 16.97, 4.86]} \ No newline at end of file diff --git a/annotations_filtered/j4ujHOSbQB0_filtered.json b/annotations_filtered/j4ujHOSbQB0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8909d335492b15b01229c3e0f9049b8a7fddcd2f --- /dev/null +++ b/annotations_filtered/j4ujHOSbQB0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.65], [43.0, 43.29], [46.0, 45.89], [47.0, 47.29], [49.0, 49.32], [54.0, 54.24], [56.0, 56.49], [58.0, 60.42], [61.0, 63.36], [71.0, 70.75], [78.0, 83.22], [84.0, 85.72], [87.0, 87.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.21, 50.61, 0.0, 72.46, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.65, 0.29, -0.11, 0.29, 0.32, 0.24, 0.49, 2.42, 2.36, -0.25, 5.22, 1.72, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/j4yXEmQRq34_filtered.json b/annotations_filtered/j4yXEmQRq34_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bad4278f20da5c89ef6c72286866e921415f1420 --- /dev/null +++ b/annotations_filtered/j4yXEmQRq34_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.49], [3.0, 3.37], [7.0, 7.59], [9.0, 9.76], [10.0, 11.69], [15.0, 16.29], [23.0, 23.25], [26.0, 26.42], [27.0, 28.27], [29.0, 29.32], [30.0, 31.33], [39.0, 39.87], [43.0, 48.76], [51.0, 52.34], [53.0, 56.3], [61.0, 61.67], [66.0, 67.22], [68.0, 69.28], [71.0, 71.07], [71.0, 73.7], [75.0, 89.45], [92.0, 94.34], [97.0, 103.81], [105.0, 107.05], [112.0, 146.65], [147.0, 147.88], [150.0, 150.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.51, 0.0, 43.38, 0.0, 0.0, 0.0, 0.0, 52.05, 43.15, 34.83, 78.38, 90.95, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 51.06], ["hum", 34.65], ["speech", 4.96]], null, null, null, null, null, [["speech", 42.36], ["animal", 28.15], ["stomach rumble", 7.58]], [["music", 25.38], ["effects unit", 19.25], ["noise", 11.07]], null, null, null, null, null], "duration": [0.49, 0.37, 0.59, 0.76, 1.69, 1.29, 0.25, 0.42, 1.27, 0.32, 1.33, 0.87, 5.76, 1.34, 3.3, 0.67, 1.22, 1.28, 0.07, 2.7, 14.45, 2.34, 6.81, 2.05, 34.65, 0.88, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/j5B70NEq_fY_filtered.json b/annotations_filtered/j5B70NEq_fY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4dfebad2b915a287a0a8f19ecb9e5efffedb240 --- /dev/null +++ b/annotations_filtered/j5B70NEq_fY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.94], [13.0, 13.0], [13.0, 14.03], [18.0, 19.94], [22.0, 22.49], [26.0, 26.28], [30.0, 31.26], [33.0, 34.72], [37.0, 38.21], [46.0, 51.24], [55.0, 56.83], [59.0, 62.56], [63.0, 64.86], [66.0, 69.28], [70.0, 71.04], [72.0, 72.84], [85.0, 89.97], [91.0, 96.25]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.1, 0.0, 30.67, 0.0, 31.79, 0.0, 0.0, 91.64, 31.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 17.69], ["hum", 12.59], ["music", 7.05]], null, [["speech", 28.15], ["crowd", 14.51], ["cheering", 13.03]], null, [["music", 57.36], ["crackle", 3.23], ["applause", 2.92]], null, null, null, [["music", 63.04], ["musical instrument", 4.46], ["echo", 2.07]]], "duration": [-0.06, 0.0, 1.03, 1.94, 0.49, 0.28, 1.26, 1.72, 1.21, 5.24, 1.83, 3.56, 1.86, 3.28, 1.04, 0.84, 4.97, 5.25]} \ No newline at end of file diff --git a/annotations_filtered/j5Fd6TqePnk_filtered.json b/annotations_filtered/j5Fd6TqePnk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..640037b731f0b383d5dffc7a5547bf677efe2bf9 --- /dev/null +++ b/annotations_filtered/j5Fd6TqePnk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.81], [4.0, 5.09], [7.0, 8.73], [10.0, 12.88], [14.0, 14.34], [15.0, 19.18], [19.0, 22.11], [23.0, 31.65], [33.0, 34.3], [36.0, 40.41], [42.0, 43.44], [45.0, 45.0], [45.0, 48.32], [49.0, 51.97], [53.0, 56.96], [58.0, 62.4], [63.0, 63.49], [65.0, 65.43], [67.0, 69.28], [72.0, 75.61], [80.0, 81.87], [84.0, 86.61], [88.0, 93.56], [95.0, 97.75], [99.0, 101.93], [106.0, 108.73], [110.0, 114.0], [117.0, 120.58], [125.0, 128.26], [130.0, 132.88], [134.0, 135.48], [137.0, 137.89], [139.0, 142.8], [144.0, 145.29], [147.0, 148.56], [149.0, 156.68], [157.0, 156.95]], "keep_status": [false, false, false, true, false, true, true, true, false, false, false, false, true, false, true, true, false, false, false, false, false, false, false, false, true, true, true, true, true, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 39.64, 0.0, 40.62, 35.05, 35.59, 0.0, 88.1, 0.0, 0.0, 30.89, 56.93, 44.96, 47.2, 0.0, 0.0, 71.29, 72.75, 0.0, 53.59, 68.02, 53.65, 42.81, 37.63, 48.14, 41.89, 41.44, 73.82, 0.0, 0.0, 44.93, 0.0, 0.0, 34.83, 0.0], "audiomae_on_audioset": [null, null, null, [["throbbing", 19.27], ["hum", 15.55], ["heart sounds, heartbeat", 9.61]], null, [["speech", 33.49], ["sidetone", 10.89], ["radio", 9.15]], [["fart", 26.61], ["music", 22.76], ["effects unit", 6.35]], [["speech", 23.5], ["noise", 21.12], ["radio", 16.37]], null, null, null, null, [["speech", 29.75], ["radio", 21.07], ["music", 9.38]], null, [["radio", 20.97], ["speech", 18.87], ["noise", 3.78]], [["hum", 36.02], ["mains hum", 11.44], ["burping, eructation", 9.43]], null, null, null, null, null, null, null, null, [["fly, housefly", 13.73], ["hum", 12.61], ["whale vocalization", 11.54]], [["burping, eructation", 8.53], ["hum", 6.87], ["growling", 6.83]], [["dog", 18.44], ["bow-wow", 15.65], ["animal", 14.61]], [["hum", 40.22], ["inside, small room", 7.39], ["mains hum", 7.02]], [["dog", 35.09], ["domestic animals, pets", 15.36], ["animal", 10.45]], null, null, null, [["creak", 17.58], ["hum", 9.14], ["mains hum", 5.81]], null, null, [["theremin", 20.2], ["whale vocalization", 18.58], ["hum", 13.89]], null], "duration": [0.81, 1.09, 1.73, 2.88, 0.34, 4.18, 3.11, 8.65, 1.3, 4.41, 1.44, 0.0, 3.32, 2.97, 3.96, 4.4, 0.49, 0.43, 2.28, 3.61, 1.87, 2.61, 5.56, 2.75, 2.93, 2.73, 4.0, 3.58, 3.26, 2.88, 1.48, 0.89, 3.8, 1.29, 1.56, 7.68, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/j638xTM36I8_filtered.json b/annotations_filtered/j638xTM36I8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fda554209bec9cab0aa6f29cc18fcd4fa2ea1247 --- /dev/null +++ b/annotations_filtered/j638xTM36I8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 30.5], [31.0, 88.25], [90.0, 91.79], [94.0, 95.22], [97.0, 98.96], [100.0, 101.73], [103.0, 103.25], [106.0, 105.83], [106.0, 107.64], [108.0, 108.95], [110.0, 110.49], [111.0, 111.86], [112.0, 113.43], [114.0, 114.44], [115.0, 115.84], [116.0, 117.51]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 47.44], ["speech", 15.07], ["horse", 5.92]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [29.5, 57.25, 1.79, 1.22, 1.96, 1.73, 0.25, -0.17, 1.64, 0.95, 0.49, 0.86, 1.43, 0.44, 0.84, 1.51]} \ No newline at end of file diff --git a/annotations_filtered/j66Fsl_q5Ig_filtered.json b/annotations_filtered/j66Fsl_q5Ig_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d803ebec844b67b00447dc13a0639572b69c517 --- /dev/null +++ b/annotations_filtered/j66Fsl_q5Ig_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 16.04], [19.0, 21.76], [23.0, 23.36], [25.0, 25.95], [28.0, 29.08], [32.0, 34.87], [38.0, 38.04], [39.0, 53.35], [59.0, 59.98], [63.0, 74.9], [76.0, 90.21], [92.0, 94.04], [99.0, 99.98], [102.0, 105.02], [106.0, 107.05], [111.0, 112.13], [113.0, 113.7], [115.0, 115.48], [119.0, 142.5], [146.0, 151.43], [154.0, 166.62], [168.0, 198.41]], "keep_status": [false, false, false, false, false, true, false, true, false, true, false, true, false, true, false, false, false, false, false, true, false, false], "silence_prob": [31.03, 43.58, 0.0, 0.0, 0.0, 31.17, 0.0, 31.2, 0.0, 30.56, 30.17, 32.12, 0.0, 31.42, 0.0, 0.0, 0.0, 0.0, 30.91, 31.26, 30.95, 0.0], "audiomae_on_audioset": [[["music", 41.92], ["throbbing", 19.18], ["hum", 9.42]], [["music", 68.98], ["synthesizer", 3.41], ["musical instrument", 2.98]], null, null, null, [["speech", 22.66], ["music", 21.91], ["eruption", 3.77]], null, [["music", 56.6], ["electronic music", 6.76], ["cacophony", 4.1]], null, [["music", 38.69], ["speech", 25.57], ["hum", 4.62]], [["mains hum", 34.69], ["music", 24.04], ["hum", 16.33]], [["music", 33.04], ["hum", 8.99], ["throbbing", 8.05]], null, [["music", 52.22], ["hum", 6.57], ["cacophony", 5.99]], null, null, null, null, [["music", 55.75], ["throbbing", 14.39], ["hum", 10.11]], [["music", 36.34], ["throbbing", 20.42], ["hum", 12.54]], [["music", 46.95], ["speech", 26.96], ["electric shaver, electric razor", 2.43]], null], "duration": [5.04, 2.76, 0.36, 0.95, 1.08, 2.87, 0.04, 14.35, 0.98, 11.9, 14.21, 2.04, 0.98, 3.02, 1.05, 1.13, 0.7, 0.48, 23.5, 5.43, 12.62, 30.41]} \ No newline at end of file diff --git a/annotations_filtered/j6_umKYN_JU_filtered.json b/annotations_filtered/j6_umKYN_JU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abf603ce2f8dd6a3b0d334b1766a42419be793d0 --- /dev/null +++ b/annotations_filtered/j6_umKYN_JU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.36], [50.0, 49.87], [50.0, 50.8], [106.0, 114.94], [119.0, 122.99], [126.0, 130.33]], "keep_status": [false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 33.2, 28.87, 29.21], "audiomae_on_audioset": [null, null, null, [["music", 37.73], ["speech", 30.94], ["livestock, farm animals, working animals", 5.76]], [["music", 22.72], ["boom", 16.14], ["smash, crash", 7.83]], [["music", 21.45], ["explosion", 18.67], ["fart", 7.73]]], "duration": [0.36, -0.13, 0.8, 8.94, 3.99, 4.33]} \ No newline at end of file diff --git a/annotations_filtered/j6gLJ4_sfG8_filtered.json b/annotations_filtered/j6gLJ4_sfG8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67de6ba6c219ef124fe09bd9132d0042ac5eabb6 --- /dev/null +++ b/annotations_filtered/j6gLJ4_sfG8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 35.7], [37.0, 61.03], [63.0, 65.33], [67.0, 69.43], [72.0, 75.17], [78.0, 78.9], [80.0, 82.7], [84.0, 90.78], [92.0, 93.53], [95.0, 95.4], [97.0, 98.27], [100.0, 101.38], [102.0, 103.67], [105.0, 107.87], [111.0, 126.33]], "keep_status": [true, true, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [41.76, 48.56, 47.98, 53.53, 71.43, 0.0, 82.61, 62.17, 0.0, 0.0, 0.0, 0.0, 0.0, 70.58, 69.2], "audiomae_on_audioset": [[["mains hum", 25.83], ["hum", 25.76], ["music", 12.91]], [["music", 25.96], ["fly, housefly", 13.68], ["bee, wasp, etc.", 8.28]], [["speech", 29.94], ["music", 15.06], ["throbbing", 5.91]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.7, 24.03, 2.33, 2.43, 3.17, 0.9, 2.7, 6.78, 1.53, 0.4, 1.27, 1.38, 1.67, 2.87, 15.33]} \ No newline at end of file diff --git a/annotations_filtered/j6oBbBfhgYE_filtered.json b/annotations_filtered/j6oBbBfhgYE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e4724cff17fc534050e7f94fcb53ea8ccfb233d --- /dev/null +++ b/annotations_filtered/j6oBbBfhgYE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.12], [4.0, 3.89], [5.0, 7.64], [18.0, 18.39], [19.0, 21.34], [23.0, 27.38], [30.0, 30.79], [34.0, 42.79], [43.0, 44.64]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 59.86, 0.0, 89.19, 61.18, 0.0, 36.38, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 89.83], ["meow", 1.43], ["speech synthesizer", 1.42]], null], "duration": [1.12, -0.11, 2.64, 0.39, 2.34, 4.38, 0.79, 8.79, 1.64]} \ No newline at end of file diff --git a/annotations_filtered/j6oHprwdTeA_filtered.json b/annotations_filtered/j6oHprwdTeA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..efa558c2dd105177de9513ee3800f363ae63b167 --- /dev/null +++ b/annotations_filtered/j6oHprwdTeA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.58], [16.0, 16.9], [17.0, 19.03], [21.0, 21.57], [31.0, 32.21], [38.0, 37.81], [38.0, 39.11], [41.0, 40.69], [44.0, 44.52], [49.0, 48.81], [49.0, 50.01], [53.0, 54.68], [56.0, 56.24], [57.0, 57.13], [65.0, 65.96], [77.0, 80.74], [82.0, 83.54], [89.0, 89.41], [96.0, 99.81], [103.0, 103.11]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 44.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.54, 0.0, 0.0, 41.03, 0.0], "audiomae_on_audioset": [null, null, [["speech", 47.85], ["sidetone", 10.12], ["radio", 4.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 24.52], ["throbbing", 17.09], ["synthesizer", 8.84]], null], "duration": [1.58, 0.9, 2.03, 0.57, 1.21, -0.19, 1.11, -0.31, 0.52, -0.19, 1.01, 1.68, 0.24, 0.13, 0.96, 3.74, 1.54, 0.41, 3.81, 0.11]} \ No newline at end of file diff --git a/annotations_filtered/j6qjibwpEzM_filtered.json b/annotations_filtered/j6qjibwpEzM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b7c8f384d2681a5064a0b8e7b146ef2227d08f8 --- /dev/null +++ b/annotations_filtered/j6qjibwpEzM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.79], [5.0, 5.76], [7.0, 7.37], [13.0, 13.22], [23.0, 22.86], [31.0, 31.11], [32.0, 32.51], [34.0, 34.03], [37.0, 37.44], [38.0, 38.87], [43.0, 43.55], [51.0, 54.7], [88.0, 89.34], [119.0, 119.26], [124.0, 128.09], [130.0, 130.32], [139.0, 139.28], [176.0, 176.49], [177.0, 177.35], [192.0, 193.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.99, 0.0, 0.0, 33.99, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["clang", 25.92], ["speech", 19.74], ["firecracker", 10.41]], null, null, [["music", 79.67], ["boing", 10.04], ["marimba, xylophone", 2.18]], null, null, null, null, null], "duration": [0.79, 0.76, 0.37, 0.22, -0.14, 0.11, 0.51, 0.03, 0.44, 0.87, 0.55, 3.7, 1.34, 0.26, 4.09, 0.32, 0.28, 0.49, 0.35, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/j71oHN1i2pU_filtered.json b/annotations_filtered/j71oHN1i2pU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85e96644f3fecfb6ef412ddd8ab38d16e595f6ea --- /dev/null +++ b/annotations_filtered/j71oHN1i2pU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 18.98], [29.0, 29.34], [30.0, 30.45], [31.0, 31.48], [32.0, 35.43], [38.0, 38.5], [55.0, 66.9], [67.0, 68.82], [70.0, 82.27], [86.0, 85.95], [89.0, 108.94]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.08, 0.0, 28.95, 0.0, 31.53, 0.0, 29.8], "audiomae_on_audioset": [null, null, null, null, [["music", 14.46], ["grunt", 14.01], ["groan", 13.98]], null, [["music", 65.78], ["speech", 4.59], ["hum", 4.4]], null, [["music", 48.5], ["speech", 19.42], ["foghorn", 4.17]], null, [["livestock, farm animals, working animals", 41.39], ["cattle, bovinae", 12.81], ["moo", 8.54]]], "duration": [-0.02, 0.34, 0.45, 0.48, 3.43, 0.5, 11.9, 1.82, 12.27, -0.05, 19.94]} \ No newline at end of file diff --git a/annotations_filtered/j7O-SUEh-54_filtered.json b/annotations_filtered/j7O-SUEh-54_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9285cd0ec7be0081fc91d8235697d1d3f776f2a2 --- /dev/null +++ b/annotations_filtered/j7O-SUEh-54_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.74], [8.0, 8.92], [10.0, 10.56], [11.0, 11.58], [13.0, 13.71], [15.0, 15.97], [17.0, 17.64], [19.0, 23.7], [25.0, 25.52], [26.0, 27.77], [28.0, 29.02], [30.0, 30.67], [31.0, 32.22], [33.0, 35.13], [36.0, 36.14], [40.0, 40.19], [41.0, 41.52], [42.0, 48.49], [49.0, 50.13], [51.0, 52.1], [54.0, 55.95], [62.0, 68.64], [70.0, 70.68], [74.0, 75.95], [79.0, 80.59], [83.0, 83.39], [85.0, 84.96], [86.0, 86.36], [96.0, 96.43], [97.0, 98.1], [101.0, 102.32], [105.0, 105.8], [109.0, 109.44], [112.0, 112.56], [122.0, 126.76], [127.0, 127.53], [132.0, 132.92], [134.0, 135.03], [137.0, 140.78], [145.0, 150.03], [154.0, 154.57], [158.0, 158.72], [166.0, 166.48], [166.0, 168.66], [170.0, 173.5], [179.0, 179.76], [180.0, 181.8], [183.0, 184.05], [185.0, 185.18], [188.0, 188.06], [192.0, 193.41], [195.0, 195.44], [198.0, 203.81], [205.0, 209.9], [221.0, 220.67], [221.0, 222.52], [224.0, 225.39], [229.0, 236.55], [237.0, 239.09], [240.0, 241.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.48, 0.0, 0.0, 0.0, 0.0, 0.0, 67.13, 0.0, 0.0, 0.0, 36.13, 0.0, 0.0, 0.0, 67.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.42, 0.0, 0.0, 0.0, 42.55, 39.93, 0.0, 0.0, 0.0, 35.77, 41.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.02, 31.97, 0.0, 0.0, 0.0, 36.61, 36.24, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 57.93], ["groan", 2.59], ["quack", 2.36]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 23.09], ["whale vocalization", 11.94], ["whack, thwack", 11.7]], null, null, null, [["fly, housefly", 47.17], ["insect", 13.97], ["speech", 10.92]], [["speech", 20.14], ["radio", 17.62], ["music", 12.36]], null, null, null, [["speech", 81.45], ["radio", 2.69], ["gunshot, gunfire", 0.9]], [["speech", 63.63], ["music", 4.12], ["hum", 2.92]], null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 24.73], ["fly, housefly", 11.84], ["moo", 10.3]], [["whale vocalization", 24.28], ["livestock, farm animals, working animals", 19.1], ["cattle, bovinae", 17.72]], null, null, null, [["hum", 34.78], ["mains hum", 19.88], ["throbbing", 8.19]], [["music", 30.24], ["whale vocalization", 12.02], ["speech", 4.57]], null], "duration": [0.74, 0.92, 0.56, 0.58, 0.71, 0.97, 0.64, 4.7, 0.52, 1.77, 1.02, 0.67, 1.22, 2.13, 0.14, 0.19, 0.52, 6.49, 1.13, 1.1, 1.95, 6.64, 0.68, 1.95, 1.59, 0.39, -0.04, 0.36, 0.43, 1.1, 1.32, 0.8, 0.44, 0.56, 4.76, 0.53, 0.92, 1.03, 3.78, 5.03, 0.57, 0.72, 0.48, 2.66, 3.5, 0.76, 1.8, 1.05, 0.18, 0.06, 1.41, 0.44, 5.81, 4.9, -0.33, 1.52, 1.39, 7.55, 2.09, 1.51]} \ No newline at end of file diff --git a/annotations_filtered/j7PgnjEiMcA_filtered.json b/annotations_filtered/j7PgnjEiMcA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3022dee8d69e42a9f84068d5aa7008d43456ad0 --- /dev/null +++ b/annotations_filtered/j7PgnjEiMcA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.08], [7.0, 7.15], [10.0, 19.72], [25.0, 28.36], [33.0, 39.04], [42.0, 45.99], [47.0, 47.83], [53.0, 53.55], [60.0, 60.47], [65.0, 65.15], [68.0, 68.52], [70.0, 79.12], [79.0, 96.65], [98.0, 103.22], [105.0, 105.36], [106.0, 116.7], [123.0, 123.23], [132.0, 134.79], [135.0, 136.7], [140.0, 146.21], [150.0, 150.63]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [33.45, 0.0, 36.65, 37.52, 36.06, 37.99, 0.0, 0.0, 0.0, 0.0, 0.0, 35.51, 35.53, 35.65, 0.0, 31.34, 0.0, 38.46, 0.0, 33.94, 0.0], "audiomae_on_audioset": [[["music", 36.3], ["theremin", 11.42], ["musical instrument", 11.24]], null, [["music", 70.44], ["musical instrument", 5.88], ["keyboard (musical)", 2.0]], [["music", 34.98], ["didgeridoo", 11.97], ["musical instrument", 7.56]], [["music", 69.36], ["musical instrument", 6.01], ["percussion", 1.76]], [["music", 75.28], ["musical instrument", 4.33], ["theremin", 3.57]], null, null, null, null, null, [["music", 74.18], ["musical instrument", 4.34], ["theremin", 3.3]], [["music", 60.71], ["musical instrument", 7.24], ["double bass", 4.86]], [["music", 55.22], ["didgeridoo", 7.45], ["musical instrument", 5.03]], null, [["music", 69.13], ["music of latin america", 3.49], ["musical instrument", 3.41]], null, [["music", 51.95], ["didgeridoo", 17.17], ["guitar", 6.3]], null, [["music", 48.43], ["musical instrument", 5.83], ["flamenco", 5.23]], null], "duration": [2.08, 0.15, 9.72, 3.36, 6.04, 3.99, 0.83, 0.55, 0.47, 0.15, 0.52, 9.12, 17.65, 5.22, 0.36, 10.7, 0.23, 2.79, 1.7, 6.21, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/j7m47I9BuuY_filtered.json b/annotations_filtered/j7m47I9BuuY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3300fae37101dd5d7c47a91e925ae7c9a8980f60 --- /dev/null +++ b/annotations_filtered/j7m47I9BuuY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[209.0, 214.22]], "keep_status": [false], "silence_prob": [60.89], "audiomae_on_audioset": [null], "duration": [5.22]} \ No newline at end of file diff --git a/annotations_filtered/j84y65YfUS4_filtered.json b/annotations_filtered/j84y65YfUS4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..151b5b9744cb95278e82e93c41ce1346fc5a64c6 --- /dev/null +++ b/annotations_filtered/j84y65YfUS4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.6], [12.0, 13.09], [15.0, 15.89], [17.0, 28.48], [29.0, 36.58], [38.0, 39.18], [43.0, 44.04], [45.0, 47.39], [49.0, 49.32], [52.0, 52.27], [53.0, 56.4], [58.0, 58.14], [62.0, 65.16], [66.0, 67.07], [72.0, 72.69], [73.0, 78.9], [82.0, 85.83], [87.0, 86.98], [88.0, 88.6], [92.0, 91.84], [94.0, 113.58], [115.0, 131.92]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.01, 33.53, 0.0, 0.0, 40.77, 0.0, 0.0, 65.79, 0.0, 73.67, 0.0, 0.0, 33.2, 41.52, 0.0, 0.0, 0.0, 84.8, 53.53], "audiomae_on_audioset": [null, null, null, [["music", 44.48], ["speech", 25.97], ["musical instrument", 3.33]], [["music", 44.01], ["speech", 24.82], ["thunk", 14.49]], null, null, [["speech", 27.09], ["sidetone", 24.32], ["inside, small room", 11.13]], null, null, null, null, null, null, null, [["speech", 55.69], ["hum", 8.26], ["mains hum", 5.65]], [["speech", 15.52], ["noise", 14.05], ["theremin", 10.08]], null, null, null, null, null], "duration": [1.6, 1.09, 0.89, 11.48, 7.58, 1.18, 1.04, 2.39, 0.32, 0.27, 3.4, 0.14, 3.16, 1.07, 0.69, 5.9, 3.83, -0.02, 0.6, -0.16, 19.58, 16.92]} \ No newline at end of file diff --git a/annotations_filtered/j8Sb4-hMhCg_filtered.json b/annotations_filtered/j8Sb4-hMhCg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d69ce382a1823368c724bd7c5794fc5b43e404f8 --- /dev/null +++ b/annotations_filtered/j8Sb4-hMhCg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 27.06], [33.0, 33.42], [33.0, 49.49], [52.0, 52.71], [53.0, 59.49], [62.0, 92.16], [95.0, 103.99], [106.0, 116.23], [120.0, 123.09]], "keep_status": [true, false, true, false, true, false, true, true, true], "silence_prob": [28.61, 0.0, 28.87, 0.0, 30.64, 0.0, 28.5, 29.48, 32.21], "audiomae_on_audioset": [[["music", 29.6], ["whack, thwack", 16.79], ["musical instrument", 4.74]], null, [["music", 39.77], ["whack, thwack", 14.32], ["sound effect", 8.26]], null, [["hum", 27.44], ["speech", 17.26], ["music", 9.52]], null, [["grunt", 19.16], ["sound effect", 16.96], ["music", 12.66]], [["whack, thwack", 34.89], ["sound effect", 11.96], ["breaking", 9.65]], [["music", 41.85], ["breaking", 13.44], ["hum", 5.23]]], "duration": [16.06, 0.42, 16.49, 0.71, 6.49, 30.16, 8.99, 10.23, 3.09]} \ No newline at end of file diff --git a/annotations_filtered/j8cGENcePl0_filtered.json b/annotations_filtered/j8cGENcePl0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..547838df3d080f02fef44f39d34097d09e949e86 --- /dev/null +++ b/annotations_filtered/j8cGENcePl0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.88], [12.0, 16.31], [19.0, 29.2], [35.0, 41.03], [45.0, 45.94], [47.0, 56.94], [58.0, 63.95], [66.0, 68.22], [69.0, 95.52], [97.0, 104.3], [105.0, 122.62], [124.0, 124.09]], "keep_status": [false, false, false, false, false, false, false, true, false, true, true, false], "silence_prob": [0.0, 39.35, 37.88, 36.86, 0.0, 34.37, 32.47, 33.1, 32.05, 34.01, 32.45, 0.0], "audiomae_on_audioset": [null, [["music", 60.89], ["musical instrument", 6.27], ["guitar", 3.35]], [["boing", 39.0], ["music", 17.9], ["fly, housefly", 17.11]], [["music", 74.93], ["speech", 10.38], ["boing", 3.53]], null, [["music", 56.58], ["speech", 17.04], ["throbbing", 2.8]], [["music", 63.24], ["boing", 6.66], ["electronic music", 4.09]], [["sidetone", 44.04], ["music", 14.19], ["moo", 4.78]], [["music", 50.53], ["speech", 15.63], ["boing", 5.15]], [["music", 47.04], ["boing", 8.9], ["throbbing", 3.24]], [["livestock, farm animals, working animals", 44.18], ["cattle, bovinae", 13.58], ["moo", 11.36]], null], "duration": [0.88, 4.31, 10.2, 6.03, 0.94, 9.94, 5.95, 2.22, 26.52, 7.3, 17.62, 0.09]} \ No newline at end of file diff --git a/annotations_filtered/j8nLPMys3b8_filtered.json b/annotations_filtered/j8nLPMys3b8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86a92ca104f8112798a9b823e57865c065717794 --- /dev/null +++ b/annotations_filtered/j8nLPMys3b8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 44.07], [48.0, 80.43], [81.0, 106.91], [109.0, 122.57], [125.0, 137.19], [139.0, 139.06], [141.0, 142.48], [145.0, 184.2]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 37.55, 41.26, 31.33, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 56.01], ["breaking", 20.63], ["glass", 3.69]], [["music", 80.66], ["theremin", 6.27], ["scary music", 2.77]], [["music", 40.54], ["hum", 20.14], ["mains hum", 10.92]], null, null, null], "duration": [38.07, 32.43, 25.91, 13.57, 12.19, 0.06, 1.48, 39.2]} \ No newline at end of file diff --git a/annotations_filtered/j8nZBlPfR7Y_filtered.json b/annotations_filtered/j8nZBlPfR7Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef090cb9822a4acf9d4cb00c54a3e100ddcae2f4 --- /dev/null +++ b/annotations_filtered/j8nZBlPfR7Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.54], [11.0, 11.53], [15.0, 22.5], [24.0, 24.51], [26.0, 26.18], [27.0, 27.7], [28.0, 31.6], [33.0, 34.23], [38.0, 39.01], [40.0, 40.68], [49.0, 50.62], [54.0, 56.42], [58.0, 58.5], [59.0, 59.91], [61.0, 61.91]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.59, 0.0, 0.0, 0.0, 32.91, 0.0, 0.0, 0.0, 0.0, 59.33, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["throbbing", 30.21], ["hum", 13.06], ["whack, thwack", 9.39]], null, null, null, null, null, null, null, null], "duration": [0.54, 0.53, 7.5, 0.51, 0.18, 0.7, 3.6, 1.23, 1.01, 0.68, 1.62, 2.42, 0.5, 0.91, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/j8yAjWvAqyM_filtered.json b/annotations_filtered/j8yAjWvAqyM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee9ad9f26a83f286f32175c74532e7ffaeb9179e --- /dev/null +++ b/annotations_filtered/j8yAjWvAqyM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.37], [4.0, 3.99], [13.0, 17.81], [27.0, 29.17], [29.0, 29.86], [32.0, 34.97]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 38.28, 38.87, 0.0, 68.28], "audiomae_on_audioset": [null, null, [["music", 60.09], ["musical instrument", 7.96], ["speech", 3.6]], [["music", 48.15], ["carnatic music", 23.47], ["musical instrument", 5.19]], null, null], "duration": [0.37, -0.01, 4.81, 2.17, 0.86, 2.97]} \ No newline at end of file diff --git a/annotations_filtered/j91DsC7XvdQ_filtered.json b/annotations_filtered/j91DsC7XvdQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ec259c22639abf743320045544ad52a769eba50 --- /dev/null +++ b/annotations_filtered/j91DsC7XvdQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 23.36], [25.0, 28.09], [30.0, 31.77], [33.0, 37.34], [39.0, 43.11]], "keep_status": [false, false, false, false, false], "silence_prob": [98.73, 96.04, 0.0, 94.81, 99.36], "audiomae_on_audioset": [null, null, null, null, null], "duration": [2.36, 3.09, 1.77, 4.34, 4.11]} \ No newline at end of file diff --git a/annotations_filtered/j91qPMHaqbg_filtered.json b/annotations_filtered/j91qPMHaqbg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ad105e4a68637f05e2e8c17901885efd5f2393b --- /dev/null +++ b/annotations_filtered/j91qPMHaqbg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.92], [1.0, 2.84], [6.0, 7.94], [15.0, 15.99], [17.0, 20.51], [22.0, 22.45], [23.0, 24.09], [28.0, 32.44], [33.0, 35.24], [40.0, 42.96], [56.0, 58.48], [60.0, 60.76], [61.0, 61.5], [72.0, 72.35], [83.0, 85.43], [87.0, 89.02], [91.0, 92.62], [95.0, 97.68], [100.0, 104.58], [105.0, 108.53], [110.0, 110.69], [114.0, 115.11], [129.0, 133.42], [135.0, 140.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 93.6, 0.0, 0.0, 56.4, 40.41, 54.83, 59.07, 0.0, 0.0, 0.0, 51.44, 98.8, 0.0, 100.0, 44.93, 38.72, 0.0, 0.0, 97.0, 77.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 71.96], ["sidetone", 8.41], ["noise", 2.6]], null, null, null, null, null, null, null, null, null, [["speech", 94.31], ["music", 0.83], ["inside, small room", 0.76]], [["speech", 35.54], ["music", 29.46], ["inside, small room", 5.11]], null, null, null, null], "duration": [-0.08, 1.84, 1.94, 0.99, 3.51, 0.45, 1.09, 4.44, 2.24, 2.96, 2.48, 0.76, 0.5, 0.35, 2.43, 2.02, 1.62, 2.68, 4.58, 3.53, 0.69, 1.11, 4.42, 5.26]} \ No newline at end of file diff --git a/annotations_filtered/j95Tk1SLXOA_filtered.json b/annotations_filtered/j95Tk1SLXOA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa2ddb2a3d82399348cd03b78fa7b18d78f57489 --- /dev/null +++ b/annotations_filtered/j95Tk1SLXOA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.89], [8.0, 11.57], [17.0, 19.11], [20.0, 20.22], [20.0, 20.26], [20.0, 20.29], [20.0, 20.36], [20.0, 22.55], [23.0, 24.26], [38.0, 39.24], [40.0, 45.67], [49.0, 50.4], [51.0, 73.65], [74.0, 75.63], [76.0, 93.88], [95.0, 95.44], [96.0, 102.71], [103.0, 103.42], [103.0, 103.57], [104.0, 103.79], [104.0, 107.72], [109.0, 122.15], [122.0, 125.22], [129.0, 130.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [93.29, 100.0, 98.01, 0.0, 0.0, 0.0, 0.0, 77.36, 0.0, 0.0, 100.0, 0.0, 99.98, 0.0, 96.29, 0.0, 99.87, 0.0, 0.0, 0.0, 99.98, 99.99, 95.91, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.89, 3.57, 2.11, 0.22, 0.26, 0.29, 0.36, 2.55, 1.26, 1.24, 5.67, 1.4, 22.65, 1.63, 17.88, 0.44, 6.71, 0.42, 0.57, -0.21, 3.72, 13.15, 3.22, 1.32]} \ No newline at end of file diff --git a/annotations_filtered/jA-BCSOaa4Q_filtered.json b/annotations_filtered/jA-BCSOaa4Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7874d819d9edd2cb3a83dd26df5c6c944a50f1dc --- /dev/null +++ b/annotations_filtered/jA-BCSOaa4Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 29.73], [49.0, 48.74], [53.0, 53.49], [54.0, 56.05], [62.0, 63.32], [64.0, 65.33], [76.0, 77.21], [81.0, 81.06], [81.0, 83.89], [85.0, 89.75], [90.0, 92.13], [106.0, 106.51], [108.0, 108.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 87.55, 99.97, 97.11, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.27, -0.26, 0.49, 2.05, 1.32, 1.33, 1.21, 0.06, 2.89, 4.75, 2.13, 0.51, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/jA0RnDQiFbQ_filtered.json b/annotations_filtered/jA0RnDQiFbQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78b969523ad865655aa94efca06d85d7fdc4bbd1 --- /dev/null +++ b/annotations_filtered/jA0RnDQiFbQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.79], [9.0, 9.61], [11.0, 11.85], [25.0, 27.19], [29.0, 30.47], [33.0, 33.66], [41.0, 42.25], [44.0, 45.84], [48.0, 49.55], [51.0, 53.2], [56.0, 56.88], [64.0, 64.61], [69.0, 70.01], [76.0, 76.87], [78.0, 77.94], [78.0, 78.0], [78.0, 78.07], [88.0, 88.77], [106.0, 106.64], [115.0, 115.91], [127.0, 126.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 95.23, 0.0, 0.0, 0.0, 0.0, 0.0, 93.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.79, 0.61, 0.85, 2.19, 1.47, 0.66, 1.25, 1.84, 1.55, 2.2, 0.88, 0.61, 1.01, 0.87, -0.06, 0.0, 0.07, 0.77, 0.64, 0.91, -0.01]} \ No newline at end of file diff --git a/annotations_filtered/jA83iWbczFc_filtered.json b/annotations_filtered/jA83iWbczFc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92d08bc1d6f9b507ee200e044cfa43d814a73ca1 --- /dev/null +++ b/annotations_filtered/jA83iWbczFc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 22.3], [23.0, 24.19], [25.0, 26.15], [27.0, 27.8], [29.0, 29.15], [33.0, 34.21], [36.0, 37.18], [37.0, 38.47], [40.0, 41.71], [43.0, 46.67], [48.0, 48.05], [48.0, 48.39], [49.0, 48.93], [49.0, 50.79], [51.0, 52.42], [53.0, 53.47], [56.0, 57.3], [59.0, 59.66], [61.0, 89.01], [92.0, 99.22], [100.0, 100.72], [110.0, 114.08], [116.0, 121.56], [123.0, 130.74], [132.0, 144.91], [146.0, 146.45], [147.0, 148.34], [151.0, 152.42], [153.0, 158.82], [161.0, 161.64], [162.0, 161.69], [162.0, 162.28], [163.0, 165.75], [168.0, 168.45], [170.0, 169.96], [171.0, 171.49]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [34.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.51, 33.47, 0.0, 42.53, 44.26, 29.69, 29.35, 0.0, 0.0, 0.0, 35.77, 0.0, 0.0, 0.0, 31.29, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 27.47], ["siren", 14.91], ["emergency vehicle", 13.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 28.81], ["hum", 27.02], ["music", 23.89]], [["music", 70.99], ["scary music", 6.73], ["ambient music", 4.59]], null, [["music", 57.71], ["hum", 10.23], ["mains hum", 9.1]], [["music", 36.57], ["scary music", 23.98], ["mains hum", 12.85]], [["music", 83.19], ["speech", 2.78], ["burst, pop", 2.42]], [["speech", 24.23], ["music", 15.29], ["throbbing", 12.8]], null, null, null, [["mains hum", 22.07], ["hum", 17.08], ["speech", 6.62]], null, null, null, [["speech", 58.98], ["music", 10.54], ["whack, thwack", 5.24]], null, null, null], "duration": [20.3, 1.19, 1.15, 0.8, 0.15, 1.21, 1.18, 1.47, 1.71, 3.67, 0.05, 0.39, -0.07, 1.79, 1.42, 0.47, 1.3, 0.66, 28.01, 7.22, 0.72, 4.08, 5.56, 7.74, 12.91, 0.45, 1.34, 1.42, 5.82, 0.64, -0.31, 0.28, 2.75, 0.45, -0.04, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/jAZRevRbGME_filtered.json b/annotations_filtered/jAZRevRbGME_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17cf5ccc6150020e54b2de782b03fb6eea8a7ca8 --- /dev/null +++ b/annotations_filtered/jAZRevRbGME_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.68], [6.0, 9.27], [12.0, 17.09], [20.0, 32.31], [37.0, 37.44]], "keep_status": [false, true, false, true, false], "silence_prob": [53.34, 41.68, 55.53, 38.47, 0.0], "audiomae_on_audioset": [null, [["sine wave", 27.34], ["speech", 14.92], ["tuning fork", 9.98]], null, [["music", 52.65], ["synthesizer", 7.0], ["musical instrument", 5.61]], null], "duration": [3.68, 3.27, 5.09, 12.31, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/jAZbK72VLFA_filtered.json b/annotations_filtered/jAZbK72VLFA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f34fab134c6d92987a4bf297fbad828fa11561c1 --- /dev/null +++ b/annotations_filtered/jAZbK72VLFA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.94], [16.0, 30.94], [38.0, 46.58], [47.0, 50.72], [51.0, 54.04], [55.0, 68.74], [69.0, 72.98], [75.0, 88.6], [94.0, 101.36], [104.0, 104.97]], "keep_status": [false, false, false, false, false, false, true, true, false, false], "silence_prob": [47.9, 44.18, 56.55, 60.42, 53.53, 53.91, 44.09, 29.95, 39.93, 0.0], "audiomae_on_audioset": [[["music", 47.37], ["scary music", 18.17], ["hum", 7.09]], [["speech", 26.98], ["music", 25.04], ["throbbing", 20.6]], null, null, null, null, [["music", 37.52], ["didgeridoo", 18.81], ["synthesizer", 6.41]], [["music", 52.22], ["explosion", 6.88], ["fart", 4.89]], [["music", 69.78], ["ambient music", 4.15], ["synthesizer", 3.82]], null], "duration": [4.94, 14.94, 8.58, 3.72, 3.04, 13.74, 3.98, 13.6, 7.36, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/jAwlK8vL8OQ_filtered.json b/annotations_filtered/jAwlK8vL8OQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e80de1381ceb9f95d0a910598c09ade325e2f066 --- /dev/null +++ b/annotations_filtered/jAwlK8vL8OQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.65], [18.0, 19.04], [20.0, 20.71], [22.0, 26.32], [27.0, 31.89], [33.0, 34.62], [36.0, 39.53], [40.0, 41.91], [43.0, 49.57], [50.0, 52.86], [54.0, 55.31], [58.0, 62.21], [65.0, 65.97], [67.0, 68.55], [69.0, 70.85], [75.0, 76.28], [80.0, 89.85], [92.0, 93.01], [97.0, 102.12], [113.0, 118.77], [120.0, 119.85], [120.0, 121.42], [122.0, 122.98], [125.0, 124.95], [128.0, 130.28], [136.0, 137.39], [145.0, 146.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.8, 0.0, 0.0, 95.91, 97.83, 0.0, 99.4, 0.0, 95.23, 97.0, 0.0, 95.09, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 96.89, 90.6, 0.0, 0.0, 0.0, 0.0, 78.38, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.65, 1.04, 0.71, 4.32, 4.89, 1.62, 3.53, 1.91, 6.57, 2.86, 1.31, 4.21, 0.97, 1.55, 1.85, 1.28, 9.85, 1.01, 5.12, 5.77, -0.15, 1.42, 0.98, -0.05, 2.28, 1.39, 1.3]} \ No newline at end of file diff --git a/annotations_filtered/jB9WGpVrYBs_filtered.json b/annotations_filtered/jB9WGpVrYBs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d3b666822a84850a50f1cf644612e25cc98044e --- /dev/null +++ b/annotations_filtered/jB9WGpVrYBs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.19], [8.0, 21.88], [23.0, 23.65], [25.0, 29.15], [29.0, 31.16], [35.0, 38.25], [44.0, 112.45]], "keep_status": [true, false, false, true, true, true, false], "silence_prob": [28.64, 29.06, 0.0, 29.45, 32.41, 29.52, 0.0], "audiomae_on_audioset": [[["music", 52.09], ["speech", 11.2], ["explosion", 3.62]], [["music", 48.57], ["speech", 26.72], ["burst, pop", 2.89]], null, [["speech", 28.26], ["mains hum", 21.67], ["music", 16.06]], [["music", 23.79], ["throbbing", 17.96], ["mains hum", 13.98]], [["speech", 28.73], ["music", 19.31], ["mains hum", 5.78]], null], "duration": [2.19, 13.88, 0.65, 4.15, 2.16, 3.25, 68.45]} \ No newline at end of file diff --git a/annotations_filtered/jBMZnAIY_Ng_filtered.json b/annotations_filtered/jBMZnAIY_Ng_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d0f8c9324f30b3a444a6355694b57c8c6c29a3d --- /dev/null +++ b/annotations_filtered/jBMZnAIY_Ng_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[56.0, 58.41], [62.0, 80.23], [81.0, 111.25]], "keep_status": [true, false, false], "silence_prob": [42.28, 33.66, 0.0], "audiomae_on_audioset": [[["throbbing", 31.67], ["hum", 24.78], ["mains hum", 9.06]], [["music", 58.66], ["throbbing", 9.74], ["didgeridoo", 6.27]], null], "duration": [2.41, 18.23, 30.25]} \ No newline at end of file diff --git a/annotations_filtered/jBajVRGElXY_filtered.json b/annotations_filtered/jBajVRGElXY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50bc6f339dbcc1ce7e66cb598e51891acd06975a --- /dev/null +++ b/annotations_filtered/jBajVRGElXY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.29], [14.0, 15.04], [21.0, 21.34], [23.0, 23.8], [26.0, 25.98], [28.0, 28.34], [36.0, 35.61], [41.0, 42.18], [44.0, 44.34], [54.0, 55.49], [65.0, 66.5], [73.0, 73.04], [80.0, 80.89], [82.0, 83.51], [91.0, 93.11], [94.0, 94.17], [96.0, 96.96], [103.0, 103.62], [109.0, 119.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.32, 0.0, 0.0, 0.0, 84.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 15.99], ["speech", 7.95], ["hum", 7.36]], null, null, null, null], "duration": [0.29, 1.04, 0.34, 0.8, -0.02, 0.34, -0.39, 1.18, 0.34, 1.49, 1.5, 0.04, 0.89, 1.51, 2.11, 0.17, 0.96, 0.62, 10.79]} \ No newline at end of file diff --git a/annotations_filtered/jBotZTDEcP8_filtered.json b/annotations_filtered/jBotZTDEcP8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04a39cc6a3353c234e2c50131833dd5945036d50 --- /dev/null +++ b/annotations_filtered/jBotZTDEcP8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.0], [21.0, 21.25], [22.0, 23.31], [27.0, 26.91], [30.0, 31.19], [32.0, 32.78], [34.0, 33.99], [38.0, 39.16], [40.0, 40.51], [41.0, 41.91], [43.0, 45.22], [52.0, 59.86], [65.0, 65.89], [68.0, 69.13], [71.0, 77.41], [89.0, 88.97], [91.0, 92.94], [95.0, 95.81], [98.0, 98.85], [104.0, 109.56], [111.0, 115.75], [122.0, 122.88], [125.0, 125.91], [145.0, 145.91], [147.0, 148.39], [152.0, 152.0], [158.0, 158.65]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.54, 30.73, 0.0, 0.0, 30.66, 0.0, 0.0, 0.0, 0.0, 46.97, 38.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 33.97], ["croak", 12.46], ["speech", 7.82]], null, null, null, null, null, null, null, null, null, null, [["music", 70.25], ["speech", 10.68], ["thunk", 2.43]], null, null, [["music", 48.66], ["thunk", 29.06], ["whack, thwack", 4.65]], null, null, null, null, [["music", 42.55], ["theremin", 16.25], ["speech", 15.0]], [["livestock, farm animals, working animals", 36.08], ["moo", 32.43], ["cattle, bovinae", 24.06]], null, null, null, null, null, null], "duration": [2.0, 0.25, 1.31, -0.09, 1.19, 0.78, -0.01, 1.16, 0.51, 0.91, 2.22, 7.86, 0.89, 1.13, 6.41, -0.03, 1.94, 0.81, 0.85, 5.56, 4.75, 0.88, 0.91, 0.91, 1.39, 0.0, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/jBxnTnikZEo_filtered.json b/annotations_filtered/jBxnTnikZEo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24623618bb97f25613c2b06217b72e6fe4a9c690 --- /dev/null +++ b/annotations_filtered/jBxnTnikZEo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 17.79], [22.0, 22.17], [24.0, 24.76], [25.0, 25.07], [25.0, 34.57], [36.0, 37.37], [45.0, 106.83], [108.0, 121.44], [125.0, 139.85], [141.0, 141.71]], "keep_status": [false, false, false, false, false, false, false, true, false, false], "silence_prob": [75.39, 0.0, 0.0, 0.0, 34.49, 0.0, 0.0, 31.57, 33.74, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 68.93], ["music", 6.5], ["electric shaver, electric razor", 6.34]], null, null, [["livestock, farm animals, working animals", 16.4], ["cattle, bovinae", 14.02], ["moo", 13.58]], [["hum", 36.56], ["mains hum", 26.57], ["music", 16.78]], null], "duration": [4.79, 0.17, 0.76, 0.07, 9.57, 1.37, 61.83, 13.44, 14.85, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/jCSsP6ooQf8_filtered.json b/annotations_filtered/jCSsP6ooQf8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1c0664fafb0575a5f426ab4f0f5d1f1d82b5c62 --- /dev/null +++ b/annotations_filtered/jCSsP6ooQf8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.65], [4.0, 4.82], [10.0, 11.57], [12.0, 13.53], [14.0, 34.05], [37.0, 42.82], [43.0, 56.39], [59.0, 63.91], [67.0, 72.84], [82.0, 99.86], [100.0, 100.48], [101.0, 103.62], [105.0, 120.02], [121.0, 123.04], [130.0, 139.99], [142.0, 150.96], [152.0, 162.3], [166.0, 173.15], [174.0, 174.72]], "keep_status": [false, false, false, false, true, true, true, true, false, true, false, true, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.93, 30.1, 30.09, 30.32, 30.51, 29.49, 0.0, 29.99, 29.87, 29.62, 29.99, 30.12, 30.08, 29.81, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 24.32], ["hum", 22.91], ["mains hum", 7.44]], [["speech", 39.67], ["music", 18.61], ["mains hum", 6.97]], [["speech", 38.22], ["hum", 10.57], ["music", 9.53]], [["music", 31.25], ["speech", 12.84], ["hum", 10.07]], [["throbbing", 45.17], ["hum", 40.95], ["mains hum", 8.35]], [["speech", 27.76], ["music", 25.37], ["hum", 14.02]], null, [["speech", 39.53], ["eruption", 12.26], ["explosion", 6.64]], [["music", 38.46], ["throbbing", 8.04], ["hum", 5.89]], [["throbbing", 34.64], ["music", 23.51], ["hum", 17.48]], [["speech", 34.19], ["throbbing", 21.87], ["music", 18.23]], [["speech", 42.97], ["music", 27.04], ["throbbing", 7.44]], [["music", 24.36], ["speech", 21.29], ["hum", 21.27]], [["mains hum", 37.32], ["music", 22.1], ["hum", 21.68]], null], "duration": [0.65, 0.82, 1.57, 1.53, 20.05, 5.82, 13.39, 4.91, 5.84, 17.86, 0.48, 2.62, 15.02, 2.04, 9.99, 8.96, 10.3, 7.15, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/jCXcE6DvgLw_filtered.json b/annotations_filtered/jCXcE6DvgLw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33a74c473bfe0716062c52c26fe0d9993cb08cee --- /dev/null +++ b/annotations_filtered/jCXcE6DvgLw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 14.23], [18.0, 36.46], [40.0, 46.72], [48.0, 51.0], [52.0, 53.64], [62.0, 67.9], [70.0, 79.34], [83.0, 83.08], [90.0, 91.74], [100.0, 114.12], [117.0, 120.07], [120.0, 122.77], [125.0, 126.91], [128.0, 128.02], [134.0, 134.69], [136.0, 145.5], [148.0, 156.34], [157.0, 162.95]], "keep_status": [false, true, true, true, false, false, true, false, false, false, true, true, false, false, false, true, false, false], "silence_prob": [45.98, 31.37, 38.25, 40.28, 0.0, 69.47, 37.05, 0.0, 0.0, 33.38, 33.56, 33.93, 0.0, 0.0, 0.0, 30.53, 33.59, 44.99], "audiomae_on_audioset": [[["music", 80.73], ["scary music", 3.16], ["soundtrack music", 2.43]], [["music", 32.42], ["theremin", 10.33], ["animal", 6.98]], [["music", 32.79], ["quack", 13.21], ["speech", 9.55]], [["music", 35.23], ["synthesizer", 9.65], ["speech", 6.37]], null, null, [["speech", 31.99], ["music", 25.2], ["sidetone", 9.35]], null, null, [["speech", 49.23], ["music", 24.5], ["vehicle", 2.01]], [["music", 36.86], ["hum", 12.41], ["mains hum", 10.16]], [["speech", 13.54], ["frog", 8.0], ["livestock, farm animals, working animals", 6.92]], null, null, null, [["speech", 35.78], ["music", 13.37], ["hum", 11.83]], [["music", 45.61], ["theremin", 41.02], ["synthesizer", 3.48]], [["music", 68.43], ["throbbing", 3.2], ["theremin", 2.08]]], "duration": [9.23, 18.46, 6.72, 3.0, 1.64, 5.9, 9.34, 0.08, 1.74, 14.12, 3.07, 2.77, 1.91, 0.02, 0.69, 9.5, 8.34, 5.95]} \ No newline at end of file diff --git a/annotations_filtered/jCatADs_uW8_filtered.json b/annotations_filtered/jCatADs_uW8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4167f8195c6d85b35397a791000d5bb60ff66422 --- /dev/null +++ b/annotations_filtered/jCatADs_uW8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.02], [10.0, 11.6], [15.0, 19.28], [23.0, 28.93], [29.0, 33.99], [35.0, 37.25], [55.0, 58.63], [60.0, 62.61], [67.0, 92.84], [93.0, 94.47]], "keep_status": [false, false, false, false, false, true, false, false, true, false], "silence_prob": [64.86, 0.0, 82.43, 72.75, 79.07, 38.35, 68.67, 71.14, 33.6, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 28.51], ["thunk", 8.74], ["speech", 4.34]], null, null, [["speech", 28.62], ["electric shaver, electric razor", 19.18], ["music", 12.96]], null], "duration": [5.02, 1.6, 4.28, 5.93, 4.99, 2.25, 3.63, 2.61, 25.84, 1.47]} \ No newline at end of file diff --git a/annotations_filtered/jCh_3SFr7M4_filtered.json b/annotations_filtered/jCh_3SFr7M4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00b4ca43185e7f01a4844b2f2563ee77819b6755 --- /dev/null +++ b/annotations_filtered/jCh_3SFr7M4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.96], [14.0, 16.92], [19.0, 25.83], [26.0, 36.05], [38.0, 45.84], [47.0, 50.77], [51.0, 52.1], [54.0, 56.47], [58.0, 63.83], [64.0, 64.22], [65.0, 65.79], [66.0, 77.95], [78.0, 81.72], [85.0, 85.94]], "keep_status": [false, true, true, true, false, true, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 35.04, 41.81, 36.14, 69.88, 34.45, 0.0, 37.18, 38.2, 0.0, 0.0, 37.98, 76.37, 0.0], "audiomae_on_audioset": [null, [["boing", 24.75], ["thunk", 22.18], ["clang", 11.52]], [["speech", 26.6], ["hum", 20.97], ["synthesizer", 11.26]], [["music", 27.49], ["throbbing", 7.61], ["thunk", 5.71]], null, [["speech", 30.08], ["music", 22.15], ["clang", 9.91]], null, [["music", 24.69], ["speech", 10.16], ["synthesizer", 6.47]], [["speech", 48.38], ["music", 6.89], ["ping", 5.59]], null, null, [["speech", 39.05], ["music", 38.2], ["musical instrument", 4.49]], null, null], "duration": [1.96, 2.92, 6.83, 10.05, 7.84, 3.77, 1.1, 2.47, 5.83, 0.22, 0.79, 11.95, 3.72, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/jD4Fh0LsvjM_filtered.json b/annotations_filtered/jD4Fh0LsvjM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed796d78d8d4fb810bd35cb211e57a02d8e8085c --- /dev/null +++ b/annotations_filtered/jD4Fh0LsvjM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.13], [25.0, 25.88], [27.0, 27.5], [34.0, 39.33], [44.0, 47.56], [48.0, 48.2], [49.0, 49.45], [50.0, 50.97], [54.0, 54.53], [57.0, 57.3], [69.0, 69.53], [74.0, 74.06], [75.0, 76.72], [82.0, 86.39], [87.0, 87.71], [89.0, 89.9], [92.0, 92.33], [96.0, 96.62], [100.0, 100.87], [109.0, 117.44], [120.0, 121.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 51.77, 83.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.2, 0.0, 0.0, 0.0, 0.0, 0.0, 36.39, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.93], ["speech", 14.95], ["singing bowl", 4.87]], null], "duration": [1.13, 0.88, 0.5, 5.33, 3.56, 0.2, 0.45, 0.97, 0.53, 0.3, 0.53, 0.06, 1.72, 4.39, 0.71, 0.9, 0.33, 0.62, 0.87, 8.44, 1.46]} \ No newline at end of file diff --git a/annotations_filtered/jDD8IQgUPEU_filtered.json b/annotations_filtered/jDD8IQgUPEU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b032567901b8be5c298c520f60726c73003760b3 --- /dev/null +++ b/annotations_filtered/jDD8IQgUPEU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.81], [7.0, 7.82], [10.0, 11.08], [12.0, 12.48], [14.0, 14.35], [16.0, 17.04], [20.0, 20.49], [25.0, 25.86], [29.0, 29.03], [30.0, 30.62], [51.0, 52.08], [55.0, 56.02], [57.0, 63.19], [65.0, 65.45], [78.0, 78.7], [103.0, 102.71], [106.0, 105.53], [106.0, 106.66], [108.0, 108.99], [110.0, 110.24], [112.0, 113.41], [114.0, 114.67], [128.0, 128.22], [134.0, 135.78], [140.0, 143.11], [146.0, 146.67], [149.0, 149.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 69.64], ["quack", 3.67], ["honk", 2.87]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 0.82, 1.08, 0.48, 0.35, 1.04, 0.49, 0.86, 0.03, 0.62, 1.08, 1.02, 6.19, 0.45, 0.7, -0.29, -0.47, 0.66, 0.99, 0.24, 1.41, 0.67, 0.22, 1.78, 3.11, 0.67, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/jDMfIPRm7jY_filtered.json b/annotations_filtered/jDMfIPRm7jY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a2d30b0c3a7265769625c5dc4cb997bfa22cee5 --- /dev/null +++ b/annotations_filtered/jDMfIPRm7jY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.19], [6.0, 6.15], [8.0, 9.95], [13.0, 24.8], [27.0, 38.82], [41.0, 50.67], [55.0, 61.67], [64.0, 63.95], [65.0, 67.09], [70.0, 70.61], [71.0, 72.18], [74.0, 74.43], [75.0, 76.74], [78.0, 78.65], [80.0, 80.99], [82.0, 83.08], [86.0, 96.67], [97.0, 102.27], [104.0, 106.71], [108.0, 111.2], [112.0, 114.2], [115.0, 119.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.77, 30.31, 30.39, 85.35, 0.0, 98.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 60.05, 97.83, 95.23, 53.72, 98.93], "audiomae_on_audioset": [null, null, null, [["speech", 48.74], ["artillery fire", 15.22], ["explosion", 6.44]], [["livestock, farm animals, working animals", 38.21], ["cattle, bovinae", 25.67], ["breaking", 7.31]], [["livestock, farm animals, working animals", 57.78], ["cattle, bovinae", 24.25], ["moo", 10.52]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.19, 0.15, 1.95, 11.8, 11.82, 9.67, 6.67, -0.05, 2.09, 0.61, 1.18, 0.43, 1.74, 0.65, 0.99, 1.08, 10.67, 5.27, 2.71, 3.2, 2.2, 4.5]} \ No newline at end of file diff --git a/annotations_filtered/jDjZ_Dh6HSM_filtered.json b/annotations_filtered/jDjZ_Dh6HSM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da4f1474dbd7549ea557641ac1387473234b191e --- /dev/null +++ b/annotations_filtered/jDjZ_Dh6HSM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.15], [4.0, 4.08], [7.0, 8.01], [14.0, 16.75], [19.0, 19.43], [21.0, 23.65], [25.0, 25.03], [27.0, 26.89], [28.0, 29.93], [32.0, 31.99], [33.0, 34.82], [42.0, 45.5], [51.0, 52.78], [53.0, 55.27], [57.0, 59.56], [63.0, 63.31], [64.0, 65.16], [67.0, 67.29], [69.0, 70.58], [73.0, 73.92], [76.0, 76.1], [77.0, 77.77], [80.0, 80.69], [83.0, 83.4], [86.0, 87.34], [89.0, 90.0], [91.0, 92.74], [94.0, 95.05], [97.0, 97.19], [98.0, 100.01], [101.0, 101.85], [103.0, 104.7], [107.0, 107.81], [110.0, 110.73], [111.0, 113.24], [116.0, 116.94], [119.0, 120.39], [121.0, 121.78], [123.0, 123.87], [125.0, 125.56], [126.0, 128.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 99.87, 74.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.87, 0.0, 0.0, 0.0, 0.0, 99.68, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.15, 0.08, 1.01, 2.75, 0.43, 2.65, 0.03, -0.11, 1.93, -0.01, 1.82, 3.5, 1.78, 2.27, 2.56, 0.31, 1.16, 0.29, 1.58, 0.92, 0.1, 0.77, 0.69, 0.4, 1.34, 1.0, 1.74, 1.05, 0.19, 2.01, 0.85, 1.7, 0.81, 0.73, 2.24, 0.94, 1.39, 0.78, 0.87, 0.56, 2.97]} \ No newline at end of file diff --git a/annotations_filtered/jDmw_MLAQSU_filtered.json b/annotations_filtered/jDmw_MLAQSU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ee31ccb84aa206a1ce2d141a24ae4c89bf6aea0 --- /dev/null +++ b/annotations_filtered/jDmw_MLAQSU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.87], [12.0, 38.1], [41.0, 41.18], [50.0, 55.68], [57.0, 57.5], [59.0, 69.92], [72.0, 119.11], [120.0, 120.45], [123.0, 126.25]], "keep_status": [false, false, false, true, false, false, false, false, true], "silence_prob": [91.64, 31.88, 0.0, 38.35, 0.0, 34.85, 0.0, 0.0, 47.5], "audiomae_on_audioset": [null, [["music", 71.71], ["speech", 6.63], ["didgeridoo", 5.22]], null, [["livestock, farm animals, working animals", 26.62], ["cattle, bovinae", 15.56], ["cowbell", 12.94]], null, [["speech", 37.33], ["cowbell", 27.98], ["fart", 12.15]], null, null, [["speech", 31.92], ["music", 24.59], ["sidetone", 12.91]]], "duration": [3.87, 26.1, 0.18, 5.68, 0.5, 10.92, 47.11, 0.45, 3.25]} \ No newline at end of file diff --git a/annotations_filtered/jE5w-Jl5BSE_filtered.json b/annotations_filtered/jE5w-Jl5BSE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/jE5w-Jl5BSE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/jEKFfdQEbcg_filtered.json b/annotations_filtered/jEKFfdQEbcg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24808308a122df0233cf76e89dc3adf322ef19cf --- /dev/null +++ b/annotations_filtered/jEKFfdQEbcg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.34], [3.0, 5.17], [7.0, 7.84], [9.0, 8.75], [11.0, 11.57], [13.0, 13.59], [15.0, 17.74], [29.0, 30.45], [35.0, 35.53], [46.0, 47.38], [48.0, 49.2], [50.0, 50.92], [53.0, 53.33], [57.0, 57.54], [62.0, 62.75], [64.0, 64.4], [65.0, 67.51], [70.0, 70.21], [71.0, 71.93], [78.0, 79.37], [80.0, 81.35], [85.0, 88.1], [91.0, 93.28], [95.0, 95.47], [97.0, 97.71], [98.0, 99.2], [102.0, 103.13], [104.0, 104.53], [105.0, 107.16], [111.0, 111.72], [116.0, 117.21], [122.0, 123.16], [123.0, 124.68], [128.0, 130.27], [134.0, 135.46], [144.0, 145.49], [146.0, 146.65], [150.0, 152.63], [154.0, 153.96], [158.0, 158.48], [160.0, 161.67], [162.0, 162.87], [164.0, 164.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 63.64, 0.0, 0.0, 0.0, 0.0, 79.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.38, 0.0, 0.0, 0.0, 0.0, 92.15, 76.2, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.52, 0.0, 0.0, 0.0, 97.92, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.34, 2.17, 0.84, -0.25, 0.57, 0.59, 2.74, 1.45, 0.53, 1.38, 1.2, 0.92, 0.33, 0.54, 0.75, 0.4, 2.51, 0.21, 0.93, 1.37, 1.35, 3.1, 2.28, 0.47, 0.71, 1.2, 1.13, 0.53, 2.16, 0.72, 1.21, 1.16, 1.68, 2.27, 1.46, 1.49, 0.65, 2.63, -0.04, 0.48, 1.67, 0.87, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/jEav9DdL4iI_filtered.json b/annotations_filtered/jEav9DdL4iI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6dc8eb66ae81c7a5f2f7db1a9ab7b8e745127516 --- /dev/null +++ b/annotations_filtered/jEav9DdL4iI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.68], [38.0, 38.06], [44.0, 46.08], [51.0, 51.75], [53.0, 53.03], [54.0, 55.07], [59.0, 59.61], [64.0, 64.83], [68.0, 71.24], [71.0, 71.37], [77.0, 85.21], [104.0, 105.63], [108.0, 108.14], [116.0, 117.22], [117.0, 118.39], [119.0, 124.34], [131.0, 137.78], [138.0, 138.62], [142.0, 149.12]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false], "silence_prob": [34.2, 0.0, 56.25, 0.0, 0.0, 0.0, 0.0, 0.0, 35.25, 0.0, 43.45, 0.0, 0.0, 0.0, 0.0, 49.31, 58.81, 0.0, 47.05], "audiomae_on_audioset": [[["speech", 67.41], ["music", 21.02], ["animal", 1.21]], null, null, null, null, null, null, null, [["music", 17.42], ["livestock, farm animals, working animals", 13.72], ["cattle, bovinae", 12.59]], null, [["hum", 37.0], ["music", 17.55], ["speech", 14.27]], null, null, null, null, [["music", 40.0], ["clip-clop", 5.01], ["horse", 4.18]], null, null, [["music", 67.52], ["speech", 4.87], ["synthesizer", 3.67]]], "duration": [2.68, 0.06, 2.08, 0.75, 0.03, 1.07, 0.61, 0.83, 3.24, 0.37, 8.21, 1.63, 0.14, 1.22, 1.39, 5.34, 6.78, 0.62, 7.12]} \ No newline at end of file diff --git a/annotations_filtered/jEveVtZmPu0_filtered.json b/annotations_filtered/jEveVtZmPu0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce73b5f57c88c8eb1fdf742e76d840e1a9ea29a1 --- /dev/null +++ b/annotations_filtered/jEveVtZmPu0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.75], [7.0, 8.51], [9.0, 10.12], [11.0, 12.72], [13.0, 14.34], [16.0, 25.66], [27.0, 38.82], [39.0, 43.85], [47.0, 65.26], [69.0, 69.48], [73.0, 74.02], [78.0, 78.26], [84.0, 87.44], [89.0, 92.01], [93.0, 96.23], [98.0, 99.2], [101.0, 107.69], [110.0, 114.34], [126.0, 126.69], [129.0, 131.19], [132.0, 133.39], [134.0, 134.5], [135.0, 160.56], [163.0, 165.91], [167.0, 166.94], [168.0, 168.72]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false, true, true, false, false, false, true, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.78, 56.18, 38.51, 32.49, 0.0, 0.0, 0.0, 35.11, 43.38, 61.67, 0.0, 35.71, 35.32, 0.0, 48.65, 0.0, 0.0, 31.32, 31.53, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 49.76], ["livestock, farm animals, working animals", 6.62], ["sheep", 5.03]], null, [["whale vocalization", 88.98], ["music", 1.15], ["animal", 0.91]], [["music", 45.08], ["speech", 11.58], ["throbbing", 8.06]], null, null, null, [["music", 43.36], ["hum", 9.83], ["throbbing", 8.2]], [["reverberation", 12.71], ["music", 11.81], ["speech", 10.31]], null, null, [["throbbing", 31.56], ["hum", 27.38], ["music", 17.06]], [["speech", 33.43], ["music", 29.18], ["electronic music", 1.85]], null, [["music", 47.43], ["foghorn", 22.69], ["theremin", 5.74]], null, null, [["fly, housefly", 23.85], ["music", 21.4], ["insect", 15.0]], [["speech", 40.04], ["music", 16.03], ["sidetone", 6.84]], null, null], "duration": [-0.25, 1.51, 1.12, 1.72, 1.34, 9.66, 11.82, 4.85, 18.26, 0.48, 1.02, 0.26, 3.44, 3.01, 3.23, 1.2, 6.69, 4.34, 0.69, 2.19, 1.39, 0.5, 25.56, 2.91, -0.06, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/jF6JN1VSpmY_filtered.json b/annotations_filtered/jF6JN1VSpmY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e54551c482fb1f1b6fe1911a86d5ac21b694e13a --- /dev/null +++ b/annotations_filtered/jF6JN1VSpmY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 17.15], [20.0, 21.69], [24.0, 25.22], [35.0, 35.36], [36.0, 36.19], [38.0, 38.58], [42.0, 43.85], [45.0, 47.41], [48.0, 49.47], [50.0, 52.54], [53.0, 64.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.69, 0.0, 90.25, 58.22], "audiomae_on_audioset": [[["music", 57.27], ["throbbing", 15.5], ["hum", 9.28]], null, null, null, null, null, null, [["breaking", 55.99], ["music", 29.31], ["speech", 2.07]], null, null, null], "duration": [3.15, 1.69, 1.22, 0.36, 0.19, 0.58, 1.85, 2.41, 1.47, 2.54, 11.25]} \ No newline at end of file diff --git a/annotations_filtered/jF9GE50ioFo_filtered.json b/annotations_filtered/jF9GE50ioFo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a6f21bd799b1d5be8b1950d85495e5b7a17ec7c1 --- /dev/null +++ b/annotations_filtered/jF9GE50ioFo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.05], [18.0, 20.87], [23.0, 24.87], [47.0, 47.71], [55.0, 60.3], [65.0, 74.78], [81.0, 81.26], [91.0, 90.95], [91.0, 91.3], [91.0, 105.24], [107.0, 108.28], [112.0, 112.28], [114.0, 114.84], [121.0, 125.95], [129.0, 129.2], [130.0, 130.62], [131.0, 147.29], [165.0, 166.18], [169.0, 171.04], [174.0, 182.12]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 56.48, 0.0, 0.0, 37.92, 50.51, 0.0, 0.0, 0.0, 41.81, 0.0, 0.0, 0.0, 42.74, 0.0, 0.0, 36.78, 0.0, 66.51, 47.78], "audiomae_on_audioset": [null, null, null, null, [["mains hum", 33.23], ["music", 20.75], ["hum", 14.78]], null, null, null, null, [["music", 68.77], ["speech", 10.81], ["throbbing", 3.45]], null, null, null, [["music", 69.12], ["musical instrument", 5.77], ["synthesizer", 4.59]], null, null, [["music", 66.63], ["synthesizer", 8.09], ["musical instrument", 4.42]], null, null, [["music", 43.48], ["speech", 15.07], ["musical instrument", 6.87]]], "duration": [1.05, 2.87, 1.87, 0.71, 5.3, 9.78, 0.26, -0.05, 0.3, 14.24, 1.28, 0.28, 0.84, 4.95, 0.2, 0.62, 16.29, 1.18, 2.04, 8.12]} \ No newline at end of file diff --git a/annotations_filtered/jFQAy28o7Kc_filtered.json b/annotations_filtered/jFQAy28o7Kc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca7ba27312c346524df4996869f587354c214b78 --- /dev/null +++ b/annotations_filtered/jFQAy28o7Kc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.45], [30.0, 29.93], [34.0, 36.0], [45.0, 44.79], [49.0, 49.18], [50.0, 59.58], [62.0, 78.92], [81.0, 91.96], [93.0, 93.83], [95.0, 95.12], [96.0, 96.03], [104.0, 104.79], [105.0, 107.2], [108.0, 108.36], [111.0, 110.86], [111.0, 111.82]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 47.66, 0.0, 0.0, 30.15, 29.41, 30.71, 0.0, 0.0, 0.0, 0.0, 43.77, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 17.48], ["music", 17.15], ["throbbing", 16.27]], null, null, [["speech", 45.19], ["music", 35.56], ["musical instrument", 2.39]], [["cattle, bovinae", 32.99], ["livestock, farm animals, working animals", 27.98], ["moo", 16.69]], [["music", 69.87], ["whack, thwack", 3.44], ["sound effect", 3.29]], null, null, null, null, [["sidetone", 18.46], ["hum", 15.44], ["speech", 12.77]], null, null, null], "duration": [0.45, -0.07, 2.0, -0.21, 0.18, 9.58, 16.92, 10.96, 0.83, 0.12, 0.03, 0.79, 2.2, 0.36, -0.14, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/jFQUE_6Zhn0_filtered.json b/annotations_filtered/jFQUE_6Zhn0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b368b2eb4f5ee9602530c46ea16f0e3e17c8589 --- /dev/null +++ b/annotations_filtered/jFQUE_6Zhn0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.71], [7.0, 9.27], [10.0, 39.8], [41.0, 42.5], [51.0, 54.09], [62.0, 67.63], [75.0, 88.53], [91.0, 135.53], [137.0, 143.92], [146.0, 155.41]], "keep_status": [false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 40.26, 32.08, 0.0, 39.3, 53.59, 36.84, 0.0, 29.64, 29.78], "audiomae_on_audioset": [null, [["music", 54.16], ["theremin", 18.29], ["didgeridoo", 4.04]], [["music", 42.43], ["theremin", 17.18], ["hum", 7.79]], null, [["whale vocalization", 85.31], ["stomach rumble", 4.84], ["liquid", 1.31]], null, [["music", 59.0], ["didgeridoo", 8.92], ["speech", 5.05]], null, [["throbbing", 31.1], ["music", 22.97], ["hum", 18.71]], [["music", 30.36], ["animal", 4.84], ["throbbing", 4.21]]], "duration": [0.71, 2.27, 29.8, 1.5, 3.09, 5.63, 13.53, 44.53, 6.92, 9.41]} \ No newline at end of file diff --git a/annotations_filtered/jFWnVdsSgxs_filtered.json b/annotations_filtered/jFWnVdsSgxs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8777c4841dc462eebc7e536c946847b87ba6111 --- /dev/null +++ b/annotations_filtered/jFWnVdsSgxs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 28.61], [29.0, 36.17], [38.0, 41.12], [44.0, 45.52], [47.0, 47.92], [49.0, 56.47], [59.0, 66.51], [69.0, 76.77], [83.0, 86.49], [98.0, 126.3], [129.0, 142.25], [145.0, 145.62], [147.0, 154.14], [155.0, 196.97]], "keep_status": [false, false, true, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [33.0, 31.48, 30.87, 0.0, 0.0, 33.09, 31.73, 32.97, 33.08, 30.76, 31.39, 0.0, 31.86, 0.0], "audiomae_on_audioset": [[["hum", 44.34], ["music", 22.87], ["mains hum", 8.44]], [["hum", 37.56], ["throbbing", 22.85], ["music", 17.65]], [["music", 43.0], ["boing", 9.76], ["hum", 9.72]], null, null, [["music", 23.62], ["didgeridoo", 14.05], ["sound effect", 9.57]], [["music", 52.69], ["hum", 11.34], ["throbbing", 5.25]], [["music", 49.38], ["speech", 19.59], ["throbbing", 5.85]], [["music", 48.91], ["didgeridoo", 19.49], ["singing", 4.11]], [["music", 71.04], ["house music", 4.66], ["electronic music", 3.81]], [["music", 63.44], ["throbbing", 4.91], ["electronic music", 4.31]], null, [["music", 63.79], ["house music", 4.03], ["synthetic singing", 3.71]], null], "duration": [14.61, 7.17, 3.12, 1.52, 0.92, 7.47, 7.51, 7.77, 3.49, 28.3, 13.25, 0.62, 7.14, 41.97]} \ No newline at end of file diff --git a/annotations_filtered/jFjy1RkmXUg_filtered.json b/annotations_filtered/jFjy1RkmXUg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca9d2233ffcb7bc4ce185c967bc2eadd7c24aa02 --- /dev/null +++ b/annotations_filtered/jFjy1RkmXUg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.71], [8.0, 8.24], [13.0, 13.73], [18.0, 19.52], [23.0, 24.12], [26.0, 26.69], [30.0, 29.83], [32.0, 32.34], [34.0, 35.6], [37.0, 38.89], [40.0, 40.63], [43.0, 43.9], [49.0, 49.27], [59.0, 60.05], [62.0, 64.5], [67.0, 67.76], [69.0, 69.85], [84.0, 92.84], [100.0, 99.72], [102.0, 106.57], [107.0, 108.63], [110.0, 110.62], [113.0, 113.39], [119.0, 121.19], [127.0, 128.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.98, 0.0, 0.0, 29.07, 0.0, 29.43, 0.0, 0.0, 0.0, 29.16, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.89], ["livestock, farm animals, working animals", 15.1], ["cattle, bovinae", 12.49]], null, [["music", 54.11], ["choir", 17.04], ["singing", 8.99]], null, null, null, [["music", 30.85], ["electric shaver, electric razor", 13.55], ["buzzer", 10.11]], null], "duration": [1.71, 0.24, 0.73, 1.52, 1.12, 0.69, -0.17, 0.34, 1.6, 1.89, 0.63, 0.9, 0.27, 1.05, 2.5, 0.76, 0.85, 8.84, -0.28, 4.57, 1.63, 0.62, 0.39, 2.19, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/jFoUWFmM-NU_filtered.json b/annotations_filtered/jFoUWFmM-NU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b519e7e0dbc5d77af62dd3d454bd937a0142309 --- /dev/null +++ b/annotations_filtered/jFoUWFmM-NU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 46.99], [87.0, 88.05], [93.0, 93.48], [107.0, 107.72], [146.0, 148.31], [155.0, 155.93], [179.0, 179.88]], "keep_status": [false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.27, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 50.4], ["animal", 3.45], ["livestock, farm animals, working animals", 2.73]], null, null], "duration": [-0.01, 1.05, 0.48, 0.72, 2.31, 0.93, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/jFrVoG-edFc_filtered.json b/annotations_filtered/jFrVoG-edFc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/jFrVoG-edFc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/jG7W6jwCSd0_filtered.json b/annotations_filtered/jG7W6jwCSd0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86f822eef418d43f4851bb76647d93a075ccdbf5 --- /dev/null +++ b/annotations_filtered/jG7W6jwCSd0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.25], [11.0, 19.82], [21.0, 23.45], [25.0, 26.94], [31.0, 34.1], [36.0, 37.83], [40.0, 41.32], [46.0, 46.2], [47.0, 46.7], [47.0, 48.63], [50.0, 55.7], [57.0, 59.07], [59.0, 60.74], [68.0, 69.09], [74.0, 83.0], [85.0, 85.89], [90.0, 90.54], [93.0, 94.17]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 42.35, 36.7, 0.0, 35.66, 0.0, 0.0, 0.0, 0.0, 0.0, 33.18, 32.24, 0.0, 0.0, 32.55, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 65.86], ["guitar", 4.24], ["speech", 3.94]], [["music", 51.41], ["guitar", 6.21], ["bass guitar", 5.88]], null, [["music", 65.69], ["guitar", 8.09], ["musical instrument", 6.93]], null, null, null, null, null, [["music", 72.5], ["guitar", 2.75], ["singing", 2.63]], [["music", 70.29], ["musical instrument", 4.03], ["plucked string instrument", 2.76]], null, null, [["music", 81.8], ["singing", 2.14], ["folk music", 1.64]], null, null, null], "duration": [0.25, 8.82, 2.45, 1.94, 3.1, 1.83, 1.32, 0.2, -0.3, 1.63, 5.7, 2.07, 1.74, 1.09, 9.0, 0.89, 0.54, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/jGAsihLnYqM_filtered.json b/annotations_filtered/jGAsihLnYqM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ec2cf8e05a2fa0d1a128daef3e6c9f115e66adb --- /dev/null +++ b/annotations_filtered/jGAsihLnYqM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.39], [7.0, 7.69], [8.0, 9.34], [10.0, 12.01], [22.0, 22.89], [25.0, 29.64], [35.0, 36.34], [37.0, 37.32], [41.0, 41.3], [48.0, 48.14], [50.0, 81.6], [82.0, 84.01], [85.0, 85.77], [86.0, 89.68], [90.0, 92.8], [94.0, 96.52], [97.0, 100.23], [103.0, 104.31], [106.0, 107.52], [110.0, 113.68], [115.0, 116.28], [122.0, 123.65], [124.0, 130.17], [131.0, 134.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [90.25, 0.0, 0.0, 94.66, 0.0, 93.29, 0.0, 0.0, 0.0, 0.0, 0.0, 39.02, 0.0, 35.62, 36.22, 37.95, 41.07, 0.0, 0.0, 30.82, 0.0, 0.0, 93.6, 87.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 34.6], ["whale vocalization", 13.68], ["electronic music", 6.85]], null, [["whale vocalization", 34.12], ["music", 12.29], ["speech", 11.82]], [["whale vocalization", 66.88], ["speech", 21.27], ["music", 3.35]], [["music", 36.82], ["whale vocalization", 30.64], ["electronic music", 6.71]], [["music", 31.77], ["whale vocalization", 16.9], ["electronic music", 9.79]], null, null, [["whale vocalization", 40.33], ["music", 27.69], ["sonar", 7.28]], null, null, null, null], "duration": [4.39, 0.69, 1.34, 2.01, 0.89, 4.64, 1.34, 0.32, 0.3, 0.14, 31.6, 2.01, 0.77, 3.68, 2.8, 2.52, 3.23, 1.31, 1.52, 3.68, 1.28, 1.65, 6.17, 3.1]} \ No newline at end of file diff --git a/annotations_filtered/jGCY8thosNw_filtered.json b/annotations_filtered/jGCY8thosNw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7df10c93beda6572c8bf788adb60eb8715c3d702 --- /dev/null +++ b/annotations_filtered/jGCY8thosNw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.37], [6.0, 7.38], [9.0, 10.45], [12.0, 13.29], [15.0, 17.44], [20.0, 21.83], [28.0, 29.64], [32.0, 37.18], [39.0, 41.01], [42.0, 43.92], [46.0, 47.56], [50.0, 50.01], [55.0, 56.24], [68.0, 67.71], [72.0, 72.87], [77.0, 77.97], [80.0, 80.89]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 37.97, 0.0, 0.0, 44.6, 55.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["livestock, farm animals, working animals", 24.46], ["music", 12.57], ["speech", 10.02]], null, null, [["speech", 54.55], ["music", 22.69], ["hum", 2.44]], null, null, null, null, null, null, null, null, null], "duration": [1.37, 1.38, 1.45, 1.29, 2.44, 1.83, 1.64, 5.18, 2.01, 1.92, 1.56, 0.01, 1.24, -0.29, 0.87, 0.97, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/jGXpyMDIZ_U_filtered.json b/annotations_filtered/jGXpyMDIZ_U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3fcb5c1caff429d00155f03d181a25b145a649b --- /dev/null +++ b/annotations_filtered/jGXpyMDIZ_U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.26], [15.0, 16.07], [20.0, 22.25], [24.0, 24.11], [26.0, 26.86], [30.0, 31.11], [32.0, 32.51], [35.0, 35.7], [37.0, 37.67], [39.0, 39.33], [41.0, 48.17], [50.0, 52.86], [54.0, 56.94], [58.0, 59.37], [61.0, 63.14], [67.0, 69.03], [70.0, 74.55], [76.0, 83.32], [87.0, 92.5], [97.0, 100.65], [101.0, 100.72], [101.0, 107.16], [108.0, 111.72], [112.0, 112.31], [112.0, 115.75], [118.0, 134.86], [137.0, 138.52], [140.0, 141.27], [143.0, 144.12], [148.0, 149.54], [156.0, 157.84], [160.0, 161.69], [162.0, 163.07], [167.0, 168.27], [171.0, 172.67], [174.0, 177.53], [178.0, 181.68], [187.0, 190.09], [193.0, 195.49], [200.0, 202.36], [203.0, 206.59], [212.0, 212.97], [219.0, 221.93], [224.0, 225.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.31, 82.25, 78.21, 0.0, 91.47, 64.41, 55.46, 48.82, 28.38, 28.04, 0.0, 29.43, 30.39, 0.0, 30.49, 32.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 47.7, 49.78, 51.71, 66.88, 83.16, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["sidetone", 81.77], ["speech", 12.99], ["music", 1.2]], null, null, null, null, null, null, [["speech", 43.26], ["music", 25.3], ["didgeridoo", 5.16]], [["speech", 69.68], ["fart", 6.78], ["music", 4.66]], [["speech", 24.64], ["mains hum", 12.92], ["hum", 6.3]], null, [["breaking", 33.72], ["whack, thwack", 14.14], ["fart", 5.04]], [["frog", 39.47], ["fart", 7.74], ["croak", 6.27]], null, [["fart", 39.0], ["didgeridoo", 23.29], ["theremin", 5.55]], [["sound effect", 10.12], ["fart", 9.5], ["boing", 9.47]], null, null, null, null, null, null, null, null, null, null, [["speech", 77.91], ["telephone bell ringing", 6.61], ["music", 2.96]], [["dog", 46.04], ["animal", 11.68], ["domestic animals, pets", 10.97]], null, null, null, null, null, null], "duration": [2.26, 1.07, 2.25, 0.11, 0.86, 1.11, 0.51, 0.7, 0.67, 0.33, 7.17, 2.86, 2.94, 1.37, 2.14, 2.03, 4.55, 7.32, 5.5, 3.65, -0.28, 6.16, 3.72, 0.31, 3.75, 16.86, 1.52, 1.27, 1.12, 1.54, 1.84, 1.69, 1.07, 1.27, 1.67, 3.53, 3.68, 3.09, 2.49, 2.36, 3.59, 0.97, 2.93, 1.58]} \ No newline at end of file diff --git a/annotations_filtered/jH07BdMRP0g_filtered.json b/annotations_filtered/jH07BdMRP0g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..892a93006bf2c2bf259876b4b7efc45f63768042 --- /dev/null +++ b/annotations_filtered/jH07BdMRP0g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.67], [31.0, 32.83], [43.0, 45.1], [55.0, 55.26], [58.0, 58.41], [62.0, 61.92], [64.0, 64.59], [73.0, 73.13], [85.0, 90.39], [94.0, 95.44], [98.0, 99.52], [111.0, 111.3], [123.0, 129.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 44.4, 0.0, 0.0, 0.0, 0.0, 0.0, 44.34, 0.0, 0.0, 0.0, 47.58], "audiomae_on_audioset": [null, null, [["music", 71.65], ["drip", 2.31], ["whale vocalization", 2.24]], null, null, null, null, null, [["music", 61.78], ["electronic music", 7.06], ["throbbing", 5.36]], null, null, null, [["music", 73.98], ["speech", 3.84], ["musical instrument", 2.0]]], "duration": [1.67, 1.83, 2.1, 0.26, 0.41, -0.08, 0.59, 0.13, 5.39, 1.44, 1.52, 0.3, 6.73]} \ No newline at end of file diff --git a/annotations_filtered/jH2OKc8HPw8_filtered.json b/annotations_filtered/jH2OKc8HPw8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1bcdb71727fa00358056f60b423e9a08f881b28 --- /dev/null +++ b/annotations_filtered/jH2OKc8HPw8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.31], [7.0, 9.78], [11.0, 11.3], [13.0, 12.97], [15.0, 17.56], [19.0, 19.6], [22.0, 23.26], [24.0, 26.28], [29.0, 30.2], [31.0, 31.89], [34.0, 37.07], [40.0, 40.22], [42.0, 42.15], [44.0, 46.23], [49.0, 49.3], [52.0, 54.11], [56.0, 56.35], [57.0, 58.89], [62.0, 62.8], [67.0, 68.49], [71.0, 72.74], [73.0, 74.17], [76.0, 85.4], [86.0, 87.25], [90.0, 90.83], [93.0, 92.52], [93.0, 93.55], [95.0, 95.49], [100.0, 102.78], [111.0, 111.48], [112.0, 113.64], [117.0, 118.59], [119.0, 119.1], [120.0, 119.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.44, 100.0, 0.0, 0.0, 98.8, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 30.29, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 35.8], ["livestock, farm animals, working animals", 31.15], ["moo", 29.32]], null, null, null, null, null], "duration": [2.31, 2.78, 0.3, -0.03, 2.56, 0.6, 1.26, 2.28, 1.2, 0.89, 3.07, 0.22, 0.15, 2.23, 0.3, 2.11, 0.35, 1.89, 0.8, 1.49, 1.74, 1.17, 9.4, 1.25, 0.83, -0.48, 0.55, 0.49, 2.78, 0.48, 1.64, 1.59, 0.1, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/jHessqORWLw_filtered.json b/annotations_filtered/jHessqORWLw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c69e6f4940408b4108595256969803820a1e2439 --- /dev/null +++ b/annotations_filtered/jHessqORWLw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.35], [16.0, 17.47], [18.0, 55.19], [57.0, 60.51], [63.0, 65.58], [68.0, 69.31], [70.0, 72.3], [90.0, 90.71], [96.0, 96.11], [97.0, 97.75], [98.0, 99.81], [101.0, 111.32], [113.0, 114.42], [118.0, 123.69]], "keep_status": [true, false, false, false, true, false, true, false, false, false, false, true, false, true], "silence_prob": [41.72, 0.0, 0.0, 39.64, 45.43, 0.0, 36.15, 0.0, 0.0, 0.0, 0.0, 35.79, 0.0, 31.18], "audiomae_on_audioset": [[["music", 57.08], ["didgeridoo", 6.81], ["musical instrument", 4.42]], null, null, [["cattle, bovinae", 49.91], ["moo", 26.64], ["livestock, farm animals, working animals", 23.21]], [["fly, housefly", 31.3], ["insect", 10.89], ["mosquito", 7.73]], null, [["speech", 22.99], ["hum", 5.61], ["sound effect", 4.5]], null, null, null, null, [["fly, housefly", 15.76], ["hum", 10.8], ["music", 10.19]], null, [["livestock, farm animals, working animals", 12.91], ["speech", 10.81], ["cattle, bovinae", 7.43]]], "duration": [2.35, 1.47, 37.19, 3.51, 2.58, 1.31, 2.3, 0.71, 0.11, 0.75, 1.81, 10.32, 1.42, 5.69]} \ No newline at end of file diff --git a/annotations_filtered/jIyn1q4Ilpw_filtered.json b/annotations_filtered/jIyn1q4Ilpw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebcd93195550046634a055c6d7ffe23eb74b92ae --- /dev/null +++ b/annotations_filtered/jIyn1q4Ilpw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.03], [8.0, 8.33], [22.0, 22.15], [23.0, 23.92], [26.0, 27.7], [30.0, 31.31], [33.0, 33.03], [37.0, 37.44], [51.0, 52.02], [54.0, 55.22], [62.0, 61.99], [63.0, 63.34], [67.0, 67.41], [68.0, 70.6], [76.0, 77.18], [79.0, 79.49], [81.0, 81.38], [83.0, 83.32], [92.0, 92.42], [96.0, 96.52], [98.0, 98.37], [102.0, 102.79], [107.0, 107.64], [117.0, 119.82], [120.0, 120.83], [124.0, 125.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.07, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 24.14], ["music", 22.29], ["sidetone", 7.34]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.03, 0.33, 0.15, 0.92, 1.7, 1.31, 0.03, 0.44, 1.02, 1.22, -0.01, 0.34, 0.41, 2.6, 1.18, 0.49, 0.38, 0.32, 0.42, 0.52, 0.37, 0.79, 0.64, 2.82, 0.83, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/jJ4zpJxcw4o_filtered.json b/annotations_filtered/jJ4zpJxcw4o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df15cb436cacf18b21bc6d9ab225d775befcafed --- /dev/null +++ b/annotations_filtered/jJ4zpJxcw4o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.84], [5.0, 6.37], [7.0, 9.27], [11.0, 11.13], [12.0, 12.78], [16.0, 15.77], [19.0, 18.99], [30.0, 30.18], [34.0, 35.78], [37.0, 37.05], [44.0, 46.92], [47.0, 59.53], [66.0, 93.51], [103.0, 103.01], [106.0, 108.21], [110.0, 111.5], [112.0, 114.34], [116.0, 116.63], [118.0, 118.57], [122.0, 123.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 37.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.26, 31.69, 31.62, 0.0, 39.88, 0.0, 33.47, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 43.74], ["whale vocalization", 23.6], ["hum", 5.51]], null, null, null, null, null, null, null, [["bee, wasp, etc.", 41.93], ["fly, housefly", 15.98], ["insect", 11.34]], [["music", 88.05], ["musical instrument", 2.77], ["effects unit", 1.49]], [["music", 44.96], ["ambient music", 15.14], ["theremin", 11.13]], null, [["speech", 49.99], ["stomach rumble", 5.5], ["hiccup", 4.18]], null, [["speech", 66.9], ["sidetone", 4.59], ["music", 2.86]], null, null, null], "duration": [1.84, 1.37, 2.27, 0.13, 0.78, -0.23, -0.01, 0.18, 1.78, 0.05, 2.92, 12.53, 27.51, 0.01, 2.21, 1.5, 2.34, 0.63, 0.57, 1.47]} \ No newline at end of file diff --git a/annotations_filtered/jJ8rgMkWFWA_filtered.json b/annotations_filtered/jJ8rgMkWFWA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da17b7d982c26870d72e108732cab7ebeace005d --- /dev/null +++ b/annotations_filtered/jJ8rgMkWFWA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.42], [5.0, 7.6], [10.0, 10.25], [15.0, 15.52], [21.0, 21.69], [23.0, 23.08], [24.0, 24.75], [26.0, 26.49], [28.0, 28.09], [30.0, 30.45], [37.0, 38.75], [39.0, 41.15], [42.0, 45.1], [47.0, 49.44], [50.0, 51.36], [55.0, 55.48], [57.0, 57.4], [61.0, 62.61], [68.0, 84.13], [86.0, 102.84], [103.0, 105.71], [106.0, 109.59], [110.0, 111.11], [113.0, 114.02], [115.0, 114.99], [118.0, 120.53], [126.0, 126.32], [129.0, 130.03], [132.0, 132.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 93.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.17, 32.12, 32.07, 0.0, 0.0, 0.0, 0.0, 47.12, 60.05, 58.13, 54.04, 0.0, 0.0, 0.0, 36.97, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 49.71], ["fly, housefly", 6.17], ["sidetone", 5.95]], [["cattle, bovinae", 35.48], ["moo", 34.76], ["livestock, farm animals, working animals", 29.23]], null, null, null, null, [["music", 47.74], ["trombone", 17.1], ["brass instrument", 12.59]], null, null, null, null, null, null, [["speech", 79.08], ["sidetone", 14.75], ["radio", 2.31]], null, null, null], "duration": [1.42, 2.6, 0.25, 0.52, 0.69, 0.08, 0.75, 0.49, 0.09, 0.45, 1.75, 2.15, 3.1, 2.44, 1.36, 0.48, 0.4, 1.61, 16.13, 16.84, 2.71, 3.59, 1.11, 1.02, -0.01, 2.53, 0.32, 1.03, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/jJHNJjwNUWM_filtered.json b/annotations_filtered/jJHNJjwNUWM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a6116109986c94c423f9e6c93716f95c7469c17 --- /dev/null +++ b/annotations_filtered/jJHNJjwNUWM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.43], [4.0, 3.79], [4.0, 3.94], [14.0, 17.88], [20.0, 20.19], [23.0, 23.09], [26.0, 26.7], [30.0, 32.1], [36.0, 37.86], [42.0, 43.58], [47.0, 47.31], [56.0, 56.51], [70.0, 72.28], [73.0, 73.89], [75.0, 75.19], [77.0, 77.46], [80.0, 80.28], [81.0, 81.62], [82.0, 81.73], [98.0, 99.2], [102.0, 102.63], [110.0, 110.39], [115.0, 116.18], [116.0, 116.75], [123.0, 127.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 61.08, 0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 0.0, 0.0, 89.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.4], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.29], ["sidetone", 14.7], ["music", 8.0]]], "duration": [1.43, -0.21, -0.06, 3.88, 0.19, 0.09, 0.7, 2.1, 1.86, 1.58, 0.31, 0.51, 2.28, 0.89, 0.19, 0.46, 0.28, 0.62, -0.27, 1.2, 0.63, 0.39, 1.18, 0.75, 4.52]} \ No newline at end of file diff --git a/annotations_filtered/jJMXxv-hYPo_filtered.json b/annotations_filtered/jJMXxv-hYPo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b539ee026528ec22b5b82c5a51480438d74f386c --- /dev/null +++ b/annotations_filtered/jJMXxv-hYPo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.05], [4.0, 4.28], [10.0, 11.48], [13.0, 14.23], [18.0, 18.45], [20.0, 20.07], [21.0, 22.71], [25.0, 24.65], [25.0, 25.46], [31.0, 31.58], [37.0, 39.68], [42.0, 43.11], [45.0, 45.81], [48.0, 49.35], [50.0, 51.65], [53.0, 55.76], [59.0, 60.37], [61.0, 63.42], [65.0, 65.62], [66.0, 67.9], [68.0, 69.3], [70.0, 71.9], [73.0, 73.52], [78.0, 78.49], [79.0, 80.2], [81.0, 81.67], [87.0, 87.25], [88.0, 90.76], [92.0, 121.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.09, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.01, 31.65], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 50.62], ["music", 16.34], ["musical instrument", 4.07]]], "duration": [0.05, 0.28, 1.48, 1.23, 0.45, 0.07, 1.71, -0.35, 0.46, 0.58, 2.68, 1.11, 0.81, 1.35, 1.65, 2.76, 1.37, 2.42, 0.62, 1.9, 1.3, 1.9, 0.52, 0.49, 1.2, 0.67, 0.25, 2.76, 29.83]} \ No newline at end of file diff --git a/annotations_filtered/jJZ5x-zUx28_filtered.json b/annotations_filtered/jJZ5x-zUx28_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c409cd5aee4ffe21cf574e6c68556c2cea07a98a --- /dev/null +++ b/annotations_filtered/jJZ5x-zUx28_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 28.92], [34.0, 34.47], [35.0, 45.94], [48.0, 49.0], [51.0, 56.02], [57.0, 58.55], [59.0, 58.65], [59.0, 61.84], [69.0, 74.7]], "keep_status": [true, false, true, false, true, false, false, false, false], "silence_prob": [30.4, 0.0, 30.76, 0.0, 32.12, 0.0, 0.0, 31.79, 32.12], "audiomae_on_audioset": [[["music", 30.49], ["vehicle", 13.28], ["synthesizer", 6.68]], null, [["music", 39.92], ["speech", 13.35], ["theremin", 13.28]], null, [["music", 27.1], ["fowl", 13.83], ["gobble", 8.43]], null, null, [["music", 71.91], ["hum", 3.98], ["synthesizer", 3.05]], [["music", 35.4], ["mains hum", 20.07], ["hum", 16.89]]], "duration": [7.92, 0.47, 10.94, 1.0, 5.02, 1.55, -0.35, 2.84, 5.7]} \ No newline at end of file diff --git a/annotations_filtered/jJ_p_xhMEvU_filtered.json b/annotations_filtered/jJ_p_xhMEvU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37a52c031b20c7e2593c081e541bf515c0c62536 --- /dev/null +++ b/annotations_filtered/jJ_p_xhMEvU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 12.01], [17.0, 22.65], [23.0, 26.27], [26.0, 26.65], [29.0, 47.34], [51.0, 60.51], [61.0, 62.29], [63.0, 73.67]], "keep_status": [false, false, false, false, false, false, false, true], "silence_prob": [32.9, 36.89, 38.23, 0.0, 31.83, 31.25, 0.0, 42.46], "audiomae_on_audioset": [[["music", 39.83], ["speech", 33.22], ["explosion", 1.77]], [["music", 54.38], ["speech", 27.49], ["boing", 3.53]], [["music", 42.4], ["speech", 29.63], ["musical instrument", 3.34]], null, [["music", 61.92], ["guitar", 5.29], ["musical instrument", 4.15]], [["cattle, bovinae", 28.86], ["moo", 24.7], ["livestock, farm animals, working animals", 24.19]], null, [["speech", 57.38], ["buzz", 4.34], ["creak", 4.02]]], "duration": [6.01, 5.65, 3.27, 0.65, 18.34, 9.51, 1.29, 10.67]} \ No newline at end of file diff --git a/annotations_filtered/jJiKYmmWiCA_filtered.json b/annotations_filtered/jJiKYmmWiCA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9e7b310ea02401987a5754c1388f935da615c68 --- /dev/null +++ b/annotations_filtered/jJiKYmmWiCA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.99], [7.0, 6.84], [8.0, 8.48], [10.0, 10.77], [12.0, 12.66], [13.0, 14.1], [15.0, 16.46], [17.0, 17.9], [29.0, 29.84], [34.0, 34.8], [40.0, 40.53], [42.0, 41.89], [43.0, 43.36], [50.0, 51.97], [56.0, 56.62], [58.0, 58.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.99, -0.16, 0.48, 0.77, 0.66, 1.1, 1.46, 0.9, 0.84, 0.8, 0.53, -0.11, 0.36, 1.97, 0.62, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/jJvvT_Sb0jo_filtered.json b/annotations_filtered/jJvvT_Sb0jo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf8dffa56a8a1f9a7bf55f22b0ea4cdd9827f33d --- /dev/null +++ b/annotations_filtered/jJvvT_Sb0jo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.51], [19.0, 19.82], [20.0, 22.3], [23.0, 25.07], [27.0, 30.3], [35.0, 36.64], [40.0, 40.83], [45.0, 45.39], [62.0, 61.72], [62.0, 68.28], [71.0, 72.4], [75.0, 75.34], [79.0, 80.28], [86.0, 88.06], [90.0, 100.74], [102.0, 111.5], [113.0, 113.58], [120.0, 121.07], [125.0, 126.33], [128.0, 127.72], [136.0, 136.8], [140.0, 148.49], [150.0, 152.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 93.91, 96.17, 59.86, 0.0, 0.0, 0.0, 0.0, 58.55, 0.0, 0.0, 0.0, 59.07, 41.87, 42.22, 0.0, 0.0, 0.0, 0.0, 0.0, 33.26, 37.18], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.07], ["hum", 17.51], ["music", 11.26]], [["music", 36.37], ["burping, eructation", 14.79], ["fart", 11.76]], null, null, null, null, null, [["hum", 24.41], ["music", 23.24], ["mains hum", 16.38]], [["music", 28.88], ["mains hum", 25.15], ["hum", 19.68]]], "duration": [1.51, 0.82, 2.3, 2.07, 3.3, 1.64, 0.83, 0.39, -0.28, 6.28, 1.4, 0.34, 1.28, 2.06, 10.74, 9.5, 0.58, 1.07, 1.33, -0.28, 0.8, 8.49, 2.36]} \ No newline at end of file diff --git a/annotations_filtered/jK0s7zfdDOc_filtered.json b/annotations_filtered/jK0s7zfdDOc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b2f3cea02553efd94cbae670c819d9d9cf98c83 --- /dev/null +++ b/annotations_filtered/jK0s7zfdDOc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 30.13], [30.0, 64.5], [70.0, 70.85], [89.0, 92.1]], "keep_status": [true, false, false, false], "silence_prob": [30.7, 0.0, 0.0, 94.22], "audiomae_on_audioset": [[["hum", 33.49], ["throbbing", 20.19], ["mains hum", 15.2]], null, null, null], "duration": [16.13, 34.5, 0.85, 3.1]} \ No newline at end of file diff --git a/annotations_filtered/jK4lxjvrhHs_filtered.json b/annotations_filtered/jK4lxjvrhHs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5dec8c10f850ac0d9c9c370046927633823c9813 --- /dev/null +++ b/annotations_filtered/jK4lxjvrhHs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.64], [8.0, 8.99], [9.0, 10.39], [12.0, 13.95], [19.0, 19.67], [25.0, 24.75], [26.0, 26.0], [32.0, 32.27], [33.0, 33.47], [42.0, 41.79], [44.0, 45.01], [63.0, 63.51], [65.0, 64.72], [65.0, 66.88], [69.0, 69.13], [74.0, 73.94], [75.0, 74.85], [75.0, 76.49], [77.0, 77.28], [88.0, 89.04], [93.0, 92.96], [97.0, 97.88], [103.0, 103.71], [111.0, 112.21], [113.0, 113.09], [114.0, 115.23], [116.0, 116.09], [119.0, 119.3], [126.0, 126.18], [127.0, 130.25], [133.0, 134.3], [135.0, 136.39], [138.0, 140.14], [142.0, 142.11], [143.0, 143.72], [151.0, 152.24], [153.0, 153.96], [156.0, 157.17], [162.0, 164.1], [168.0, 168.57], [170.0, 171.27], [173.0, 172.96], [174.0, 175.41], [177.0, 177.11], [180.0, 180.49], [182.0, 183.29], [185.0, 185.94], [190.0, 190.31], [192.0, 193.18], [194.0, 194.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.15, 0.0, 0.0, 31.28, 0.0, 0.0, 0.0, 0.0, 0.0, 56.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 81.84], ["animal", 1.47], ["livestock, farm animals, working animals", 1.47]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.64, 0.99, 1.39, 1.95, 0.67, -0.25, 0.0, 0.27, 0.47, -0.21, 1.01, 0.51, -0.28, 1.88, 0.13, -0.06, -0.15, 1.49, 0.28, 1.04, -0.04, 0.88, 0.71, 1.21, 0.09, 1.23, 0.09, 0.3, 0.18, 3.25, 1.3, 1.39, 2.14, 0.11, 0.72, 1.24, 0.96, 1.17, 2.1, 0.57, 1.27, -0.04, 1.41, 0.11, 0.49, 1.29, 0.94, 0.31, 1.18, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/jKC6UsetwN4_filtered.json b/annotations_filtered/jKC6UsetwN4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0f8340847bf5de604adf9c94b06a801b91cfc01 --- /dev/null +++ b/annotations_filtered/jKC6UsetwN4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.91], [16.0, 16.01], [19.0, 19.6], [44.0, 44.2], [51.0, 51.54], [53.0, 54.14], [58.0, 59.09], [71.0, 71.49], [75.0, 74.87], [79.0, 81.21], [88.0, 88.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.68, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.91, 0.01, 0.6, 0.2, 0.54, 1.14, 1.09, 0.49, -0.13, 2.21, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/jKCpGDv8vuY_filtered.json b/annotations_filtered/jKCpGDv8vuY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3605adcb46433baf25b62533e6356a7095acde00 --- /dev/null +++ b/annotations_filtered/jKCpGDv8vuY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 11.87], [23.0, 25.51], [28.0, 49.4], [53.0, 52.95], [53.0, 54.87]], "keep_status": [true, false, false, false, false], "silence_prob": [39.63, 69.74, 54.04, 0.0, 0.0], "audiomae_on_audioset": [[["music", 24.16], ["moo", 18.83], ["cattle, bovinae", 18.36]], null, null, null, null], "duration": [10.87, 2.51, 21.4, -0.05, 1.87]} \ No newline at end of file diff --git a/annotations_filtered/jKGudyrV0v4_filtered.json b/annotations_filtered/jKGudyrV0v4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2827807bb3a181cc4698e11ee6d61a69e43ebf8 --- /dev/null +++ b/annotations_filtered/jKGudyrV0v4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.03], [9.0, 9.66], [12.0, 13.32], [15.0, 16.88], [21.0, 21.42], [22.0, 22.65], [29.0, 35.31], [38.0, 40.95], [50.0, 51.17], [52.0, 53.08], [57.0, 58.11], [60.0, 59.66], [63.0, 63.88], [67.0, 67.86], [69.0, 69.87], [72.0, 79.1], [84.0, 87.15], [87.0, 87.47], [87.0, 87.51], [88.0, 88.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.3, 77.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.5, 47.98, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 76.82], ["music", 4.13], ["speech synthesizer", 1.99]], null, null, null], "duration": [0.03, 0.66, 1.32, 1.88, 0.42, 0.65, 6.31, 2.95, 1.17, 1.08, 1.11, -0.34, 0.88, 0.86, 0.87, 7.1, 3.15, 0.47, 0.51, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/jKIG_-544gY_filtered.json b/annotations_filtered/jKIG_-544gY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad6fd9969664938e1a9783d343fd7f14a8d2edbf --- /dev/null +++ b/annotations_filtered/jKIG_-544gY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.55], [20.0, 38.42], [40.0, 46.3], [55.0, 67.37], [68.0, 68.34], [70.0, 70.58], [72.0, 84.57], [86.0, 89.02], [92.0, 92.75], [95.0, 95.66], [96.0, 103.71], [105.0, 107.08], [109.0, 121.37], [123.0, 123.45], [125.0, 124.87], [126.0, 127.23], [130.0, 130.01], [131.0, 131.48], [132.0, 134.25], [135.0, 135.19], [138.0, 139.16], [142.0, 150.15], [150.0, 150.94], [151.0, 156.24], [158.0, 158.5], [159.0, 165.7], [168.0, 169.33]], "keep_status": [false, false, true, true, false, false, true, true, false, false, false, true, true, false, false, false, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 37.07, 35.13, 32.85, 0.0, 0.0, 30.31, 34.05, 0.0, 0.0, 33.02, 36.47, 29.55, 0.0, 0.0, 0.0, 0.0, 0.0, 30.87, 0.0, 0.0, 29.33, 0.0, 30.64, 0.0, 31.13, 0.0], "audiomae_on_audioset": [null, [["hum", 30.15], ["music", 25.72], ["mains hum", 18.78]], [["music", 40.1], ["didgeridoo", 6.89], ["speech", 4.09]], [["speech", 44.44], ["fart", 11.59], ["animal", 6.81]], null, null, [["speech", 24.91], ["fart", 14.64], ["music", 12.95]], [["music", 47.81], ["theremin", 4.65], ["musical instrument", 3.97]], null, null, [["fly, housefly", 49.4], ["fart", 21.92], ["insect", 13.92]], [["music", 31.2], ["hum", 7.4], ["mains hum", 6.44]], [["speech", 34.41], ["music", 10.23], ["groan", 10.07]], null, null, null, null, null, [["vehicle", 29.93], ["boat, water vehicle", 15.39], ["motorboat, speedboat", 9.95]], null, null, [["music", 34.47], ["speech", 21.11], ["rumble", 7.41]], null, [["music", 55.28], ["speech", 21.34], ["didgeridoo", 5.59]], null, [["music", 45.14], ["foghorn", 20.15], ["fly, housefly", 5.52]], null], "duration": [1.55, 18.42, 6.3, 12.37, 0.34, 0.58, 12.57, 3.02, 0.75, 0.66, 7.71, 2.08, 12.37, 0.45, -0.13, 1.23, 0.01, 0.48, 2.25, 0.19, 1.16, 8.15, 0.94, 5.24, 0.5, 6.7, 1.33]} \ No newline at end of file diff --git a/annotations_filtered/jKVDdMG37ig_filtered.json b/annotations_filtered/jKVDdMG37ig_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3619ff8a55b94aa897c1fbcb92e0fa89432a1f15 --- /dev/null +++ b/annotations_filtered/jKVDdMG37ig_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.78], [31.0, 49.11], [49.0, 50.25], [52.0, 61.37], [71.0, 71.41], [74.0, 74.56], [75.0, 80.84], [85.0, 86.04], [89.0, 89.07], [91.0, 91.35], [93.0, 94.12], [96.0, 96.26], [97.0, 100.26], [101.0, 102.34], [104.0, 104.35]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.64, 0.0, 33.86, 0.0, 0.0, 35.16, 0.0, 0.0, 0.0, 0.0, 0.0, 60.98, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 64.49], ["speech", 8.26], ["brass instrument", 6.33]], null, [["brass instrument", 34.53], ["music", 24.42], ["trombone", 11.83]], null, null, [["music", 34.1], ["didgeridoo", 11.12], ["musical instrument", 9.77]], null, null, null, null, null, null, null, null], "duration": [0.78, 18.11, 1.25, 9.37, 0.41, 0.56, 5.84, 1.04, 0.07, 0.35, 1.12, 0.26, 3.26, 1.34, 0.35]} \ No newline at end of file diff --git a/annotations_filtered/jKXg2eMaNXU_filtered.json b/annotations_filtered/jKXg2eMaNXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db1dd58635e027ced6217414b510117f52806902 --- /dev/null +++ b/annotations_filtered/jKXg2eMaNXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.58], [2.0, 3.6], [9.0, 13.27], [14.0, 15.13], [16.0, 18.06], [19.0, 22.45], [24.0, 24.83], [31.0, 32.59], [34.0, 36.14], [37.0, 40.04], [40.0, 42.65], [43.0, 43.71], [45.0, 54.03], [56.0, 65.1], [66.0, 67.71], [71.0, 71.41], [73.0, 74.43], [75.0, 75.29], [78.0, 80.79], [81.0, 83.46], [85.0, 86.93], [92.0, 94.27], [95.0, 100.33], [103.0, 104.33], [105.0, 106.39], [107.0, 110.15], [112.0, 113.93], [115.0, 117.73], [119.0, 119.96], [123.0, 124.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.97, 0.0, 99.99, 59.68, 0.0, 0.0, 99.95, 42.62, 34.48, 0.0, 43.0, 94.52, 0.0, 0.0, 0.0, 0.0, 96.29, 36.72, 0.0, 44.15, 93.29, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["sidetone", 42.38], ["speech", 36.3], ["music", 5.01]], [["speech", 87.36], ["radio", 2.52], ["dial tone", 2.17]], null, [["speech", 55.33], ["dial tone", 13.4], ["sine wave", 6.73]], null, null, null, null, null, null, [["speech", 46.13], ["tuning fork", 18.74], ["dial tone", 16.21]], null, [["speech", 57.83], ["music", 6.29], ["sine wave", 5.14]], null, null, null, null, null, null, null, null], "duration": [0.58, 1.6, 4.27, 1.13, 2.06, 3.45, 0.83, 1.59, 2.14, 3.04, 2.65, 0.71, 9.03, 9.1, 1.71, 0.41, 1.43, 0.29, 2.79, 2.46, 1.93, 2.27, 5.33, 1.33, 1.39, 3.15, 1.93, 2.73, 0.96, 1.66]} \ No newline at end of file diff --git a/annotations_filtered/jKa9O33GXLI_filtered.json b/annotations_filtered/jKa9O33GXLI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c87a783a8622cc6b1ddf30940a4131fc330cd7b0 --- /dev/null +++ b/annotations_filtered/jKa9O33GXLI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.29], [22.0, 23.26], [25.0, 35.01], [45.0, 47.06], [49.0, 49.82], [51.0, 60.61], [64.0, 64.29], [69.0, 73.8], [79.0, 86.51], [101.0, 112.83], [114.0, 115.3], [116.0, 121.56], [123.0, 124.19]], "keep_status": [false, false, false, false, false, true, false, true, true, false, false, false, false], "silence_prob": [30.94, 0.0, 31.17, 33.61, 0.0, 29.92, 0.0, 33.96, 31.95, 29.7, 0.0, 30.86, 0.0], "audiomae_on_audioset": [[["boing", 49.72], ["music", 13.18], ["didgeridoo", 11.21]], null, [["music", 45.86], ["speech", 25.31], ["brass instrument", 6.37]], [["music", 46.06], ["trombone", 17.09], ["brass instrument", 10.06]], null, [["foghorn", 31.12], ["speech", 19.22], ["music", 8.84]], null, [["speech", 28.98], ["music", 27.56], ["sidetone", 7.46]], [["music", 32.87], ["speech", 18.51], ["brass instrument", 13.07]], [["livestock, farm animals, working animals", 43.29], ["cattle, bovinae", 22.8], ["moo", 21.14]], null, [["music", 47.92], ["foghorn", 19.84], ["didgeridoo", 5.87]], null], "duration": [4.29, 1.26, 10.01, 2.06, 0.82, 9.61, 0.29, 4.8, 7.51, 11.83, 1.3, 5.56, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/jKyhNbLEKxY_filtered.json b/annotations_filtered/jKyhNbLEKxY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b689ab512f987fd76d92379c102129fd2e9fd93 --- /dev/null +++ b/annotations_filtered/jKyhNbLEKxY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.77], [23.0, 25.46], [29.0, 29.37], [31.0, 34.55], [36.0, 36.09], [39.0, 112.16], [114.0, 118.05]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [0.0, 28.13, 0.0, 28.9, 0.0, 0.0, 37.12], "audiomae_on_audioset": [null, [["music", 40.57], ["vehicle", 17.42], ["car", 16.86]], null, [["music", 77.74], ["throbbing", 7.16], ["electronic music", 3.18]], null, null, [["music", 13.5], ["noise", 12.28], ["white noise", 10.47]]], "duration": [1.77, 2.46, 0.37, 3.55, 0.09, 73.16, 4.05]} \ No newline at end of file diff --git a/annotations_filtered/jL6oromerXE_filtered.json b/annotations_filtered/jL6oromerXE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e5da45210b57be325a91a5bd52cca079acbfd45 --- /dev/null +++ b/annotations_filtered/jL6oromerXE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.33], [0.0, 1.75], [14.0, 18.96], [22.0, 33.4], [39.0, 41.45], [42.0, 46.11], [48.0, 48.36], [50.0, 51.44], [53.0, 55.54], [66.0, 66.26], [68.0, 68.49], [88.0, 88.67], [97.0, 98.69], [102.0, 106.56]], "keep_status": [false, false, false, true, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.02, 32.18, 34.0, 32.19, 0.0, 0.0, 43.1, 0.0, 0.0, 0.0, 0.0, 99.44], "audiomae_on_audioset": [null, null, [["speech", 61.07], ["vehicle", 9.91], ["aircraft", 4.79]], [["cattle, bovinae", 35.22], ["livestock, farm animals, working animals", 20.82], ["moo", 13.79]], [["speech", 29.4], ["music", 26.18], ["cattle, bovinae", 3.9]], [["cattle, bovinae", 38.03], ["moo", 21.96], ["livestock, farm animals, working animals", 9.38]], null, null, [["throbbing", 62.84], ["hum", 19.74], ["mains hum", 2.29]], null, null, null, null, null], "duration": [0.33, 1.75, 4.96, 11.4, 2.45, 4.11, 0.36, 1.44, 2.54, 0.26, 0.49, 0.67, 1.69, 4.56]} \ No newline at end of file diff --git a/annotations_filtered/jL6rrLaw6rc_filtered.json b/annotations_filtered/jL6rrLaw6rc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13c2923b02724eeea9a062ad0698bb2da3482a54 --- /dev/null +++ b/annotations_filtered/jL6rrLaw6rc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.19], [9.0, 17.96], [18.0, 33.56], [37.0, 38.55], [42.0, 41.99], [48.0, 48.63], [50.0, 65.82], [67.0, 69.4], [72.0, 74.02], [75.0, 90.29], [91.0, 92.2], [93.0, 93.39], [94.0, 103.77], [104.0, 140.68], [142.0, 142.69], [146.0, 155.7], [158.0, 163.78], [165.0, 170.77]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 43.66, 45.85, 0.0, 0.0, 0.0, 54.7, 92.64, 92.15, 77.87, 0.0, 0.0, 59.68, 0.0, 0.0, 46.12, 72.01, 85.17], "audiomae_on_audioset": [null, [["hum", 29.69], ["music", 25.01], ["throbbing", 24.92]], [["music", 20.3], ["speech", 13.84], ["theremin", 9.75]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 58.43], ["ambient music", 11.64], ["hum", 3.28]], null, null], "duration": [1.19, 8.96, 15.56, 1.55, -0.01, 0.63, 15.82, 2.4, 2.02, 15.29, 1.2, 0.39, 9.77, 36.68, 0.69, 9.7, 5.78, 5.77]} \ No newline at end of file diff --git a/annotations_filtered/jLPtdXAVuwo_filtered.json b/annotations_filtered/jLPtdXAVuwo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5dfa382a454e7d2a7f5087d1f271fe147d52760f --- /dev/null +++ b/annotations_filtered/jLPtdXAVuwo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 19.99], [21.0, 21.24], [32.0, 33.03], [34.0, 38.8], [88.0, 88.53], [98.0, 99.39]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.96, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 29.78], ["boing", 17.33], ["speech", 10.71]], null, null], "duration": [-0.01, 0.24, 1.03, 4.8, 0.53, 1.39]} \ No newline at end of file diff --git a/annotations_filtered/jLo7tHDHgOc_filtered.json b/annotations_filtered/jLo7tHDHgOc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c06aa7f9ff78ed1e6e5a201946e807c7f477e904 --- /dev/null +++ b/annotations_filtered/jLo7tHDHgOc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.6], [15.0, 15.03], [16.0, 16.95], [19.0, 19.01], [20.0, 20.61], [22.0, 22.32], [40.0, 40.83], [42.0, 42.55], [43.0, 43.11], [48.0, 48.36], [50.0, 49.96], [52.0, 54.3], [55.0, 68.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [56.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.89, 74.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.6, 0.03, 0.95, 0.01, 0.61, 0.32, 0.83, 0.55, 0.11, 0.36, -0.04, 2.3, 13.84]} \ No newline at end of file diff --git a/annotations_filtered/jLvu6WNWzKg_filtered.json b/annotations_filtered/jLvu6WNWzKg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1534163e4e8f81d83eb48b0836000ebcb8a28944 --- /dev/null +++ b/annotations_filtered/jLvu6WNWzKg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.19], [11.0, 10.91], [14.0, 13.81], [18.0, 18.59], [21.0, 21.37], [29.0, 29.74], [37.0, 38.48], [39.0, 41.17], [42.0, 43.33], [46.0, 47.34], [49.0, 49.77], [51.0, 54.18], [55.0, 56.83], [59.0, 59.26], [62.0, 63.21], [73.0, 74.56], [77.0, 82.73], [90.0, 89.88], [91.0, 91.49], [94.0, 94.26], [95.0, 95.47], [101.0, 106.14], [107.0, 107.49], [108.0, 108.85], [111.0, 111.28], [116.0, 116.06], [117.0, 117.85], [119.0, 120.01], [123.0, 122.99], [128.0, 131.85], [132.0, 132.7], [151.0, 165.01], [165.0, 166.97]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.44, 0.0, 0.0, 0.0, 34.75, 0.0, 0.0, 0.0, 0.0, 37.98, 0.0, 0.0, 0.0, 0.0, 30.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.0, 0.0, 31.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 30.83], ["speech", 15.68], ["didgeridoo", 10.92]], null, null, null, [["hum", 45.79], ["mains hum", 35.01], ["throbbing", 8.77]], null, null, null, null, [["throbbing", 38.76], ["hum", 24.56], ["music", 11.29]], null, null, null, null, [["music", 41.01], ["throbbing", 14.42], ["didgeridoo", 9.09]], null, null, null, null, null, null, null, [["music", 34.81], ["speech", 17.61], ["hum", 12.99]], null, [["music", 60.07], ["thunk", 9.69], ["whack, thwack", 2.95]], null], "duration": [0.19, -0.09, -0.19, 0.59, 0.37, 0.74, 1.48, 2.17, 1.33, 1.34, 0.77, 3.18, 1.83, 0.26, 1.21, 1.56, 5.73, -0.12, 0.49, 0.26, 0.47, 5.14, 0.49, 0.85, 0.28, 0.06, 0.85, 1.01, -0.01, 3.85, 0.7, 14.01, 1.97]} \ No newline at end of file diff --git a/annotations_filtered/jM7Eou4bV-Q_filtered.json b/annotations_filtered/jM7Eou4bV-Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b3a680dfeae75ffa4a5e7351a7ad83dff05b611 --- /dev/null +++ b/annotations_filtered/jM7Eou4bV-Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 31.75], [37.0, 75.52], [90.0, 105.26], [105.0, 114.37], [115.0, 115.79], [117.0, 129.9], [132.0, 131.79], [133.0, 136.14], [138.0, 139.9]], "keep_status": [false, false, true, false, false, true, false, false, false], "silence_prob": [65.55, 0.0, 36.28, 39.07, 0.0, 33.45, 0.0, 71.29, 0.0], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 31.69], ["livestock, farm animals, working animals", 20.87], ["moo", 14.8]], [["moo", 29.11], ["cattle, bovinae", 25.93], ["livestock, farm animals, working animals", 24.88]], null, [["whack, thwack", 19.19], ["groan", 14.1], ["thump, thud", 13.54]], null, null, null], "duration": [2.75, 38.52, 15.26, 9.37, 0.79, 12.9, -0.21, 3.14, 1.9]} \ No newline at end of file diff --git a/annotations_filtered/jME-000LFNY_filtered.json b/annotations_filtered/jME-000LFNY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3541c4d182678a39960ba598cae60b009e0ea8dc --- /dev/null +++ b/annotations_filtered/jME-000LFNY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.26], [16.0, 16.93], [32.0, 32.24], [36.0, 36.8], [54.0, 56.64], [63.0, 63.76], [67.0, 73.31], [77.0, 77.67], [92.0, 91.98], [93.0, 93.97]], "keep_status": [false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.15, 0.0, 34.77, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 49.93], ["speech", 6.94], ["didgeridoo", 2.72]], null, [["music", 37.41], ["throbbing", 21.56], ["fly, housefly", 11.19]], null, null, null], "duration": [0.26, 0.93, 0.24, 0.8, 2.64, 0.76, 6.31, 0.67, -0.02, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/jMTT0LW0M_Y_filtered.json b/annotations_filtered/jMTT0LW0M_Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1d12e2fffd5667ec8bdf27b94683af207549da1 --- /dev/null +++ b/annotations_filtered/jMTT0LW0M_Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.35], [8.0, 9.71], [10.0, 9.83], [10.0, 10.96], [12.0, 12.24], [14.0, 16.82], [17.0, 19.16], [20.0, 20.73], [21.0, 26.52], [28.0, 29.29], [30.0, 32.02], [34.0, 35.24], [37.0, 38.74], [41.0, 42.84], [44.0, 45.67], [47.0, 49.18], [53.0, 59.04], [67.0, 72.55], [75.0, 77.11], [80.0, 80.49], [81.0, 82.11], [86.0, 87.39], [90.0, 90.81], [93.0, 93.56], [97.0, 98.25], [100.0, 100.53], [102.0, 102.54], [103.0, 103.84], [105.0, 106.49], [107.0, 108.33], [111.0, 114.45], [117.0, 129.88]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [73.21, 0.0, 0.0, 0.0, 0.0, 92.97, 90.08, 0.0, 38.94, 0.0, 75.07, 0.0, 0.0, 0.0, 0.0, 31.5, 29.7, 41.64, 99.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.88, 31.26], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["hum", 25.06], ["mains hum", 18.81], ["music", 14.14]], null, null, null, null, null, null, [["music", 31.53], ["brass instrument", 11.51], ["trombone", 10.67]], [["music", 37.66], ["trombone", 12.71], ["brass instrument", 12.57]], [["music", 39.28], ["theremin", 32.22], ["musical instrument", 4.79]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 88.37], ["music", 8.86], ["synthesizer", 0.49]]], "duration": [3.35, 1.71, -0.17, 0.96, 0.24, 2.82, 2.16, 0.73, 5.52, 1.29, 2.02, 1.24, 1.74, 1.84, 1.67, 2.18, 6.04, 5.55, 2.11, 0.49, 1.11, 1.39, 0.81, 0.56, 1.25, 0.53, 0.54, 0.84, 1.49, 1.33, 3.45, 12.88]} \ No newline at end of file diff --git a/annotations_filtered/jMaeuWl4qHM_filtered.json b/annotations_filtered/jMaeuWl4qHM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4be39142177c1747604d3dd4f2b148170147c170 --- /dev/null +++ b/annotations_filtered/jMaeuWl4qHM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 30.23], [40.0, 41.47], [43.0, 48.83], [55.0, 57.79], [64.0, 69.84], [71.0, 75.03], [77.0, 83.1], [86.0, 94.9], [95.0, 100.58]], "keep_status": [false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.46, 48.02, 58.89, 33.41, 59.59, 41.93, 35.61], "audiomae_on_audioset": [null, null, [["music", 24.03], ["insect", 15.41], ["fly, housefly", 14.87]], [["music", 31.47], ["speech", 29.97], ["didgeridoo", 4.06]], null, [["music", 32.98], ["speech", 30.35], ["ice cream truck, ice cream van", 6.88]], null, [["hum", 48.42], ["mains hum", 35.53], ["buzz", 2.96]], [["speech", 54.51], ["hum", 15.26], ["horse", 3.69]]], "duration": [1.23, 1.47, 5.83, 2.79, 5.84, 4.03, 6.1, 8.9, 5.58]} \ No newline at end of file diff --git a/annotations_filtered/jMqI9UV3ob4_filtered.json b/annotations_filtered/jMqI9UV3ob4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dde8352a3d7c2b391137190cd8395e7b61552b9a --- /dev/null +++ b/annotations_filtered/jMqI9UV3ob4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.64], [20.0, 21.91], [22.0, 22.62], [23.0, 23.9], [27.0, 26.76], [32.0, 33.67], [36.0, 36.61], [37.0, 37.45], [39.0, 42.57], [47.0, 46.9], [48.0, 48.66], [53.0, 53.59], [55.0, 55.29], [61.0, 60.79]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.29, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["whale vocalization", 19.19], ["sidetone", 15.25], ["frog", 7.67]], null, null, null, null, null], "duration": [0.64, 1.91, 0.62, 0.9, -0.24, 1.67, 0.61, 0.45, 3.57, -0.1, 0.66, 0.59, 0.29, -0.21]} \ No newline at end of file diff --git a/annotations_filtered/jMv808xIuwg_filtered.json b/annotations_filtered/jMv808xIuwg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..909e66401a01f4fd00e5e822b650a3031c4578b3 --- /dev/null +++ b/annotations_filtered/jMv808xIuwg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 63.98], [65.0, 91.35]], "keep_status": [false, false], "silence_prob": [0.0, 29.47], "audiomae_on_audioset": [null, [["music", 63.79], ["speech", 8.73], ["throbbing", 3.61]]], "duration": [55.98, 26.35]} \ No newline at end of file diff --git a/annotations_filtered/jMvR4K4QICQ_filtered.json b/annotations_filtered/jMvR4K4QICQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..028dd8f5d45776bf20914352031c38965bc2d84b --- /dev/null +++ b/annotations_filtered/jMvR4K4QICQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 15.42], [17.0, 27.82], [32.0, 33.37], [35.0, 38.6], [41.0, 43.41], [44.0, 44.98], [46.0, 51.73], [52.0, 52.89], [54.0, 55.14], [56.0, 57.89], [59.0, 59.73], [60.0, 63.59], [65.0, 121.66], [123.0, 123.48], [126.0, 144.96], [146.0, 164.74], [165.0, 165.18]], "keep_status": [false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.77, 38.76, 0.0, 33.3, 44.96, 0.0, 28.71, 0.0, 0.0, 0.0, 0.0, 29.98, 0.0, 0.0, 28.52, 28.57, 0.0], "audiomae_on_audioset": [[["music", 40.88], ["hum", 27.09], ["throbbing", 13.31]], [["music", 69.3], ["hum", 2.72], ["scary music", 2.51]], null, [["music", 26.97], ["hum", 20.43], ["shuffling cards", 11.84]], [["music", 38.77], ["hum", 14.81], ["mains hum", 8.52]], null, [["music", 44.1], ["speech", 6.46], ["whack, thwack", 5.6]], null, null, null, null, [["speech", 50.42], ["music", 16.33], ["sidetone", 8.17]], null, null, [["music", 69.09], ["speech", 5.37], ["electric shaver, electric razor", 4.88]], [["music", 62.65], ["groan", 7.11], ["whack, thwack", 5.32]], null], "duration": [14.42, 10.82, 1.37, 3.6, 2.41, 0.98, 5.73, 0.89, 1.14, 1.89, 0.73, 3.59, 56.66, 0.48, 18.96, 18.74, 0.18]} \ No newline at end of file diff --git a/annotations_filtered/jMxYv05A7B0_filtered.json b/annotations_filtered/jMxYv05A7B0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de058c46c4b965c95ee0b186877a1af5bedee7da --- /dev/null +++ b/annotations_filtered/jMxYv05A7B0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.8], [6.0, 6.57], [11.0, 12.99], [17.0, 17.58], [18.0, 18.17], [27.0, 27.04], [35.0, 36.26], [38.0, 38.33], [41.0, 41.05], [51.0, 51.41], [66.0, 66.82], [73.0, 73.84], [76.0, 77.19], [78.0, 81.16], [84.0, 85.45], [86.0, 87.24], [88.0, 89.61], [91.0, 91.1], [91.0, 92.94], [96.0, 96.7], [97.0, 98.41], [105.0, 105.87], [114.0, 115.25], [119.0, 120.38], [121.0, 122.98], [124.0, 125.76], [127.0, 130.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.8, 0.57, 1.99, 0.58, 0.17, 0.04, 1.26, 0.33, 0.05, 0.41, 0.82, 0.84, 1.19, 3.16, 1.45, 1.24, 1.61, 0.1, 1.94, 0.7, 1.41, 0.87, 1.25, 1.38, 1.98, 1.76, 3.82]} \ No newline at end of file diff --git a/annotations_filtered/jNN6FI1Gcr8_filtered.json b/annotations_filtered/jNN6FI1Gcr8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c47817c6385d5d2e33a095cfc6cd5392ff52fa0f --- /dev/null +++ b/annotations_filtered/jNN6FI1Gcr8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.09], [19.0, 19.77], [22.0, 22.4], [27.0, 28.75], [30.0, 30.33], [41.0, 41.49], [43.0, 44.66], [45.0, 45.89], [47.0, 47.49], [53.0, 53.15], [55.0, 55.44], [57.0, 58.29], [61.0, 62.63], [67.0, 68.3], [80.0, 80.3], [93.0, 93.66], [96.0, 97.33], [98.0, 110.12], [112.0, 113.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.97, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.09, 0.77, 0.4, 1.75, 0.33, 0.49, 1.66, 0.89, 0.49, 0.15, 0.44, 1.29, 1.63, 1.3, 0.3, 0.66, 1.33, 12.12, 1.24]} \ No newline at end of file diff --git a/annotations_filtered/jNNX5a8ogr8_filtered.json b/annotations_filtered/jNNX5a8ogr8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92c9efe97be7af0e7560818d3b215f2efeb40460 --- /dev/null +++ b/annotations_filtered/jNNX5a8ogr8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 64.56], [66.0, 95.99], [100.0, 105.33], [109.0, 111.81], [114.0, 116.87], [120.0, 121.91], [123.0, 129.07], [130.0, 140.95], [146.0, 149.17], [151.0, 163.14], [164.0, 165.96], [168.0, 168.62], [169.0, 171.68]], "keep_status": [false, false, true, false, true, false, true, false, true, true, false, false, true], "silence_prob": [0.0, 32.37, 42.22, 59.68, 45.95, 0.0, 38.62, 36.18, 34.82, 34.48, 0.0, 0.0, 48.06], "audiomae_on_audioset": [null, [["music", 79.73], ["theremin", 8.76], ["musical instrument", 1.07]], [["music", 45.62], ["theremin", 9.62], ["hum", 6.41]], null, [["music", 41.91], ["synthesizer", 9.58], ["didgeridoo", 8.31]], null, [["music", 43.6], ["electronic music", 12.8], ["whale vocalization", 8.75]], [["theremin", 62.29], ["music", 19.73], ["musical instrument", 2.53]], [["music", 26.85], ["ambient music", 16.39], ["gong", 11.4]], [["music", 28.85], ["ambient music", 22.98], ["hum", 11.04]], null, null, [["music", 45.32], ["electronic music", 11.82], ["ambient music", 7.14]]], "duration": [44.56, 29.99, 5.33, 2.81, 2.87, 1.91, 6.07, 10.95, 3.17, 12.14, 1.96, 0.62, 2.68]} \ No newline at end of file diff --git a/annotations_filtered/jNPBfvcLIMs_filtered.json b/annotations_filtered/jNPBfvcLIMs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0948bac0984dde69213be175659afe14ed36a7e2 --- /dev/null +++ b/annotations_filtered/jNPBfvcLIMs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.05], [5.0, 6.29], [12.0, 15.38], [16.0, 29.2], [31.0, 39.78], [42.0, 58.65], [59.0, 62.5], [64.0, 102.51], [103.0, 103.98], [108.0, 117.31], [119.0, 120.66]], "keep_status": [false, false, true, true, false, true, true, false, false, true, false], "silence_prob": [0.0, 0.0, 28.02, 28.37, 31.79, 28.68, 28.73, 0.0, 0.0, 28.35, 0.0], "audiomae_on_audioset": [null, null, [["music", 59.35], ["sound effect", 3.34], ["boom", 2.56]], [["music", 55.11], ["sound effect", 6.88], ["hum", 3.5]], [["throbbing", 40.15], ["hum", 22.53], ["mains hum", 19.03]], [["music", 40.94], ["hum", 7.51], ["mains hum", 6.41]], [["fly, housefly", 22.08], ["speech", 14.54], ["insect", 11.49]], null, null, [["hum", 25.79], ["mains hum", 16.15], ["music", 14.08]], null], "duration": [1.05, 1.29, 3.38, 13.2, 8.78, 16.65, 3.5, 38.51, 0.98, 9.31, 1.66]} \ No newline at end of file diff --git a/annotations_filtered/jN_ftt-J7S8_filtered.json b/annotations_filtered/jN_ftt-J7S8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2711be9d6e660c8cbb35fbe63983161838ec572 --- /dev/null +++ b/annotations_filtered/jN_ftt-J7S8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.3], [5.0, 7.55], [12.0, 12.8], [17.0, 17.61], [18.0, 22.3], [26.0, 30.94], [32.0, 33.18], [39.0, 39.16], [40.0, 42.06], [43.0, 43.53], [47.0, 50.58], [51.0, 52.52], [53.0, 53.72], [56.0, 56.29], [60.0, 62.16], [65.0, 66.33], [69.0, 70.82], [74.0, 74.17], [75.0, 75.66], [78.0, 78.49], [83.0, 84.75], [86.0, 88.4], [91.0, 92.64], [93.0, 95.76], [98.0, 98.74], [102.0, 102.0], [102.0, 108.65], [110.0, 116.18], [119.0, 119.87]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 65.44, 0.0, 0.0, 54.3, 41.36, 0.0, 0.0, 79.24, 0.0, 61.27, 0.0, 0.0, 0.0, 68.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.13, 0.0, 83.34, 0.0, 0.0, 68.8, 80.29, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 46.57], ["fly, housefly", 8.22], ["insect", 6.63]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.3, 2.55, 0.8, 0.61, 4.3, 4.94, 1.18, 0.16, 2.06, 0.53, 3.58, 1.52, 0.72, 0.29, 2.16, 1.33, 1.82, 0.17, 0.66, 0.49, 1.75, 2.4, 1.64, 2.76, 0.74, 0.0, 6.65, 6.18, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/jOLLiuCk420_filtered.json b/annotations_filtered/jOLLiuCk420_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..110f655b2345675a2714b2f3a4b5e6f1403d217b --- /dev/null +++ b/annotations_filtered/jOLLiuCk420_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 54.7], [56.0, 69.87], [71.0, 71.12], [72.0, 72.67], [76.0, 120.78], [126.0, 135.7]], "keep_status": [false, true, false, false, false, false], "silence_prob": [0.0, 30.36, 0.0, 0.0, 0.0, 39.75], "audiomae_on_audioset": [null, [["music", 29.01], ["buzz", 20.62], ["rumble", 16.36]], null, null, null, [["music", 57.18], ["musical instrument", 8.02], ["brass instrument", 6.36]]], "duration": [48.7, 13.87, 0.12, 0.67, 44.78, 9.7]} \ No newline at end of file diff --git a/annotations_filtered/jP8dC8E6Emk_filtered.json b/annotations_filtered/jP8dC8E6Emk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74a400109a7c9e146d9f559884a3abe64096ab3d --- /dev/null +++ b/annotations_filtered/jP8dC8E6Emk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.49], [6.0, 10.81], [13.0, 15.18], [17.0, 18.79], [22.0, 22.71], [24.0, 24.87], [26.0, 27.23], [34.0, 36.58], [39.0, 43.39]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 52.16, 50.61, 0.0, 0.0, 0.0, 0.0, 40.24, 40.31], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 84.52], ["ambient music", 4.72], ["synthesizer", 2.4]], [["music", 61.52], ["musical instrument", 5.35], ["mains hum", 4.93]]], "duration": [0.49, 4.81, 2.18, 1.79, 0.71, 0.87, 1.23, 2.58, 4.39]} \ No newline at end of file diff --git a/annotations_filtered/jPF_mENo1Fw_filtered.json b/annotations_filtered/jPF_mENo1Fw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9477a434d926132633456281446762bd0f654fb4 --- /dev/null +++ b/annotations_filtered/jPF_mENo1Fw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.02], [20.0, 22.06], [24.0, 26.37], [27.0, 27.35], [29.0, 32.05], [34.0, 35.06], [36.0, 38.47], [45.0, 49.05], [50.0, 53.4], [54.0, 57.06], [63.0, 77.84], [79.0, 84.15], [86.0, 91.18], [92.0, 100.36], [102.0, 103.84], [105.0, 117.95], [122.0, 122.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 100.0, 0.0, 100.0, 0.0, 99.36, 100.0, 100.0, 100.0, 100.0, 100.0, 100.0, 100.0, 0.0, 99.99, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.02, 2.06, 2.37, 0.35, 3.05, 1.06, 2.47, 4.05, 3.4, 3.06, 14.84, 5.15, 5.18, 8.36, 1.84, 12.95, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/jPH8I5QWFUU_filtered.json b/annotations_filtered/jPH8I5QWFUU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54c130451b48ba9ab3abb8c10f5bdf3901d9cb6a --- /dev/null +++ b/annotations_filtered/jPH8I5QWFUU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 25.91], [26.0, 28.58], [31.0, 34.32], [35.0, 35.63], [36.0, 54.28], [56.0, 56.44], [65.0, 72.71], [75.0, 75.54], [79.0, 94.66]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [40.93, 58.64, 52.86, 0.0, 33.4, 0.0, 36.87, 0.0, 39.12], "audiomae_on_audioset": [[["music", 68.97], ["synthesizer", 4.01], ["musical instrument", 3.25]], null, null, null, [["music", 57.98], ["hum", 11.29], ["rumble", 4.96]], null, [["hum", 36.59], ["mains hum", 29.48], ["music", 13.1]], null, [["music", 74.67], ["musical instrument", 3.37], ["synthesizer", 2.78]]], "duration": [2.91, 2.58, 3.32, 0.63, 18.28, 0.44, 7.71, 0.54, 15.66]} \ No newline at end of file diff --git a/annotations_filtered/jPRiyRmsLBo_filtered.json b/annotations_filtered/jPRiyRmsLBo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..988571a8317384a7efa81a4e5b98f2f9dae06807 --- /dev/null +++ b/annotations_filtered/jPRiyRmsLBo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.88], [4.0, 4.19], [6.0, 6.59], [8.0, 8.24], [11.0, 13.02], [13.0, 15.18], [17.0, 19.48], [20.0, 20.56], [24.0, 24.81], [26.0, 26.49], [31.0, 31.46], [35.0, 35.92], [37.0, 41.03], [42.0, 47.16], [49.0, 50.58], [52.0, 52.69], [56.0, 56.94], [60.0, 61.28], [65.0, 66.06], [69.0, 69.16], [71.0, 72.22], [74.0, 75.05], [76.0, 77.16], [82.0, 82.98], [85.0, 86.02], [87.0, 88.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 97.0, 57.81, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.88, 41.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 83.75], ["telephone", 5.7], ["radio", 1.96]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.88, 0.19, 0.59, 0.24, 2.02, 2.18, 2.48, 0.56, 0.81, 0.49, 0.46, 0.92, 4.03, 5.16, 1.58, 0.69, 0.94, 1.28, 1.06, 0.16, 1.22, 1.05, 1.16, 0.98, 1.02, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/jPSjDk0CM68_filtered.json b/annotations_filtered/jPSjDk0CM68_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..905502bf37b997d833a4a8d678c2a1ed3354fe42 --- /dev/null +++ b/annotations_filtered/jPSjDk0CM68_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 28.44], [31.0, 31.48], [35.0, 93.29], [94.0, 94.8], [98.0, 99.15], [103.0, 104.11], [106.0, 106.39], [109.0, 110.29], [112.0, 112.78], [114.0, 114.32], [118.0, 118.52], [119.0, 121.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52], "audiomae_on_audioset": [[["music", 57.8], ["speech", 15.23], ["musical instrument", 4.53]], null, null, null, null, null, null, null, null, null, null, null], "duration": [13.44, 0.48, 58.29, 0.8, 1.15, 1.11, 0.39, 1.29, 0.78, 0.32, 0.52, 2.02]} \ No newline at end of file diff --git a/annotations_filtered/jPf2y2QGoJw_filtered.json b/annotations_filtered/jPf2y2QGoJw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e586898c4f35cb8c280b44ace915b3c428e3dbb --- /dev/null +++ b/annotations_filtered/jPf2y2QGoJw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.07], [4.0, 5.78], [7.0, 8.58], [10.0, 10.69], [12.0, 12.53], [13.0, 13.59], [15.0, 16.68], [26.0, 26.27], [37.0, 39.58], [43.0, 43.31], [44.0, 45.49], [46.0, 46.6], [49.0, 49.3], [51.0, 51.44], [55.0, 55.07], [57.0, 57.47], [64.0, 81.63], [82.0, 92.35], [94.0, 94.58], [97.0, 97.33], [98.0, 98.64], [99.0, 99.82], [102.0, 113.7], [120.0, 121.71], [124.0, 124.34], [125.0, 125.61], [128.0, 129.22], [130.0, 131.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.49, 93.45, 0.0, 0.0, 0.0, 0.0, 30.36, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 70.85], ["speech", 6.88], ["effects unit", 3.34]], null, null, null, null, null, [["music", 38.18], ["speech", 23.81], ["tap", 10.69]], null, null, null, null, null], "duration": [0.07, 1.78, 1.58, 0.69, 0.53, 0.59, 1.68, 0.27, 2.58, 0.31, 1.49, 0.6, 0.3, 0.44, 0.07, 0.47, 17.63, 10.35, 0.58, 0.33, 0.64, 0.82, 11.7, 1.71, 0.34, 0.61, 1.22, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/jPfje0jZeMo_filtered.json b/annotations_filtered/jPfje0jZeMo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73211c8aa9bc414532e4e3706cd8e01de75eb7c6 --- /dev/null +++ b/annotations_filtered/jPfje0jZeMo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.97], [8.0, 9.63], [22.0, 24.75], [32.0, 32.97], [42.0, 57.23], [59.0, 64.69], [66.0, 66.26], [67.0, 67.98], [70.0, 70.19], [72.0, 72.57], [77.0, 77.63], [79.0, 81.09], [88.0, 89.19], [93.0, 102.66], [106.0, 106.42], [108.0, 108.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 48.31, 0.0, 41.3, 55.67, 0.0, 0.0, 0.0, 0.0, 0.0, 81.35, 0.0, 33.12, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 60.92], ["synthesizer", 11.63], ["musical instrument", 4.19]], null, [["music", 62.0], ["musical instrument", 8.8], ["theremin", 7.0]], null, null, null, null, null, null, null, null, [["music", 62.76], ["breaking", 5.97], ["speech", 5.88]], null, null], "duration": [1.97, 1.63, 2.75, 0.97, 15.23, 5.69, 0.26, 0.98, 0.19, 0.57, 0.63, 2.09, 1.19, 9.66, 0.42, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/jPgV4d4ZmZo_filtered.json b/annotations_filtered/jPgV4d4ZmZo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3be9d245f41585fd9a23887ddd0d6b36e34075d6 --- /dev/null +++ b/annotations_filtered/jPgV4d4ZmZo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.65], [10.0, 10.86], [13.0, 14.15], [22.0, 24.36], [26.0, 26.77], [28.0, 28.88], [31.0, 31.23], [36.0, 36.61], [37.0, 37.72], [40.0, 39.92], [42.0, 43.43], [44.0, 44.37], [45.0, 52.86], [54.0, 55.44], [57.0, 57.79], [59.0, 61.38], [68.0, 69.2], [72.0, 73.57], [77.0, 78.06], [82.0, 82.46], [93.0, 96.06], [102.0, 101.68], [103.0, 103.45], [112.0, 112.7], [114.0, 115.13], [121.0, 121.09], [125.0, 125.76], [126.0, 127.03], [128.0, 128.56], [130.0, 130.98], [132.0, 132.83], [133.0, 134.25], [136.0, 137.79], [138.0, 140.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.65, 0.86, 1.15, 2.36, 0.77, 0.88, 0.23, 0.61, 0.72, -0.08, 1.43, 0.37, 7.86, 1.44, 0.79, 2.38, 1.2, 1.57, 1.06, 0.46, 3.06, -0.32, 0.45, 0.7, 1.13, 0.09, 0.76, 1.03, 0.56, 0.98, 0.83, 1.25, 1.79, 2.17]} \ No newline at end of file diff --git a/annotations_filtered/jPsXJlylRvs_filtered.json b/annotations_filtered/jPsXJlylRvs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5aa02179424571d9e2c40097e166f4ad2cef9f38 --- /dev/null +++ b/annotations_filtered/jPsXJlylRvs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.82], [11.0, 11.15], [12.0, 13.31], [14.0, 15.23], [16.0, 18.57], [19.0, 20.22], [21.0, 21.39], [23.0, 23.16], [24.0, 32.83], [36.0, 37.35], [39.0, 40.91], [41.0, 42.21], [45.0, 50.38], [52.0, 52.49], [53.0, 53.38], [56.0, 55.97], [64.0, 64.25], [66.0, 67.19], [68.0, 68.3], [69.0, 69.85], [70.0, 71.2], [72.0, 73.06], [74.0, 74.34], [75.0, 76.13], [77.0, 77.01], [78.0, 78.49], [79.0, 80.69], [85.0, 85.99], [88.0, 88.13], [90.0, 92.92], [103.0, 104.79], [105.0, 106.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 71.29, 0.0, 0.0, 0.0, 59.33, 0.0, 0.0, 0.0, 34.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.63, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.08], ["hum", 10.24], ["synthesizer", 9.76]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.82, 0.15, 1.31, 1.23, 2.57, 1.22, 0.39, 0.16, 8.83, 1.35, 1.91, 1.21, 5.38, 0.49, 0.38, -0.03, 0.25, 1.19, 0.3, 0.85, 1.2, 1.06, 0.34, 1.13, 0.01, 0.49, 1.69, 0.99, 0.13, 2.92, 1.79, 1.76]} \ No newline at end of file diff --git a/annotations_filtered/jQ903giVNAg_filtered.json b/annotations_filtered/jQ903giVNAg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9413fd481b1dc316e6493273d8a7df439e7a5efb --- /dev/null +++ b/annotations_filtered/jQ903giVNAg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.36], [25.0, 25.29], [27.0, 27.58], [29.0, 30.32], [32.0, 32.93], [35.0, 36.71], [38.0, 39.07], [40.0, 40.34], [45.0, 46.06], [51.0, 52.07], [55.0, 55.58], [56.0, 56.35], [59.0, 59.51], [61.0, 61.74], [63.0, 64.02], [66.0, 66.9], [70.0, 70.41], [73.0, 74.12], [75.0, 75.63], [77.0, 77.62], [80.0, 80.57], [85.0, 86.04], [89.0, 89.78], [91.0, 92.01], [96.0, 95.91], [97.0, 98.64], [99.0, 100.04], [101.0, 102.64], [108.0, 108.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.36, 0.29, 0.58, 1.32, 0.93, 1.71, 1.07, 0.34, 1.06, 1.07, 0.58, 0.35, 0.51, 0.74, 1.02, 0.9, 0.41, 1.12, 0.63, 0.62, 0.57, 1.04, 0.78, 1.01, -0.09, 1.64, 1.04, 1.64, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/jQKx2XTcd_I_filtered.json b/annotations_filtered/jQKx2XTcd_I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1fb45b69b5fc218d1558ed6bca3fe4333546185d --- /dev/null +++ b/annotations_filtered/jQKx2XTcd_I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.1], [7.0, 17.61], [19.0, 19.72], [21.0, 22.05], [29.0, 32.81], [35.0, 43.44], [45.0, 49.52], [51.0, 56.42], [61.0, 65.7], [68.0, 70.93], [72.0, 72.64], [73.0, 75.25], [76.0, 80.6], [82.0, 109.56]], "keep_status": [false, false, false, false, true, false, true, false, true, true, false, true, false, false], "silence_prob": [0.0, 59.59, 0.0, 0.0, 38.12, 39.66, 33.16, 34.72, 31.69, 38.31, 0.0, 42.72, 51.99, 31.43], "audiomae_on_audioset": [null, null, null, null, [["speech", 32.33], ["music", 14.54], ["hum", 13.34]], [["fly, housefly", 52.14], ["insect", 13.73], ["speech", 9.54]], [["music", 24.45], ["speech", 15.4], ["thunk", 14.7]], [["music", 51.31], ["speech", 15.91], ["synthesizer", 5.55]], [["music", 36.91], ["throbbing", 9.37], ["hum", 9.25]], [["hum", 19.76], ["mains hum", 12.78], ["fart", 9.71]], null, [["music", 57.07], ["throbbing", 4.67], ["speech", 4.31]], null, [["music", 52.8], ["throbbing", 13.33], ["buzz", 5.01]]], "duration": [1.1, 10.61, 0.72, 1.05, 3.81, 8.44, 4.52, 5.42, 4.7, 2.93, 0.64, 2.25, 4.6, 27.56]} \ No newline at end of file diff --git a/annotations_filtered/jQp4IlURoNg_filtered.json b/annotations_filtered/jQp4IlURoNg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00880e19c37de5037bf98b5c3b53303387b3046b --- /dev/null +++ b/annotations_filtered/jQp4IlURoNg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 29.0], [40.0, 41.4], [44.0, 45.67], [56.0, 62.8], [65.0, 86.58], [94.0, 94.83], [96.0, 97.28], [100.0, 100.7], [102.0, 102.52], [104.0, 107.0], [116.0, 117.49], [125.0, 129.37], [133.0, 133.07]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [30.49, 0.0, 0.0, 31.84, 30.53, 0.0, 0.0, 0.0, 0.0, 33.04, 0.0, 37.33, 0.0], "audiomae_on_audioset": [[["music", 62.85], ["throbbing", 10.5], ["electronic music", 5.59]], null, null, [["music", 48.83], ["speech", 19.63], ["throbbing", 5.34]], [["music", 43.37], ["speech", 34.86], ["electronic music", 5.45]], null, null, null, null, [["music", 29.4], ["hum", 16.64], ["mains hum", 15.02]], null, [["moo", 42.93], ["cattle, bovinae", 29.04], ["livestock, farm animals, working animals", 13.68]], null], "duration": [22.0, 1.4, 1.67, 6.8, 21.58, 0.83, 1.28, 0.7, 0.52, 3.0, 1.49, 4.37, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/jR3JlEXdBIo_filtered.json b/annotations_filtered/jR3JlEXdBIo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57b23b506213f49f6127cbfb6c8214923a8a3cc0 --- /dev/null +++ b/annotations_filtered/jR3JlEXdBIo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.96], [18.0, 19.13], [22.0, 23.3], [27.0, 40.29], [40.0, 40.32], [42.0, 42.6], [54.0, 73.92], [76.0, 85.38], [93.0, 98.59], [108.0, 113.85], [116.0, 119.96], [121.0, 124.7], [128.0, 130.84], [132.0, 134.08], [139.0, 139.85], [140.0, 141.15], [147.0, 148.49], [150.0, 154.11], [156.0, 158.06], [161.0, 176.35], [176.0, 176.88], [178.0, 178.44]], "keep_status": [true, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, true, true, true, false, false], "silence_prob": [32.77, 0.0, 0.0, 31.12, 0.0, 0.0, 29.51, 32.43, 30.23, 35.76, 35.64, 39.17, 58.38, 78.89, 0.0, 0.0, 0.0, 32.27, 34.16, 29.26, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 36.39], ["thunk", 11.0], ["door", 6.61]], null, null, [["music", 71.68], ["didgeridoo", 4.86], ["speech", 2.54]], null, null, [["speech", 45.54], ["groan", 16.88], ["music", 5.98]], [["cattle, bovinae", 31.24], ["livestock, farm animals, working animals", 26.26], ["moo", 16.18]], [["hum", 21.29], ["speech", 19.29], ["music", 15.85]], [["hum", 47.56], ["music", 18.62], ["mains hum", 14.36]], [["music", 54.75], ["mains hum", 14.11], ["hum", 13.56]], [["speech", 69.78], ["vehicle", 4.79], ["snicker", 2.4]], null, null, null, null, null, [["grunt", 26.72], ["groan", 26.56], ["speech", 8.22]], [["music", 30.53], ["hum", 14.19], ["mains hum", 7.88]], [["music", 21.23], ["electric shaver, electric razor", 13.13], ["mains hum", 10.75]], null, null], "duration": [2.96, 1.13, 1.3, 13.29, 0.32, 0.6, 19.92, 9.38, 5.59, 5.85, 3.96, 3.7, 2.84, 2.08, 0.85, 1.15, 1.49, 4.11, 2.06, 15.35, 0.88, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/jRRY7zgE4K8_filtered.json b/annotations_filtered/jRRY7zgE4K8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f066f8cc6283b122ca6699236ca11c582da57d9 --- /dev/null +++ b/annotations_filtered/jRRY7zgE4K8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.34], [4.0, 5.63], [6.0, 15.6], [21.0, 35.29], [39.0, 39.5], [45.0, 45.4], [47.0, 47.33], [48.0, 48.47], [49.0, 48.91], [49.0, 49.64], [51.0, 50.85], [53.0, 53.06], [54.0, 56.46], [58.0, 58.04], [60.0, 60.86], [69.0, 69.11], [72.0, 72.12], [74.0, 73.85], [77.0, 77.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 61.87, 31.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 44.62], ["effects unit", 29.87], ["distortion", 5.62]], null, null, null, null, null, null, null, null, [["stomach rumble", 16.05], ["throbbing", 15.01], ["noise", 6.16]], null, null, null, null, null, null], "duration": [1.34, 1.63, 9.6, 14.29, 0.5, 0.4, 0.33, 0.47, -0.09, 0.64, -0.15, 0.06, 2.46, 0.04, 0.86, 0.11, 0.12, -0.15, 0.26]} \ No newline at end of file diff --git a/annotations_filtered/jRSw_0zpNE8_filtered.json b/annotations_filtered/jRSw_0zpNE8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae19ef4154956fc906428e188392ece9745e6568 --- /dev/null +++ b/annotations_filtered/jRSw_0zpNE8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.77], [5.0, 5.49], [6.0, 8.46], [9.0, 11.94], [13.0, 16.48], [17.0, 21.63], [22.0, 22.47], [23.0, 31.56], [33.0, 34.53], [36.0, 38.25], [40.0, 41.76], [43.0, 43.9], [45.0, 48.96], [50.0, 52.1], [54.0, 56.51], [57.0, 67.39], [71.0, 76.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 99.71, 100.0, 82.79, 100.0, 0.0, 99.84, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 76.2, 90.95, 49.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 26.24], ["singing bowl", 14.14], ["mains hum", 13.12]]], "duration": [0.77, 0.49, 2.46, 2.94, 3.48, 4.63, 0.47, 8.56, 1.53, 2.25, 1.76, 0.9, 3.96, 2.1, 2.51, 10.39, 5.5]} \ No newline at end of file diff --git a/annotations_filtered/jRYdVUtQs-8_filtered.json b/annotations_filtered/jRYdVUtQs-8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f85b314c18643b2c631cf6f94007796045aceef --- /dev/null +++ b/annotations_filtered/jRYdVUtQs-8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.81], [5.0, 5.73], [7.0, 14.81], [15.0, 47.9], [51.0, 52.68]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.95, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["noise", 41.18], ["music", 25.4], ["synthesizer", 7.08]], null, null], "duration": [1.81, 0.73, 7.81, 32.9, 1.68]} \ No newline at end of file diff --git a/annotations_filtered/jR_kxdUm1bc_filtered.json b/annotations_filtered/jR_kxdUm1bc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a84a86042a3e6eeb1b9169052e89bb4c991ff4f6 --- /dev/null +++ b/annotations_filtered/jR_kxdUm1bc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 40.73], [41.0, 41.44], [41.0, 70.55], [73.0, 77.8], [79.0, 79.61], [80.0, 81.36], [82.0, 82.8]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [30.67, 0.0, 30.8, 31.12, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 51.34], ["speech", 18.11], ["electronic music", 5.56]], null, [["hum", 18.48], ["music", 15.08], ["mains hum", 14.58]], [["music", 42.16], ["sidetone", 30.68], ["speech", 7.69]], null, null, null], "duration": [22.73, 0.44, 29.55, 4.8, 0.61, 1.36, 0.8]} \ No newline at end of file diff --git a/annotations_filtered/jS7XOEttewM_filtered.json b/annotations_filtered/jS7XOEttewM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1acc56376abe35c5c6bbcb48a2a776ab4c43589 --- /dev/null +++ b/annotations_filtered/jS7XOEttewM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 32.1], [32.0, 33.91], [35.0, 35.43], [35.0, 35.53], [36.0, 37.66], [39.0, 40.49], [44.0, 44.93], [45.0, 45.3], [47.0, 56.86], [57.0, 58.06], [69.0, 69.9], [72.0, 76.32], [77.0, 84.64], [93.0, 94.42], [96.0, 98.9], [105.0, 106.24], [106.0, 114.34], [115.0, 116.43], [119.0, 120.28], [123.0, 124.01], [127.0, 128.09], [137.0, 141.89], [146.0, 149.91], [152.0, 154.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [75.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.64, 0.0, 0.0, 37.89, 53.4, 0.0, 81.89, 0.0, 49.31, 0.0, 0.0, 0.0, 0.0, 93.6, 95.51, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 42.02], ["livestock, farm animals, working animals", 6.19], ["animal", 4.13]], null, null, null, null, [["noise", 19.29], ["fly, housefly", 16.0], ["speech", 15.05]], null, null, null, null, null, null, null], "duration": [2.1, 1.91, 0.43, 0.53, 1.66, 1.49, 0.93, 0.3, 9.86, 1.06, 0.9, 4.32, 7.64, 1.42, 2.9, 1.24, 8.34, 1.43, 1.28, 1.01, 1.09, 4.89, 3.91, 2.23]} \ No newline at end of file diff --git a/annotations_filtered/jSabMn5UXKo_filtered.json b/annotations_filtered/jSabMn5UXKo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62b5cb4c4c3a8764a44ab1c4d5072515d081f061 --- /dev/null +++ b/annotations_filtered/jSabMn5UXKo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.45], [10.0, 11.62], [20.0, 20.29], [25.0, 24.95], [27.0, 26.7], [36.0, 42.69], [44.0, 44.59], [49.0, 49.84], [65.0, 65.08], [69.0, 69.2], [74.0, 74.65], [75.0, 79.93], [86.0, 88.06], [92.0, 92.92], [94.0, 94.15], [95.0, 99.12], [108.0, 108.58], [111.0, 112.53], [115.0, 121.26], [123.0, 124.43], [126.0, 129.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 40.48, 0.0, 0.0, 0.0, 0.0, 0.0, 49.22, 47.82, 0.0, 0.0, 38.12, 0.0, 0.0, 42.46, 0.0, 75.88], "audiomae_on_audioset": [null, null, null, null, null, [["music", 71.71], ["synthesizer", 3.52], ["reverberation", 2.67]], null, null, null, null, null, [["music", 75.69], ["synthesizer", 10.34], ["musical instrument", 3.92]], [["music", 54.64], ["didgeridoo", 10.65], ["musical instrument", 3.62]], null, null, [["music", 57.09], ["didgeridoo", 12.74], ["speech", 6.76]], null, null, [["music", 46.68], ["synthesizer", 9.7], ["speech", 5.83]], null, null], "duration": [0.45, 1.62, 0.29, -0.05, -0.3, 6.69, 0.59, 0.84, 0.08, 0.2, 0.65, 4.93, 2.06, 0.92, 0.15, 4.12, 0.58, 1.53, 6.26, 1.43, 3.07]} \ No newline at end of file diff --git a/annotations_filtered/jSidQZzJfcc_filtered.json b/annotations_filtered/jSidQZzJfcc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..437f24fe237d22a1eaeecba03c84e23a68802444 --- /dev/null +++ b/annotations_filtered/jSidQZzJfcc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.1], [26.0, 28.22], [41.0, 42.6], [45.0, 46.11], [49.0, 49.18], [50.0, 50.75], [51.0, 52.12], [86.0, 91.66], [94.0, 94.96], [99.0, 99.64], [102.0, 101.95], [102.0, 103.18], [111.0, 111.81], [116.0, 116.85], [119.0, 120.01], [125.0, 125.49], [127.0, 127.18], [136.0, 136.54], [137.0, 137.4], [138.0, 147.09], [148.0, 149.67], [150.0, 151.92], [154.0, 154.3], [157.0, 157.87], [159.0, 159.81], [161.0, 165.01]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 46.15, 0.0, 0.0, 0.0, 0.0, 0.0, 45.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.81, 0.0, 0.0, 0.0, 0.0, 0.0, 45.98], "audiomae_on_audioset": [null, [["music", 44.0], ["speech", 7.61], ["throbbing", 4.43]], null, null, null, null, null, [["speech", 45.34], ["music", 32.65], ["musical instrument", 1.81]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 27.26], ["music", 18.35], ["fly, housefly", 14.17]], null, null, null, null, null, [["music", 47.83], ["speech", 26.5], ["musical instrument", 2.25]]], "duration": [0.1, 2.22, 1.6, 1.11, 0.18, 0.75, 1.12, 5.66, 0.96, 0.64, -0.05, 1.18, 0.81, 0.85, 1.01, 0.49, 0.18, 0.54, 0.4, 9.09, 1.67, 1.92, 0.3, 0.87, 0.81, 4.01]} \ No newline at end of file diff --git a/annotations_filtered/jSnvLrw4YR0_filtered.json b/annotations_filtered/jSnvLrw4YR0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54dbf40ec48cd467c882ffc7dc2c1e2be1060b4c --- /dev/null +++ b/annotations_filtered/jSnvLrw4YR0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.51], [8.0, 9.32], [12.0, 12.58], [17.0, 18.86], [33.0, 34.45], [36.0, 36.86], [42.0, 41.77], [48.0, 49.4], [52.0, 51.85], [56.0, 56.56], [65.0, 65.6], [70.0, 69.97], [73.0, 75.57], [77.0, 77.45], [79.0, 79.61], [80.0, 81.43], [83.0, 83.19], [85.0, 84.82], [92.0, 91.62], [96.0, 96.3], [102.0, 102.02], [103.0, 104.13], [107.0, 108.31], [110.0, 110.25], [114.0, 114.18], [117.0, 118.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.51, 1.32, 0.58, 1.86, 1.45, 0.86, -0.23, 1.4, -0.15, 0.56, 0.6, -0.03, 2.57, 0.45, 0.61, 1.43, 0.19, -0.18, -0.38, 0.3, 0.02, 1.13, 1.31, 0.25, 0.18, 1.13]} \ No newline at end of file diff --git a/annotations_filtered/jT8TUowrkLU_filtered.json b/annotations_filtered/jT8TUowrkLU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..881999f5a2e0e8d04906a9922af9cacb5a7dcc67 --- /dev/null +++ b/annotations_filtered/jT8TUowrkLU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 46.08], [48.0, 71.02], [73.0, 86.32]], "keep_status": [false, false, true], "silence_prob": [30.1, 33.32, 32.09], "audiomae_on_audioset": [[["music", 63.49], ["musical instrument", 4.48], ["didgeridoo", 4.0]], [["music", 62.63], ["theremin", 7.87], ["synthesizer", 4.12]], [["speech", 36.21], ["music", 23.06], ["fart", 8.62]]], "duration": [17.08, 23.02, 13.32]} \ No newline at end of file diff --git a/annotations_filtered/jTHFCMuIrzQ_filtered.json b/annotations_filtered/jTHFCMuIrzQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..301d8902796e90fdd4a75f6bea426e299618c47e --- /dev/null +++ b/annotations_filtered/jTHFCMuIrzQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.37], [20.0, 20.29], [22.0, 22.13], [23.0, 26.11], [28.0, 29.2], [30.0, 32.39], [39.0, 39.6], [45.0, 46.6], [48.0, 48.64], [50.0, 51.76], [52.0, 53.91], [56.0, 58.09], [60.0, 60.4], [61.0, 61.33], [66.0, 67.1], [67.0, 70.23], [73.0, 77.75], [80.0, 81.87], [84.0, 84.87], [86.0, 87.79], [89.0, 89.21], [90.0, 91.96], [93.0, 93.51], [94.0, 96.25], [97.0, 98.19], [99.0, 99.71], [101.0, 102.22], [105.0, 107.03], [108.0, 109.73], [111.0, 118.39], [119.0, 120.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 97.22, 0.0, 44.12, 0.0, 0.0, 0.0, 0.0, 0.0, 99.84, 0.0, 0.0, 0.0, 74.29, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 86.82, 0.0, 99.99, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 59.64], ["cattle, bovinae", 7.77], ["music", 6.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.37, 0.29, 0.13, 3.11, 1.2, 2.39, 0.6, 1.6, 0.64, 1.76, 1.91, 2.09, 0.4, 0.33, 1.1, 3.23, 4.75, 1.87, 0.87, 1.79, 0.21, 1.96, 0.51, 2.25, 1.19, 0.71, 1.22, 2.03, 1.73, 7.39, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/jTRa22j4OUk_filtered.json b/annotations_filtered/jTRa22j4OUk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e3836b496e84bdce6629bad318fa1fb6d7575a0 --- /dev/null +++ b/annotations_filtered/jTRa22j4OUk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 16.83], [17.0, 19.47], [21.0, 22.13], [27.0, 27.14], [37.0, 36.68], [39.0, 39.04], [41.0, 41.62], [47.0, 53.6], [58.0, 60.2], [61.0, 61.87], [63.0, 72.44], [73.0, 76.77], [77.0, 76.84], [77.0, 78.7]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 55.25, 0.0, 0.0, 0.0, 0.0, 0.0, 30.25, 33.85, 0.0, 54.3, 52.1, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["frog", 19.14], ["groan", 16.75], ["insect", 6.94]], [["whale vocalization", 75.58], ["animal", 2.94], ["effects unit", 1.72]], null, null, null, null, null], "duration": [-0.17, 2.47, 1.13, 0.14, -0.32, 0.04, 0.62, 6.6, 2.2, 0.87, 9.44, 3.77, -0.16, 1.7]} \ No newline at end of file diff --git a/annotations_filtered/jTkt23CfSp4_filtered.json b/annotations_filtered/jTkt23CfSp4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..104b50538a4071c9f30e938a82a384e3e5595a87 --- /dev/null +++ b/annotations_filtered/jTkt23CfSp4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 36.49], [38.0, 39.11], [40.0, 48.41], [52.0, 53.82], [62.0, 63.63], [64.0, 65.15], [71.0, 73.3], [83.0, 85.68], [88.0, 89.24], [90.0, 95.25], [98.0, 98.36], [102.0, 103.69], [105.0, 105.27]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 31.19, 0.0, 0.0, 0.0, 68.02, 100.0, 0.0, 46.09, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["mosquito", 52.61], ["fly, housefly", 28.7], ["insect", 6.69]], null, null, null, null, null, null, [["fart", 26.67], ["speech", 22.7], ["noise", 20.3]], null, null, null], "duration": [0.49, 1.11, 8.41, 1.82, 1.63, 1.15, 2.3, 2.68, 1.24, 5.25, 0.36, 1.69, 0.27]} \ No newline at end of file diff --git a/annotations_filtered/jTtTZjp9ViQ_filtered.json b/annotations_filtered/jTtTZjp9ViQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a636690b358af500b52c3a62cf6c46abb74f541 --- /dev/null +++ b/annotations_filtered/jTtTZjp9ViQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.02], [7.0, 9.58], [10.0, 19.89], [21.0, 35.88], [37.0, 44.44], [45.0, 46.41], [47.0, 47.44], [50.0, 104.41], [106.0, 111.75]], "keep_status": [false, true, false, true, true, false, false, false, false], "silence_prob": [95.91, 32.3, 34.37, 38.32, 33.52, 0.0, 0.0, 0.0, 31.25], "audiomae_on_audioset": [null, [["music", 45.96], ["musical instrument", 7.46], ["reverberation", 6.5]], [["music", 46.79], ["speech", 27.62], ["synthesizer", 4.52]], [["music", 56.45], ["hum", 5.64], ["speech", 5.25]], [["music", 49.04], ["hum", 6.61], ["synthesizer", 5.94]], null, null, null, [["speech", 47.41], ["music", 33.71], ["outside, rural or natural", 1.75]]], "duration": [2.02, 2.58, 9.89, 14.88, 7.44, 1.41, 0.44, 54.41, 5.75]} \ No newline at end of file diff --git a/annotations_filtered/jTz_VNAGqog_filtered.json b/annotations_filtered/jTz_VNAGqog_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3edc13eb9f398236a4f38c286e86ca1c7f2964c8 --- /dev/null +++ b/annotations_filtered/jTz_VNAGqog_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.35], [12.0, 15.4], [19.0, 20.01], [21.0, 33.96], [34.0, 34.47], [35.0, 34.94], [36.0, 36.41], [37.0, 41.57], [43.0, 43.36], [48.0, 51.98], [56.0, 56.05], [57.0, 57.28], [58.0, 58.62], [59.0, 70.78], [73.0, 73.52], [82.0, 87.81], [93.0, 94.02], [96.0, 97.17], [100.0, 100.28], [102.0, 108.09], [110.0, 111.84], [114.0, 114.66], [115.0, 116.28], [119.0, 123.77], [126.0, 127.14], [130.0, 130.27], [132.0, 132.43], [134.0, 134.13], [140.0, 140.12], [141.0, 141.03], [145.0, 145.81], [147.0, 147.53], [149.0, 149.82]], "keep_status": [false, false, false, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 64.18, 0.0, 42.26, 0.0, 0.0, 0.0, 41.14, 0.0, 35.91, 0.0, 0.0, 0.0, 32.78, 0.0, 37.27, 0.0, 0.0, 0.0, 47.35, 0.0, 0.0, 0.0, 45.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 24.08], ["glockenspiel", 11.24], ["mallet percussion", 10.46]], null, null, null, [["music", 44.8], ["wind instrument, woodwind instrument", 19.75], ["musical instrument", 5.32]], null, [["music", 41.45], ["musical instrument", 6.72], ["didgeridoo", 5.42]], null, null, null, [["wind instrument, woodwind instrument", 26.84], ["music", 24.69], ["harmonica", 20.37]], null, [["mains hum", 34.12], ["music", 22.21], ["hum", 22.15]], null, null, null, [["music", 35.83], ["tick-tock", 10.58], ["musical instrument", 6.42]], null, null, null, [["music", 68.03], ["theremin", 13.83], ["musical instrument", 1.92]], null, null, null, null, null, null, null, null, null], "duration": [0.35, 3.4, 1.01, 12.96, 0.47, -0.06, 0.41, 4.57, 0.36, 3.98, 0.05, 0.28, 0.62, 11.78, 0.52, 5.81, 1.02, 1.17, 0.28, 6.09, 1.84, 0.66, 1.28, 4.77, 1.14, 0.27, 0.43, 0.13, 0.12, 0.03, 0.81, 0.53, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/jU6nB-uJh68_filtered.json b/annotations_filtered/jU6nB-uJh68_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48cda1da01b53e3c90ae1847866274c790fbb35c --- /dev/null +++ b/annotations_filtered/jU6nB-uJh68_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.21], [4.0, 5.1], [6.0, 6.64], [9.0, 9.15], [12.0, 11.96], [14.0, 14.72], [20.0, 24.73], [26.0, 26.08], [26.0, 27.77], [29.0, 30.72], [32.0, 32.56], [35.0, 36.14], [37.0, 38.89], [40.0, 39.95], [42.0, 45.08], [46.0, 46.2], [48.0, 48.47], [52.0, 52.91], [58.0, 63.44], [64.0, 67.64], [68.0, 68.69], [69.0, 69.67], [72.0, 73.35], [74.0, 75.78], [77.0, 77.33], [79.0, 79.76], [82.0, 82.16], [88.0, 88.13], [94.0, 94.76], [97.0, 96.84], [107.0, 108.4], [110.0, 111.47], [112.0, 113.26], [115.0, 115.75], [118.0, 129.54], [131.0, 153.67], [155.0, 155.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.92, 0.0, 0.0, 0.0, 37.93, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.35, 36.77, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 45.26], ["insect", 30.21], ["mosquito", 4.86]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["radio", 17.65], ["cattle, bovinae", 15.66], ["speech", 14.92]], [["cattle, bovinae", 34.57], ["moo", 30.72], ["livestock, farm animals, working animals", 26.54]], null], "duration": [1.21, 1.1, 0.64, 0.15, -0.04, 0.72, 4.73, 0.08, 1.77, 1.72, 0.56, 1.14, 1.89, -0.05, 3.08, 0.2, 0.47, 0.91, 5.44, 3.64, 0.69, 0.67, 1.35, 1.78, 0.33, 0.76, 0.16, 0.13, 0.76, -0.16, 1.4, 1.47, 1.26, 0.75, 11.54, 22.67, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/jUYCTHwAQvw_filtered.json b/annotations_filtered/jUYCTHwAQvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8c5d9a79697fb27a2df9975d0abffee7b8d4956 --- /dev/null +++ b/annotations_filtered/jUYCTHwAQvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 32.37], [36.0, 73.84], [76.0, 76.59], [88.0, 90.22], [91.0, 94.15], [95.0, 97.53], [100.0, 99.84], [100.0, 100.62], [102.0, 121.95]], "keep_status": [false, false, false, true, true, true, false, false, true], "silence_prob": [31.47, 0.0, 0.0, 39.17, 37.44, 35.74, 0.0, 0.0, 29.74], "audiomae_on_audioset": [[["throbbing", 49.35], ["hum", 36.93], ["music", 3.91]], null, null, [["whale vocalization", 19.25], ["throbbing", 12.68], ["hum", 8.9]], [["breaking", 35.86], ["speech", 14.23], ["hum", 4.96]], [["speech", 19.41], ["eruption", 9.16], ["hum", 6.97]], null, null, [["speech", 19.35], ["explosion", 12.83], ["music", 8.85]]], "duration": [2.37, 37.84, 0.59, 2.22, 3.15, 2.53, -0.16, 0.62, 19.95]} \ No newline at end of file diff --git a/annotations_filtered/jUcER281BOg_filtered.json b/annotations_filtered/jUcER281BOg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a37b6876f6da6e3483a90bfc5211b8092a1840e7 --- /dev/null +++ b/annotations_filtered/jUcER281BOg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.29], [4.0, 4.53], [5.0, 6.71], [9.0, 10.07], [12.0, 12.38], [15.0, 16.34], [19.0, 22.98], [24.0, 24.98], [26.0, 29.12], [31.0, 37.47], [39.0, 39.48], [41.0, 41.07], [44.0, 45.3], [47.0, 47.93], [54.0, 53.59], [54.0, 55.46], [56.0, 57.05], [59.0, 59.32], [62.0, 70.97], [72.0, 73.01], [75.0, 78.14], [80.0, 80.92], [82.0, 82.43], [83.0, 86.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 87.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 0.53, 1.71, 1.07, 0.38, 1.34, 3.98, 0.98, 3.12, 6.47, 0.48, 0.07, 1.3, 0.93, -0.41, 1.46, 1.05, 0.32, 8.97, 1.01, 3.14, 0.92, 0.43, 3.48]} \ No newline at end of file diff --git a/annotations_filtered/jUkqho3OUos_filtered.json b/annotations_filtered/jUkqho3OUos_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..071aa5d56b560ce6918e1313efbe97365aad58bd --- /dev/null +++ b/annotations_filtered/jUkqho3OUos_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.4], [6.0, 5.83], [13.0, 16.33], [20.0, 20.82], [39.0, 39.6], [40.0, 40.8], [76.0, 76.94], [95.0, 95.44]], "keep_status": [false, false, true, false, false, false, false, false], "silence_prob": [99.36, 0.0, 43.85, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["frog", 14.83], ["radio", 9.8], ["wheeze", 7.11]], null, null, null, null, null], "duration": [3.4, -0.17, 3.33, 0.82, 0.6, 0.8, 0.94, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/jVGNdB6iEeA_filtered.json b/annotations_filtered/jVGNdB6iEeA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5eec2eae92f214cc60fe9aa03f6b213e5d0c7b1c --- /dev/null +++ b/annotations_filtered/jVGNdB6iEeA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.62], [9.0, 9.93], [13.0, 15.11], [18.0, 20.8], [65.0, 69.01], [83.0, 83.98], [91.0, 91.74], [94.0, 94.42], [112.0, 113.14], [113.0, 114.99], [132.0, 133.54], [146.0, 146.47], [148.0, 155.8], [185.0, 186.83], [204.0, 205.11], [208.0, 213.44], [214.0, 213.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 76.86, 95.91, 60.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.92, 0.0, 0.0, 40.22, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 76.33], ["theremin", 2.26], ["musical instrument", 2.13]], null, null, [["music", 60.8], ["clarinet", 6.97], ["musical instrument", 3.68]], null], "duration": [0.62, 0.93, 2.11, 2.8, 4.01, 0.98, 0.74, 0.42, 1.14, 1.99, 1.54, 0.47, 7.8, 1.83, 1.11, 5.44, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/jVGX-_Iodwc_filtered.json b/annotations_filtered/jVGX-_Iodwc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6252673b90248c1cadee2273796e1f454cea808 --- /dev/null +++ b/annotations_filtered/jVGX-_Iodwc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.03], [6.0, 6.66], [37.0, 37.3], [42.0, 43.63], [52.0, 62.83], [74.0, 74.75], [76.0, 77.18], [78.0, 78.48], [81.0, 86.51], [92.0, 93.87], [99.0, 99.89], [102.0, 109.43], [112.0, 112.11], [114.0, 116.9], [117.0, 116.94], [117.0, 145.1], [162.0, 170.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 33.62, 0.0, 0.0, 0.0, 46.75, 0.0, 0.0, 31.48, 0.0, 30.36, 0.0, 29.98, 34.93], "audiomae_on_audioset": [null, null, null, null, [["music", 83.06], ["guitar", 1.5], ["singing", 1.41]], null, null, null, [["music", 46.44], ["sidetone", 36.36], ["electronic music", 3.94]], null, null, [["music", 72.09], ["speech", 7.62], ["boing", 2.78]], null, [["music", 64.11], ["musical instrument", 4.66], ["throbbing", 4.51]], null, [["music", 68.88], ["buzz", 7.89], ["didgeridoo", 3.15]], [["throbbing", 52.05], ["hum", 32.48], ["music", 9.53]]], "duration": [1.03, 0.66, 0.3, 1.63, 10.83, 0.75, 1.18, 0.48, 5.51, 1.87, 0.89, 7.43, 0.11, 2.9, -0.06, 28.1, 8.9]} \ No newline at end of file diff --git a/annotations_filtered/jVH_NN7phnA_filtered.json b/annotations_filtered/jVH_NN7phnA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..829ed704ecf60fc857054b8965abc7eafbaba49c --- /dev/null +++ b/annotations_filtered/jVH_NN7phnA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.91], [10.0, 10.13], [15.0, 15.36], [23.0, 24.76], [28.0, 28.65], [37.0, 36.9], [44.0, 44.34], [49.0, 48.74], [54.0, 54.03], [55.0, 57.86], [59.0, 59.12], [61.0, 61.67], [65.0, 65.3], [71.0, 71.29], [81.0, 80.77], [84.0, 84.43], [88.0, 88.79], [90.0, 90.49], [91.0, 95.52], [97.0, 97.44], [100.0, 100.4], [101.0, 101.98], [107.0, 108.36], [109.0, 111.82], [117.0, 117.54], [118.0, 118.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.24, 0.0, 0.0, 0.0, 0.0, 35.24, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["dog", 25.2], ["bark", 18.16], ["domestic animals, pets", 10.16]], null, null], "duration": [-0.09, 0.13, 0.36, 1.76, 0.65, -0.1, 0.34, -0.26, 0.03, 2.86, 0.12, 0.67, 0.3, 0.29, -0.23, 0.43, 0.79, 0.49, 4.52, 0.44, 0.4, 0.98, 1.36, 2.82, 0.54, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/jVjq_m-PWSQ_filtered.json b/annotations_filtered/jVjq_m-PWSQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87f97967025066bc5d5c54c329ed7b4e6cc85a30 --- /dev/null +++ b/annotations_filtered/jVjq_m-PWSQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 7.4], [8.0, 8.8], [12.0, 12.21], [14.0, 14.2], [15.0, 15.7], [17.0, 17.14], [18.0, 18.49], [19.0, 21.24], [22.0, 30.21], [32.0, 32.21], [33.0, 33.88], [37.0, 37.45], [39.0, 39.14], [43.0, 45.13], [47.0, 49.64], [51.0, 51.36], [53.0, 65.45], [66.0, 76.98], [78.0, 78.22], [80.0, 81.23], [82.0, 83.13], [84.0, 92.94], [94.0, 93.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.51, 87.55, 0.0, 0.0, 0.0, 0.0, 43.1, 99.36, 0.0, 92.31, 67.38, 0.0, 0.0, 0.0, 87.55, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 19.48], ["moo", 13.15], ["cattle, bovinae", 8.76]], null, null, null, null, null, null, null, null, null], "duration": [7.4, 0.8, 0.21, 0.2, 0.7, 0.14, 0.49, 2.24, 8.21, 0.21, 0.88, 0.45, 0.14, 2.13, 2.64, 0.36, 12.45, 10.98, 0.22, 1.23, 1.13, 8.94, -0.18]} \ No newline at end of file diff --git a/annotations_filtered/jVsXMF9sbVQ_filtered.json b/annotations_filtered/jVsXMF9sbVQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f373d4bba0c705461a5fc10f14823aac74e3216f --- /dev/null +++ b/annotations_filtered/jVsXMF9sbVQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 26.05], [28.0, 43.8], [45.0, 45.25], [46.0, 45.98], [47.0, 48.2], [50.0, 50.84], [51.0, 51.61], [54.0, 60.37], [61.0, 62.21], [63.0, 63.76], [68.0, 68.39], [69.0, 69.65], [71.0, 71.37], [72.0, 72.59], [74.0, 74.26], [76.0, 77.84], [78.0, 89.61], [96.0, 96.28], [100.0, 100.18], [101.0, 101.24], [103.0, 102.98], [120.0, 120.6], [124.0, 124.73], [129.0, 129.73]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.22, 35.71, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["theremin", 75.65], ["music", 16.93], ["musical instrument", 2.23]], [["explosion", 28.04], ["eruption", 17.59], ["hum", 14.37]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [14.05, 15.8, 0.25, -0.02, 1.2, 0.84, 0.61, 6.37, 1.21, 0.76, 0.39, 0.65, 0.37, 0.59, 0.26, 1.84, 11.61, 0.28, 0.18, 0.24, -0.02, 0.6, 0.73, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/jVu_cuFHZnc_filtered.json b/annotations_filtered/jVu_cuFHZnc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..260c56405c09768b68efb7ab6e63e9a2dcd34c5f --- /dev/null +++ b/annotations_filtered/jVu_cuFHZnc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.33], [6.0, 6.42], [9.0, 9.58], [12.0, 12.39], [13.0, 13.85], [16.0, 16.48], [24.0, 25.95], [28.0, 34.28], [40.0, 45.82], [48.0, 51.39], [52.0, 53.28], [54.0, 55.98], [57.0, 58.58], [60.0, 60.61], [64.0, 65.16], [68.0, 68.82], [71.0, 71.86], [74.0, 76.77], [77.0, 79.76], [82.0, 82.93], [85.0, 86.31], [89.0, 90.1], [93.0, 95.23], [96.0, 97.24], [98.0, 99.62], [100.0, 101.11], [102.0, 102.93], [107.0, 108.55], [110.0, 113.24], [115.0, 116.48], [117.0, 117.36], [123.0, 124.36], [128.0, 127.77], [129.0, 129.83], [132.0, 132.53], [133.0, 133.08], [134.0, 136.11], [137.0, 138.99], [140.0, 140.88], [143.0, 143.31]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.08, 40.14, 38.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.76, 49.5, 0.0, 0.0, 0.0, 54.1, 0.0, 0.0, 0.0, 0.0, 0.0, 48.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.99, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 45.08], ["ambient music", 15.46], ["hum", 6.67]], [["music", 59.79], ["ambient music", 19.69], ["gong", 2.09]], [["music", 48.3], ["harmonic", 5.09], ["ambient music", 4.55]], null, null, null, null, null, null, null, null, [["music", 29.92], ["effects unit", 3.71], ["musical instrument", 3.23]], null, null, null, null, null, null, null, null, null, [["music", 50.21], ["ambient music", 15.93], ["singing bowl", 5.29]], null, null, null, null, null, null, null, [["speech", 77.69], ["telephone", 8.83], ["sidetone", 3.96]], null, null, null], "duration": [1.33, 0.42, 0.58, 0.39, 0.85, 0.48, 1.95, 6.28, 5.82, 3.39, 1.28, 1.98, 1.58, 0.61, 1.16, 0.82, 0.86, 2.77, 2.76, 0.93, 1.31, 1.1, 2.23, 1.24, 1.62, 1.11, 0.93, 1.55, 3.24, 1.48, 0.36, 1.36, -0.23, 0.83, 0.53, 0.08, 2.11, 1.99, 0.88, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/jVxyX7FcS4Q_filtered.json b/annotations_filtered/jVxyX7FcS4Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4400cbe8e26a1fe4497a962263494e839968fd57 --- /dev/null +++ b/annotations_filtered/jVxyX7FcS4Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.75], [4.0, 9.46], [10.0, 10.44], [12.0, 12.14], [13.0, 19.04], [20.0, 20.11], [22.0, 23.62], [24.0, 25.22], [26.0, 27.99], [29.0, 30.05], [31.0, 34.6], [36.0, 37.71], [39.0, 41.44], [44.0, 45.01], [50.0, 49.89], [52.0, 53.4], [60.0, 59.8], [61.0, 67.0], [68.0, 71.22], [76.0, 77.89], [79.0, 80.62], [82.0, 82.65], [84.0, 84.87], [86.0, 86.76], [88.0, 89.26], [91.0, 91.64], [93.0, 92.99], [94.0, 95.13], [96.0, 99.0], [102.0, 102.02], [103.0, 104.67], [105.0, 106.35], [107.0, 107.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 81.35, 0.0, 0.0, 93.6, 0.0, 0.0, 0.0, 0.0, 0.0, 90.08, 0.0, 90.08, 0.0, 0.0, 0.0, 0.0, 98.99, 86.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.41, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.25, 5.46, 0.44, 0.14, 6.04, 0.11, 1.62, 1.22, 1.99, 1.05, 3.6, 1.71, 2.44, 1.01, -0.11, 1.4, -0.2, 6.0, 3.22, 1.89, 1.62, 0.65, 0.87, 0.76, 1.26, 0.64, -0.01, 1.13, 3.0, 0.02, 1.67, 1.35, 0.99]} \ No newline at end of file diff --git a/annotations_filtered/jW1CeAVPhVg_filtered.json b/annotations_filtered/jW1CeAVPhVg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae8d2413551cfeee7e7697a831c70632aa4249d1 --- /dev/null +++ b/annotations_filtered/jW1CeAVPhVg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.36], [2.0, 42.36], [45.0, 45.42], [46.0, 62.23], [63.0, 63.63], [64.0, 71.19], [71.0, 100.79], [101.0, 103.25], [105.0, 112.87]], "keep_status": [false, false, false, true, false, true, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 33.76, 0.0, 34.69, 32.72, 34.46, 31.35], "audiomae_on_audioset": [null, null, null, [["speech", 46.66], ["music", 13.51], ["buzz", 6.69]], null, [["speech", 34.6], ["music", 28.24], ["trombone", 6.17]], [["speech", 49.49], ["music", 21.84], ["electronic music", 2.29]], [["mains hum", 13.77], ["hum", 13.15], ["buzzer", 11.2]], [["speech", 37.26], ["music", 21.23], ["vehicle", 8.48]]], "duration": [0.36, 40.36, 0.42, 16.23, 0.63, 7.19, 29.79, 2.25, 7.87]} \ No newline at end of file diff --git a/annotations_filtered/jW2zOdceqr8_filtered.json b/annotations_filtered/jW2zOdceqr8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a029933b2008a5c6c73a440589bac034048f8b4 --- /dev/null +++ b/annotations_filtered/jW2zOdceqr8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.87], [20.0, 20.95], [22.0, 40.96], [44.0, 45.45], [49.0, 50.03], [51.0, 52.08], [56.0, 64.15], [65.0, 66.31], [68.0, 86.22], [87.0, 145.56]], "keep_status": [false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 34.01, 0.0, 0.0, 0.0, 31.06, 0.0, 31.03, 0.0], "audiomae_on_audioset": [null, null, [["music", 61.48], ["musical instrument", 6.7], ["didgeridoo", 3.94]], null, null, null, [["throbbing", 24.38], ["speech", 21.64], ["music", 20.3]], null, [["music", 40.26], ["throbbing", 36.77], ["hum", 9.91]], null], "duration": [0.87, 0.95, 18.96, 1.45, 1.03, 1.08, 8.15, 1.31, 18.22, 58.56]} \ No newline at end of file diff --git a/annotations_filtered/jWHcIO4y8kk_filtered.json b/annotations_filtered/jWHcIO4y8kk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65b617aebb7e0580fc5c7886fb1f33ed298f2435 --- /dev/null +++ b/annotations_filtered/jWHcIO4y8kk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.17], [25.0, 24.92], [30.0, 31.48], [36.0, 36.04], [39.0, 40.19], [41.0, 41.47], [49.0, 54.26], [57.0, 57.28], [65.0, 66.12], [71.0, 71.88], [81.0, 80.92], [90.0, 92.91], [97.0, 96.58], [98.0, 98.88], [102.0, 102.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.01, 0.0, 0.0, 0.0, 0.0, 95.64, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.17, -0.08, 1.48, 0.04, 1.19, 0.47, 5.26, 0.28, 1.12, 0.88, -0.08, 2.91, -0.42, 0.88, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/jWJqzIUntho_filtered.json b/annotations_filtered/jWJqzIUntho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f5c40e07960d2271279c0bf2869d1a17ed0df91 --- /dev/null +++ b/annotations_filtered/jWJqzIUntho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.97], [7.0, 7.57], [11.0, 11.67], [18.0, 17.85], [21.0, 21.95], [24.0, 24.22], [26.0, 27.38], [30.0, 29.83], [34.0, 35.53], [36.0, 36.96], [39.0, 39.73], [45.0, 47.19], [48.0, 50.31], [52.0, 54.8], [55.0, 57.47], [59.0, 61.45], [63.0, 67.74], [69.0, 72.08], [74.0, 76.65], [80.0, 80.6], [83.0, 83.51], [86.0, 86.59], [90.0, 90.14], [92.0, 92.37], [94.0, 94.83], [97.0, 97.82], [99.0, 99.1], [100.0, 107.16], [109.0, 109.41], [110.0, 111.74], [115.0, 115.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.8, 79.76, 99.88, 99.56, 99.99, 99.87, 99.71, 98.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.03, 0.57, 0.67, -0.15, 0.95, 0.22, 1.38, -0.17, 1.53, 0.96, 0.73, 2.19, 2.31, 2.8, 2.47, 2.45, 4.74, 3.08, 2.65, 0.6, 0.51, 0.59, 0.14, 0.37, 0.83, 0.82, 0.1, 7.16, 0.41, 1.74, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/jWQ1ITS94cA_filtered.json b/annotations_filtered/jWQ1ITS94cA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a677cada4448c40ff6f23b9bde67c3fa00969af3 --- /dev/null +++ b/annotations_filtered/jWQ1ITS94cA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.5], [15.0, 16.09], [17.0, 17.59], [21.0, 24.76], [28.0, 28.24], [31.0, 32.04], [45.0, 45.84], [57.0, 57.67], [58.0, 58.92], [66.0, 66.97], [68.0, 69.04], [71.0, 72.06], [73.0, 74.78], [75.0, 75.76], [85.0, 85.43], [88.0, 88.26], [91.0, 92.25], [94.0, 98.73], [101.0, 113.58], [115.0, 115.69], [122.0, 122.81], [124.0, 126.01], [127.0, 127.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 60.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.87, 48.48, 0.0, 0.0, 79.24, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["radio", 66.02], ["hum", 11.05], ["telephone dialing, dtmf", 8.74]], null, null, null, null], "duration": [1.5, 1.09, 0.59, 3.76, 0.24, 1.04, 0.84, 0.67, 0.92, 0.97, 1.04, 1.06, 1.78, 0.76, 0.43, 0.26, 1.25, 4.73, 12.58, 0.69, 0.81, 2.01, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/jWt7wiLImmU_filtered.json b/annotations_filtered/jWt7wiLImmU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1daac1365c6ad863381c52da84027100700fece3 --- /dev/null +++ b/annotations_filtered/jWt7wiLImmU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.3], [19.0, 19.47], [33.0, 34.4], [40.0, 41.05], [44.0, 44.51], [45.0, 45.77], [50.0, 50.68], [51.0, 51.78], [57.0, 57.4], [62.0, 62.55], [63.0, 63.9], [66.0, 68.69], [70.0, 70.17], [72.0, 71.61], [72.0, 72.67], [76.0, 79.24], [81.0, 81.68], [82.0, 82.63], [88.0, 88.65], [92.0, 92.87], [94.0, 94.02], [95.0, 95.47], [98.0, 99.25], [101.0, 101.97], [103.0, 104.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.96, 0.0, 0.0, 0.0, 39.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mosquito", 31.55], ["fly, housefly", 30.85], ["insect", 14.84]], null, null, null, null, null, null, null, null, null], "duration": [0.3, 0.47, 1.4, 1.05, 0.51, 0.77, 0.68, 0.78, 0.4, 0.55, 0.9, 2.69, 0.17, -0.39, 0.67, 3.24, 0.68, 0.63, 0.65, 0.87, 0.02, 0.47, 1.25, 0.97, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/jWyeugspkUA_filtered.json b/annotations_filtered/jWyeugspkUA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e5c322824ff2f7207874178c6cfc52a3c5d256f7 --- /dev/null +++ b/annotations_filtered/jWyeugspkUA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.59], [6.0, 7.4], [14.0, 16.24], [20.0, 19.97], [24.0, 23.89], [33.0, 47.46], [52.0, 74.8], [77.0, 94.56], [98.0, 108.28], [109.0, 109.71], [110.0, 111.45]], "keep_status": [false, false, false, false, false, true, true, true, true, false, false], "silence_prob": [0.0, 0.0, 42.28, 0.0, 0.0, 32.14, 32.61, 32.83, 31.85, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["theremin", 40.49], ["music", 30.31], ["creak", 4.39]], null, null, [["music", 49.08], ["didgeridoo", 11.37], ["speech", 9.17]], [["fly, housefly", 24.78], ["groan", 12.46], ["whack, thwack", 11.61]], [["music", 19.51], ["fart", 11.32], ["speech", 10.82]], [["music", 42.92], ["whale vocalization", 5.57], ["livestock, farm animals, working animals", 4.65]], null, null], "duration": [-0.41, 1.4, 2.24, -0.03, -0.11, 14.46, 22.8, 17.56, 10.28, 0.71, 1.45]} \ No newline at end of file diff --git a/annotations_filtered/jX09Cesfxo8_filtered.json b/annotations_filtered/jX09Cesfxo8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bbdc4e3c5f111e37036de0851df5bbf4b24e945a --- /dev/null +++ b/annotations_filtered/jX09Cesfxo8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.8], [17.0, 18.4], [19.0, 29.96], [31.0, 31.56], [35.0, 46.67], [47.0, 64.88]], "keep_status": [false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 76.86, 0.0, 33.92, 33.58], "audiomae_on_audioset": [null, null, null, null, [["music", 44.15], ["boing", 11.0], ["whack, thwack", 7.48]], [["music", 28.52], ["speech", 26.95], ["didgeridoo", 13.91]]], "duration": [1.8, 1.4, 10.96, 0.56, 11.67, 17.88]} \ No newline at end of file diff --git a/annotations_filtered/jXA-4rN9-ds_filtered.json b/annotations_filtered/jXA-4rN9-ds_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35805a54c4242ccd185b41fd45d2611a0f8c4553 --- /dev/null +++ b/annotations_filtered/jXA-4rN9-ds_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.61], [4.0, 28.95], [34.0, 92.64], [93.0, 107.69], [109.0, 109.93], [111.0, 111.11], [114.0, 113.58], [114.0, 114.93]], "keep_status": [false, true, false, true, false, false, false, false], "silence_prob": [0.0, 31.03, 0.0, 31.52, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 41.21], ["mosquito", 12.13], ["fly, housefly", 6.06]], null, [["speech", 43.9], ["whack, thwack", 5.99], ["music", 5.1]], null, null, null, null], "duration": [1.61, 24.95, 58.64, 14.69, 0.93, 0.11, -0.42, 0.93]} \ No newline at end of file diff --git a/annotations_filtered/jXGV-MT-TmU_filtered.json b/annotations_filtered/jXGV-MT-TmU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3bbfb812e6f4b5b636555ebcf0508337147cd58 --- /dev/null +++ b/annotations_filtered/jXGV-MT-TmU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.22], [6.0, 6.52], [8.0, 10.2], [13.0, 14.5], [17.0, 21.34], [23.0, 24.17], [26.0, 27.62], [29.0, 30.48], [32.0, 52.14], [53.0, 53.64], [55.0, 56.0], [57.0, 59.83], [61.0, 61.96], [64.0, 64.03], [65.0, 65.47], [68.0, 69.6], [70.0, 72.25], [73.0, 76.28], [83.0, 84.37], [88.0, 88.15], [94.0, 93.72], [102.0, 102.86], [107.0, 107.54], [109.0, 109.75], [110.0, 110.86], [114.0, 113.83], [118.0, 121.98], [124.0, 125.05], [128.0, 128.29]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 42.48, 0.0, 72.16, 0.0, 0.0, 0.0, 53.16, 0.0, 0.0, 44.4, 0.0, 0.0, 0.0, 0.0, 34.72, 39.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.03, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["noise", 10.26], ["creak", 9.94], ["hum", 7.54]], null, null, null, null, null, null, null, null, [["music", 46.64], ["mains hum", 9.14], ["hum", 8.4]], null, null, null, null, [["music", 30.01], ["speech", 22.26], ["cattle, bovinae", 7.49]], [["music", 52.85], ["cattle, bovinae", 5.04], ["musical instrument", 4.53]], null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 61.53], ["cattle, bovinae", 11.51], ["moo", 7.85]], null, null], "duration": [0.22, 0.52, 2.2, 1.5, 4.34, 1.17, 1.62, 1.48, 20.14, 0.64, 1.0, 2.83, 0.96, 0.03, 0.47, 1.6, 2.25, 3.28, 1.37, 0.15, -0.28, 0.86, 0.54, 0.75, 0.86, -0.17, 3.98, 1.05, 0.29]} \ No newline at end of file diff --git a/annotations_filtered/jXIFh5Gwqno_filtered.json b/annotations_filtered/jXIFh5Gwqno_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d5c57cae09c4ffd213b5a4d750f640f289b1f40 --- /dev/null +++ b/annotations_filtered/jXIFh5Gwqno_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.98], [35.0, 38.94], [39.0, 39.46], [46.0, 51.75], [56.0, 62.82], [65.0, 68.01], [76.0, 76.47], [80.0, 80.33], [84.0, 90.95], [94.0, 96.42], [99.0, 105.44], [107.0, 106.64], [108.0, 111.25], [130.0, 130.82], [132.0, 142.57], [150.0, 152.09], [154.0, 162.65], [163.0, 163.75], [164.0, 164.47], [166.0, 167.54], [169.0, 170.24]], "keep_status": [false, false, false, true, true, false, false, false, false, true, true, false, true, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 37.21, 0.0, 31.26, 43.35, 82.61, 0.0, 0.0, 64.29, 32.33, 31.52, 0.0, 34.11, 0.0, 30.26, 99.71, 31.26, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 35.58], ["boing", 29.42], ["music", 13.03]], null, [["music", 39.42], ["boing", 23.6], ["cattle, bovinae", 4.42]], [["music", 58.01], ["speech", 6.39], ["hum", 5.21]], null, null, null, null, [["music", 33.29], ["speech", 14.36], ["cattle, bovinae", 11.85]], [["music", 33.0], ["boing", 26.22], ["speech", 10.25]], null, [["music", 56.57], ["groan", 4.82], ["cattle, bovinae", 3.96]], null, [["music", 59.28], ["noise", 5.28], ["theremin", 4.6]], null, [["music", 68.99], ["hum", 5.99], ["foghorn", 2.89]], null, null, null, null], "duration": [-0.02, 3.94, 0.46, 5.75, 6.82, 3.01, 0.47, 0.33, 6.95, 2.42, 6.44, -0.36, 3.25, 0.82, 10.57, 2.09, 8.65, 0.75, 0.47, 1.54, 1.24]} \ No newline at end of file diff --git a/annotations_filtered/jXKc-0nVIkQ_filtered.json b/annotations_filtered/jXKc-0nVIkQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bddb5fbe4ff10f28bfbc4dd5768a32e10d016cc5 --- /dev/null +++ b/annotations_filtered/jXKc-0nVIkQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.59], [17.0, 18.42], [19.0, 20.36], [22.0, 23.3], [24.0, 24.46], [26.0, 29.39], [31.0, 33.07], [46.0, 47.01], [48.0, 69.8], [70.0, 79.07], [84.0, 87.51], [89.0, 90.14], [97.0, 101.93], [103.0, 107.47], [108.0, 108.92], [116.0, 118.52], [129.0, 128.82], [132.0, 132.78], [137.0, 137.12], [137.0, 141.79], [142.0, 141.83], [142.0, 141.86], [142.0, 141.89], [142.0, 141.93], [142.0, 141.96], [142.0, 141.99], [142.0, 142.03], [144.0, 150.35], [151.0, 152.66], [154.0, 154.33], [154.0, 161.32], [162.0, 166.68], [169.0, 169.75], [171.0, 171.93], [173.0, 174.12], [175.0, 177.21]], "keep_status": [false, false, false, false, false, false, false, false, true, true, true, false, true, true, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.78, 55.18, 0.0, 30.91, 28.42, 28.8, 0.0, 29.03, 29.11, 0.0, 29.16, 0.0, 0.0, 0.0, 28.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.32, 0.0, 0.0, 35.44, 35.87, 0.0, 0.0, 0.0, 50.02], "audiomae_on_audioset": [null, null, null, null, null, [["fly, housefly", 44.4], ["mosquito", 38.37], ["insect", 7.71]], null, null, [["noise", 31.35], ["grunt", 14.19], ["speech", 8.34]], [["music", 28.63], ["hum", 11.15], ["mains hum", 11.08]], [["speech", 20.74], ["vehicle", 16.45], ["cacophony", 5.04]], null, [["vehicle", 28.05], ["speech", 23.46], ["car", 8.79]], [["speech", 40.3], ["buzzer", 9.12], ["buzz", 7.66]], null, [["vehicle", 43.41], ["car", 8.22], ["whir", 4.98]], null, null, null, [["speech", 18.92], ["roaring cats (lions, tigers)", 16.91], ["fart", 11.4]], null, null, null, null, null, null, null, [["hum", 48.38], ["mains hum", 35.42], ["electric shaver, electric razor", 3.23]], null, null, [["creak", 31.69], ["mechanisms", 8.19], ["animal", 6.61]], [["music", 55.98], ["hum", 8.19], ["mains hum", 5.73]], null, null, null, null], "duration": [0.59, 1.42, 1.36, 1.3, 0.46, 3.39, 2.07, 1.01, 21.8, 9.07, 3.51, 1.14, 4.93, 4.47, 0.92, 2.52, -0.18, 0.78, 0.12, 4.79, -0.17, -0.14, -0.11, -0.07, -0.04, -0.01, 0.03, 6.35, 1.66, 0.33, 7.32, 4.68, 0.75, 0.93, 1.12, 2.21]} \ No newline at end of file diff --git a/annotations_filtered/jXReN1Nzlws_filtered.json b/annotations_filtered/jXReN1Nzlws_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..369499a1466a7c13af386a85477f681d9f0c8607 --- /dev/null +++ b/annotations_filtered/jXReN1Nzlws_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.02], [30.0, 30.67], [42.0, 43.63], [45.0, 50.3], [52.0, 52.22], [61.0, 62.19], [63.0, 63.61], [64.0, 64.93], [67.0, 82.22], [82.0, 82.29], [82.0, 83.05], [86.0, 98.29], [101.0, 103.5], [138.0, 139.63], [145.0, 146.82], [149.0, 149.44], [151.0, 155.09]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.72, 0.0, 0.0, 0.0, 0.0, 30.72, 0.0, 0.0, 30.54, 31.07, 0.0, 0.0, 0.0, 34.82], "audiomae_on_audioset": [null, null, null, [["speech", 27.63], ["animal", 19.54], ["frog", 14.99]], null, null, null, null, [["music", 76.41], ["cacophony", 8.27], ["synthesizer", 3.1]], null, null, [["music", 71.99], ["boing", 8.41], ["speech", 6.69]], [["music", 35.2], ["speech", 13.41], ["boing", 7.11]], null, null, null, [["music", 44.18], ["speech", 21.88], ["boing", 8.78]]], "duration": [1.02, 0.67, 1.63, 5.3, 0.22, 1.19, 0.61, 0.93, 15.22, 0.29, 1.05, 12.29, 2.5, 1.63, 1.82, 0.44, 4.09]} \ No newline at end of file diff --git a/annotations_filtered/jXb09CCPFO4_filtered.json b/annotations_filtered/jXb09CCPFO4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a94c161953a98a7f5c1f0e1e571814fde7553651 --- /dev/null +++ b/annotations_filtered/jXb09CCPFO4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.68], [14.0, 15.13], [16.0, 43.8], [46.0, 46.14], [47.0, 47.97], [49.0, 50.99], [59.0, 59.53], [63.0, 63.39], [65.0, 65.04], [69.0, 70.09], [74.0, 75.59], [77.0, 77.36], [81.0, 82.24], [85.0, 85.97], [88.0, 102.24], [105.0, 105.98]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66, 0.0], "audiomae_on_audioset": [null, null, [["music", 39.57], ["brass instrument", 13.27], ["speech", 12.68]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.68, 1.13, 27.8, 0.14, 0.97, 1.99, 0.53, 0.39, 0.04, 1.09, 1.59, 0.36, 1.24, 0.97, 14.24, 0.98]} \ No newline at end of file diff --git a/annotations_filtered/jY2PzzjO3zo_filtered.json b/annotations_filtered/jY2PzzjO3zo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed2710d1fa26516cb3c1596cb6d45ea3d61658d8 --- /dev/null +++ b/annotations_filtered/jY2PzzjO3zo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.84], [12.0, 12.55], [18.0, 18.4], [37.0, 37.59], [42.0, 42.96], [54.0, 54.18], [61.0, 61.72], [64.0, 64.23], [65.0, 65.5], [78.0, 78.02], [85.0, 86.27], [92.0, 95.3], [96.0, 96.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.71, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 33.67], ["hum", 22.07], ["mains hum", 15.84]], null], "duration": [0.84, 0.55, 0.4, 0.59, 0.96, 0.18, 0.72, 0.23, 0.5, 0.02, 1.27, 3.3, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/jY4nU1rwWv8_filtered.json b/annotations_filtered/jY4nU1rwWv8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f9cc925ffbf9693256f33392b32435e16fb5869 --- /dev/null +++ b/annotations_filtered/jY4nU1rwWv8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 15.6], [23.0, 26.65], [36.0, 37.18], [42.0, 42.11], [43.0, 43.21], [43.0, 43.41], [44.0, 56.29], [67.0, 69.62], [84.0, 84.55], [90.0, 92.26], [93.0, 94.53], [95.0, 128.07], [128.0, 128.53], [134.0, 143.01], [146.0, 146.7]], "keep_status": [false, true, false, false, false, false, true, true, false, true, false, false, false, false, false], "silence_prob": [33.09, 45.69, 0.0, 0.0, 0.0, 0.0, 34.35, 36.79, 0.0, 33.57, 0.0, 0.0, 0.0, 37.03, 0.0], "audiomae_on_audioset": [[["music", 54.47], ["speech", 15.63], ["explosion", 3.51]], [["music", 24.0], ["speech", 12.05], ["breaking", 8.45]], null, null, null, null, [["music", 29.41], ["speech", 20.07], ["whack, thwack", 6.95]], [["music", 23.27], ["thunk", 10.97], ["animal", 6.46]], null, [["speech", 26.65], ["music", 24.3], ["sidetone", 7.48]], null, null, null, [["speech", 44.51], ["music", 31.88], ["whack, thwack", 4.07]], null], "duration": [12.6, 3.65, 1.18, 0.11, 0.21, 0.41, 12.29, 2.62, 0.55, 2.26, 1.53, 33.07, 0.53, 9.01, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/jYID_csTvos_filtered.json b/annotations_filtered/jYID_csTvos_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fea4b05478d36ef714771d14a926ae75f13e0c30 --- /dev/null +++ b/annotations_filtered/jYID_csTvos_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.49], [6.0, 9.37], [32.0, 33.78], [50.0, 51.97], [56.0, 60.12], [63.0, 64.47], [67.0, 69.15], [75.0, 76.44], [81.0, 107.11]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.05, 0.0, 0.0, 31.24, 0.0, 31.38, 0.0, 31.95], "audiomae_on_audioset": [null, [["music", 74.73], ["synthesizer", 4.66], ["musical instrument", 3.59]], null, null, [["music", 72.51], ["didgeridoo", 6.14], ["reggae", 3.99]], null, [["music", 80.77], ["didgeridoo", 5.86], ["musical instrument", 2.13]], null, [["music", 74.76], ["musical instrument", 3.97], ["synthesizer", 3.14]]], "duration": [0.49, 3.37, 1.78, 1.97, 4.12, 1.47, 2.15, 1.44, 26.11]} \ No newline at end of file diff --git a/annotations_filtered/jYbI8iVYCpc_filtered.json b/annotations_filtered/jYbI8iVYCpc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..345c23471a525385719128207de8c7eb53c10cb2 --- /dev/null +++ b/annotations_filtered/jYbI8iVYCpc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.56], [9.0, 9.12], [13.0, 14.03], [14.0, 16.95], [18.0, 19.01], [20.0, 21.15], [23.0, 27.31], [28.0, 29.71], [30.0, 35.06], [38.0, 54.36], [55.0, 64.15]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 90.08, 0.0, 0.0, 45.88, 0.0, 63.85, 92.64, 29.76], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 35.13], ["hum", 5.96], ["chirp tone", 5.78]], null, null, null, [["mains hum", 34.66], ["hum", 16.62], ["noise", 14.66]]], "duration": [1.56, 0.12, 1.03, 2.95, 1.01, 1.15, 4.31, 1.71, 5.06, 16.36, 9.15]} \ No newline at end of file diff --git a/annotations_filtered/jYnRBX2Trtk_filtered.json b/annotations_filtered/jYnRBX2Trtk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe85637897dcd2efedf58c53aadf8ec3d1fcdedc --- /dev/null +++ b/annotations_filtered/jYnRBX2Trtk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.47], [4.0, 9.1], [11.0, 11.58], [16.0, 17.51], [40.0, 40.29], [45.0, 45.37], [47.0, 49.03], [60.0, 60.29], [63.0, 63.04], [66.0, 67.15], [68.0, 69.9], [75.0, 81.33], [83.0, 83.32], [84.0, 87.05], [93.0, 93.26], [94.0, 95.93], [96.0, 96.9], [100.0, 101.24], [104.0, 104.99], [106.0, 106.74], [107.0, 113.41], [117.0, 118.94], [119.0, 121.34], [123.0, 125.58], [129.0, 131.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 77.87, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 38.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.98, 0.0, 93.6, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["crushing", 28.11], ["whack, thwack", 7.16], ["sidetone", 5.33]], null, null, null, null, null, null, [["speech", 77.96], ["thunk", 7.17], ["sidetone", 2.93]], null, null, null, null], "duration": [1.47, 5.1, 0.58, 1.51, 0.29, 0.37, 2.03, 0.29, 0.04, 1.15, 1.9, 6.33, 0.32, 3.05, 0.26, 1.93, 0.9, 1.24, 0.99, 0.74, 6.41, 1.94, 2.34, 2.58, 2.21]} \ No newline at end of file diff --git a/annotations_filtered/jYpYTpKuT_k_filtered.json b/annotations_filtered/jYpYTpKuT_k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..591fd6f606d488993d28924ff0df9b757ca5bd53 --- /dev/null +++ b/annotations_filtered/jYpYTpKuT_k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 7.3], [8.0, 21.12], [24.0, 34.52], [38.0, 42.03], [43.0, 53.22], [57.0, 68.72], [69.0, 73.14], [76.0, 76.27], [79.0, 79.86], [86.0, 97.85], [100.0, 112.6], [114.0, 115.6], [118.0, 144.95]], "keep_status": [false, false, false, true, true, true, true, false, false, true, false, false, false], "silence_prob": [28.64, 28.55, 28.8, 28.9, 28.86, 28.73, 28.73, 0.0, 0.0, 28.7, 28.97, 0.0, 28.44], "audiomae_on_audioset": [[["speech", 42.57], ["mains hum", 17.56], ["hum", 12.02]], [["music", 70.26], ["mains hum", 3.55], ["hum", 3.15]], [["speech", 65.77], ["music", 11.31], ["burst, pop", 1.79]], [["speech", 31.77], ["music", 18.49], ["foghorn", 16.53]], [["speech", 31.82], ["music", 20.36], ["whack, thwack", 9.35]], [["music", 26.98], ["speech", 18.11], ["whack, thwack", 13.84]], [["speech", 49.39], ["rumble", 15.03], ["whoosh, swoosh, swish", 4.87]], null, null, [["music", 23.29], ["whack, thwack", 17.99], ["smash, crash", 16.82]], [["speech", 61.23], ["music", 23.03], ["explosion", 1.62]], null, [["music", 77.08], ["mains hum", 2.46], ["hum", 2.38]]], "duration": [6.3, 13.12, 10.52, 4.03, 10.22, 11.72, 4.14, 0.27, 0.86, 11.85, 12.6, 1.6, 26.95]} \ No newline at end of file diff --git a/annotations_filtered/jYrKqg2TqUo_filtered.json b/annotations_filtered/jYrKqg2TqUo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c873a20bb4039e122527cd9543b09fa27a1a06da --- /dev/null +++ b/annotations_filtered/jYrKqg2TqUo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 32.76], [33.0, 47.01], [47.0, 64.74], [65.0, 125.05], [126.0, 127.8], [129.0, 130.42]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 99.9, 93.76, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.76, 14.01, 17.74, 60.05, 1.8, 1.42]} \ No newline at end of file diff --git a/annotations_filtered/jZXHcvhr2p8_filtered.json b/annotations_filtered/jZXHcvhr2p8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..918b989ad1159585065ea9f9988021c1aaf6aba7 --- /dev/null +++ b/annotations_filtered/jZXHcvhr2p8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.09], [21.0, 32.98], [37.0, 48.54], [51.0, 52.22], [55.0, 55.36], [59.0, 60.29], [66.0, 67.34], [68.0, 75.41], [76.0, 77.4], [79.0, 80.38], [83.0, 83.03], [92.0, 91.91], [95.0, 94.98], [103.0, 103.37], [110.0, 110.32]], "keep_status": [false, true, true, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.82, 32.5, 0.0, 0.0, 0.0, 0.0, 31.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 31.49], ["cattle, bovinae", 20.64], ["moo", 9.53]], [["music", 37.48], ["effects unit", 11.64], ["thunk", 8.48]], null, null, null, null, [["speech", 20.67], ["music", 14.05], ["fly, housefly", 11.72]], null, null, null, null, null, null, null], "duration": [0.09, 11.98, 11.54, 1.22, 0.36, 1.29, 1.34, 7.41, 1.4, 1.38, 0.03, -0.09, -0.02, 0.37, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/jZXuLQdIrEg_filtered.json b/annotations_filtered/jZXuLQdIrEg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d22bd873b3c3835a17d3628c6ad68e5aba78bec --- /dev/null +++ b/annotations_filtered/jZXuLQdIrEg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.51], [5.0, 5.8], [6.0, 7.55], [9.0, 9.73], [12.0, 12.51], [13.0, 13.32], [14.0, 15.15], [16.0, 17.02], [20.0, 20.71], [22.0, 23.01], [26.0, 26.0], [29.0, 30.43], [31.0, 32.39], [34.0, 35.31], [38.0, 41.69], [43.0, 43.68], [45.0, 45.4], [46.0, 47.01], [49.0, 51.63], [53.0, 52.89], [54.0, 59.36], [60.0, 61.25], [63.0, 63.9], [64.0, 64.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.51, 0.0, 0.0, 0.0, 96.29, 0.0, 57.09, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.51, 0.8, 1.55, 0.73, 0.51, 0.32, 1.15, 1.02, 0.71, 1.01, 0.0, 1.43, 1.39, 1.31, 3.69, 0.68, 0.4, 1.01, 2.63, -0.11, 5.36, 1.25, 0.9, 0.35]} \ No newline at end of file diff --git a/annotations_filtered/jZiR9MHumCk_filtered.json b/annotations_filtered/jZiR9MHumCk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04aca8c2545f9757c5b062ea16f8bf61522c4c02 --- /dev/null +++ b/annotations_filtered/jZiR9MHumCk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.87], [11.0, 12.36], [13.0, 12.7], [20.0, 24.7], [26.0, 27.18], [29.0, 28.81], [31.0, 30.99], [32.0, 32.63], [34.0, 35.4], [36.0, 37.52], [39.0, 40.46], [42.0, 43.31], [45.0, 71.09], [72.0, 74.22], [75.0, 106.76]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [31.09, 0.0, 0.0, 35.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.1, 49.18, 0.0], "audiomae_on_audioset": [[["mains hum", 39.76], ["hum", 31.07], ["throbbing", 7.91]], null, null, [["music", 31.57], ["musical instrument", 5.41], ["theremin", 5.06]], null, null, null, null, null, null, null, null, [["music", 31.34], ["speech", 14.54], ["buzz", 11.0]], [["speech", 25.73], ["music", 20.78], ["whale vocalization", 4.06]], null], "duration": [5.87, 1.36, -0.3, 4.7, 1.18, -0.19, -0.01, 0.63, 1.4, 1.52, 1.46, 1.31, 26.09, 2.22, 31.76]} \ No newline at end of file diff --git a/annotations_filtered/jZtlV8eroS8_filtered.json b/annotations_filtered/jZtlV8eroS8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8437571cd7555f4fed74031052712c97b264b6c9 --- /dev/null +++ b/annotations_filtered/jZtlV8eroS8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 20.01], [20.0, 21.03], [35.0, 37.52]], "keep_status": [false, false, false], "silence_prob": [91.98, 0.0, 99.91], "audiomae_on_audioset": [null, null, null], "duration": [3.01, 1.03, 2.52]} \ No newline at end of file diff --git a/annotations_filtered/jZyhfkpsGGI_filtered.json b/annotations_filtered/jZyhfkpsGGI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54e26a0ffdaa1a15bdec6b9f550e6ecc305cade8 --- /dev/null +++ b/annotations_filtered/jZyhfkpsGGI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 29.76], [32.0, 106.07], [107.0, 113.88], [114.0, 141.3], [144.0, 144.32], [145.0, 145.61], [150.0, 150.53], [151.0, 152.52], [154.0, 153.69], [154.0, 155.9], [157.0, 162.43], [164.0, 168.99], [172.0, 172.17], [173.0, 187.32], [189.0, 195.15], [198.0, 215.99]], "keep_status": [true, false, true, true, false, false, false, false, false, false, false, true, false, true, true, true], "silence_prob": [46.29, 0.0, 33.09, 31.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.67, 31.99, 0.0, 32.81, 31.54, 31.53], "audiomae_on_audioset": [[["vehicle", 9.73], ["effects unit", 9.68], ["chainsaw", 7.55]], null, [["whale vocalization", 20.8], ["hum", 4.41], ["chainsaw", 4.05]], [["noise", 22.25], ["buzz", 19.5], ["fart", 4.77]], null, null, null, null, null, null, [["whale vocalization", 44.79], ["livestock, farm animals, working animals", 13.45], ["cattle, bovinae", 11.83]], [["speech", 14.5], ["motorcycle", 13.32], ["vehicle", 10.37]], null, [["music", 12.37], ["sidetone", 12.02], ["effects unit", 10.35]], [["motorcycle", 31.42], ["vehicle", 21.31], ["accelerating, revving, vroom", 12.25]], [["speech", 28.13], ["hum", 18.46], ["electric shaver, electric razor", 13.18]]], "duration": [2.76, 74.07, 6.88, 27.3, 0.32, 0.61, 0.53, 1.52, -0.31, 1.9, 5.43, 4.99, 0.17, 14.32, 6.15, 17.99]} \ No newline at end of file diff --git a/annotations_filtered/j_1k-SzcOrs_filtered.json b/annotations_filtered/j_1k-SzcOrs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb2f3a68085855fd2ad980409a6cc4869eb6415d --- /dev/null +++ b/annotations_filtered/j_1k-SzcOrs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 25.96], [34.0, 38.04], [38.0, 38.08], [42.0, 45.27], [49.0, 49.52], [55.0, 55.58], [59.0, 65.1], [70.0, 72.35], [97.0, 97.85], [99.0, 101.14], [108.0, 108.33], [112.0, 114.44], [118.0, 117.58], [118.0, 118.42], [119.0, 119.91], [123.0, 124.71], [126.0, 127.04], [128.0, 131.58], [132.0, 133.0], [135.0, 137.61], [138.0, 139.67], [144.0, 144.9], [146.0, 145.62], [155.0, 155.6], [158.0, 158.09], [162.0, 163.27], [165.0, 165.94]], "keep_status": [true, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.73, 41.85, 0.0, 42.11, 0.0, 0.0, 32.07, 45.14, 0.0, 58.98, 0.0, 52.33, 0.0, 0.0, 0.0, 0.0, 0.0, 87.37, 0.0, 82.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 20.74], ["vehicle", 15.53], ["car", 9.59]], [["speech", 33.28], ["sidetone", 32.61], ["music", 5.96]], null, [["speech", 26.92], ["music", 15.39], ["sidetone", 7.3]], null, null, [["speech", 61.26], ["vehicle", 6.98], ["hum", 4.77]], [["speech", 38.54], ["music", 20.34], ["sidetone", 10.85]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [19.96, 4.04, 0.08, 3.27, 0.52, 0.58, 6.1, 2.35, 0.85, 2.14, 0.33, 2.44, -0.42, 0.42, 0.91, 1.71, 1.04, 3.58, 1.0, 2.61, 1.67, 0.9, -0.38, 0.6, 0.09, 1.27, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/j_2-8115ZAs_filtered.json b/annotations_filtered/j_2-8115ZAs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c82ac9b6e474af2ad94bc51389459fd6a525cbdb --- /dev/null +++ b/annotations_filtered/j_2-8115ZAs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 25.89], [30.0, 31.04], [39.0, 38.53]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [-0.11, 1.04, -0.47]} \ No newline at end of file diff --git a/annotations_filtered/j_3wS3OIgc8_filtered.json b/annotations_filtered/j_3wS3OIgc8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6787197433cb968f3ad5201a6e00c95dd00226b9 --- /dev/null +++ b/annotations_filtered/j_3wS3OIgc8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 29.39], [31.0, 83.96], [91.0, 98.74], [115.0, 116.21], [117.0, 116.97], [117.0, 130.37], [135.0, 141.47], [143.0, 143.21], [149.0, 160.41]], "keep_status": [false, false, true, false, false, true, true, false, true], "silence_prob": [32.81, 0.0, 30.54, 0.0, 0.0, 34.19, 33.06, 0.0, 39.09], "audiomae_on_audioset": [[["speech", 48.38], ["music", 22.93], ["boing", 3.45]], null, [["speech", 56.42], ["frog", 7.23], ["fart", 3.81]], null, null, [["fart", 30.62], ["speech", 23.95], ["livestock, farm animals, working animals", 7.95]], [["speech", 20.79], ["laughter", 12.71], ["animal", 5.63]], null, [["speech", 38.39], ["animal", 11.83], ["livestock, farm animals, working animals", 9.64]]], "duration": [4.39, 52.96, 7.74, 1.21, -0.03, 13.37, 6.47, 0.21, 11.41]} \ No newline at end of file diff --git a/annotations_filtered/j_UtDuZaeZo_filtered.json b/annotations_filtered/j_UtDuZaeZo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94d384725a13cd5d50d857cf0cc083fe4a42e538 --- /dev/null +++ b/annotations_filtered/j_UtDuZaeZo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 92.1], [95.0, 101.61], [105.0, 123.7], [126.0, 165.65]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 33.25, 32.2, 0.0], "audiomae_on_audioset": [null, [["music", 59.71], ["didgeridoo", 10.88], ["synthesizer", 4.53]], [["music", 70.33], ["didgeridoo", 8.39], ["brass instrument", 4.16]], null], "duration": [86.1, 6.61, 18.7, 39.65]} \ No newline at end of file diff --git a/annotations_filtered/j_a_zvQOrIE_filtered.json b/annotations_filtered/j_a_zvQOrIE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9aded9861016a7682994ae659a36303933fc7a9 --- /dev/null +++ b/annotations_filtered/j_a_zvQOrIE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.43], [6.0, 10.18], [11.0, 16.6], [19.0, 21.47], [22.0, 27.43], [29.0, 30.72], [33.0, 33.25], [35.0, 35.99], [37.0, 38.96], [40.0, 43.44], [44.0, 47.07], [48.0, 50.53], [51.0, 53.45], [54.0, 60.13], [61.0, 64.44], [66.0, 68.23], [69.0, 71.47], [73.0, 74.88], [77.0, 80.18], [81.0, 82.48], [83.0, 85.35], [87.0, 100.04], [101.0, 103.05], [106.0, 108.85], [112.0, 113.05], [115.0, 125.54], [126.0, 127.67], [129.0, 132.33], [136.0, 136.49], [137.0, 139.51], [140.0, 148.95], [151.0, 156.03], [157.0, 162.62], [164.0, 176.01], [178.0, 179.36], [180.0, 182.58], [184.0, 187.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 90.6, 89.54, 89.9, 0.0, 0.0, 0.0, 0.0, 85.35, 100.0, 99.99, 91.98, 99.85, 100.0, 100.0, 96.17, 0.0, 98.99, 0.0, 99.78, 99.85, 100.0, 100.0, 0.0, 77.2, 0.0, 89.36, 0.0, 91.13, 77.36, 76.7, 67.0, 66.88, 0.0, 70.3, 87.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.43, 4.18, 5.6, 2.47, 5.43, 1.72, 0.25, 0.99, 1.96, 3.44, 3.07, 2.53, 2.45, 6.13, 3.44, 2.23, 2.47, 1.88, 3.18, 1.48, 2.35, 13.04, 2.05, 2.85, 1.05, 10.54, 1.67, 3.33, 0.49, 2.51, 8.95, 5.03, 5.62, 12.01, 1.36, 2.58, 3.08]} \ No newline at end of file diff --git a/annotations_filtered/j_sD0t5L8kE_filtered.json b/annotations_filtered/j_sD0t5L8kE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fdfc6fa07f98a0e10684d6249fdaa278525dc455 --- /dev/null +++ b/annotations_filtered/j_sD0t5L8kE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 20.16], [29.0, 32.0], [33.0, 37.25], [38.0, 41.86], [47.0, 48.0], [50.0, 50.62], [53.0, 53.77], [57.0, 58.09], [61.0, 62.61], [63.0, 65.08], [66.0, 70.19], [72.0, 72.89], [75.0, 76.05], [80.0, 81.31], [83.0, 85.62], [87.0, 89.02], [90.0, 91.62], [92.0, 92.65], [93.0, 95.37], [98.0, 99.27], [101.0, 104.4], [105.0, 107.32], [109.0, 113.51], [117.0, 118.5], [122.0, 123.79], [125.0, 126.55], [128.0, 128.58], [131.0, 133.05], [135.0, 136.02], [138.0, 139.72], [148.0, 149.2], [150.0, 151.38], [154.0, 156.05], [158.0, 158.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.0, 80.29, 95.09, 62.78, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 74.29, 0.0, 0.0, 0.0, 96.42, 52.51, 0.0, 0.0, 100.0, 0.0, 99.16, 42.22, 72.75, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.54], ["telephone", 8.26], ["radio", 5.26]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.16, 3.0, 4.25, 3.86, 1.0, 0.62, 0.77, 1.09, 1.61, 2.08, 4.19, 0.89, 1.05, 1.31, 2.62, 2.02, 1.62, 0.65, 2.37, 1.27, 3.4, 2.32, 4.51, 1.5, 1.79, 1.55, 0.58, 2.05, 1.02, 1.72, 1.2, 1.38, 2.05, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/j_txRPwTvpk_filtered.json b/annotations_filtered/j_txRPwTvpk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..771b42fca4b0fe6bc0005e997bb9180b56f3a10d --- /dev/null +++ b/annotations_filtered/j_txRPwTvpk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.66], [9.0, 8.97], [16.0, 16.61], [18.0, 19.35], [20.0, 22.55], [24.0, 25.35], [26.0, 27.72], [29.0, 29.76], [34.0, 34.15], [35.0, 35.9], [49.0, 49.05], [50.0, 50.45], [55.0, 55.71], [63.0, 81.87], [83.0, 85.5], [86.0, 86.8], [88.0, 91.64], [93.0, 93.38], [94.0, 96.16], [97.0, 98.25], [99.0, 100.18]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 27.9, 28.72, 0.0, 29.89, 0.0, 35.71, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["mains hum", 18.54], ["telephone", 14.49], ["hum", 14.3]], null, null, null, null, null, null, null, null, [["music", 41.63], ["noise", 15.58], ["hum", 6.0]], [["speech", 11.4], ["music", 6.57], ["insect", 5.26]], null, [["throbbing", 12.52], ["hum", 11.87], ["fly, housefly", 11.84]], null, [["cattle, bovinae", 50.41], ["moo", 26.23], ["livestock, farm animals, working animals", 21.5]], null, null], "duration": [0.66, -0.03, 0.61, 1.35, 2.55, 1.35, 1.72, 0.76, 0.15, 0.9, 0.05, 0.45, 0.71, 18.87, 2.5, 0.8, 3.64, 0.38, 2.16, 1.25, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/j_z70ZaqWUE_filtered.json b/annotations_filtered/j_z70ZaqWUE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1419d676ec3cceac97a9c2502c7af669e6c1dd1f --- /dev/null +++ b/annotations_filtered/j_z70ZaqWUE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.26], [13.0, 16.41], [20.0, 21.59], [24.0, 24.98], [25.0, 26.0], [27.0, 37.08], [45.0, 44.81], [50.0, 50.58], [58.0, 58.43], [60.0, 60.37], [61.0, 61.32], [78.0, 78.61], [83.0, 84.0], [88.0, 89.02], [90.0, 90.56], [91.0, 92.15], [94.0, 96.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.83, 0.0, 0.0, 0.0, 98.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.26, 3.41, 1.59, 0.98, 1.0, 10.08, -0.19, 0.58, 0.43, 0.37, 0.32, 0.61, 1.0, 1.02, 0.56, 1.15, 2.82]} \ No newline at end of file diff --git a/annotations_filtered/ja00D_L5tm8_filtered.json b/annotations_filtered/ja00D_L5tm8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a2ef8f0d0683038b1bf5eda033763681b4fcec8 --- /dev/null +++ b/annotations_filtered/ja00D_L5tm8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.51], [15.0, 24.12], [26.0, 28.49], [30.0, 35.24], [36.0, 37.89], [39.0, 40.04], [42.0, 43.9], [44.0, 44.85], [46.0, 58.56], [63.0, 71.68], [72.0, 75.47], [78.0, 79.83], [82.0, 81.7], [84.0, 85.24], [89.0, 90.14], [92.0, 92.69], [93.0, 93.23], [94.0, 95.44], [99.0, 100.08], [101.0, 102.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [76.2, 53.4, 75.39, 72.16, 0.0, 0.0, 0.0, 0.0, 91.13, 53.84, 64.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.51, 9.12, 2.49, 5.24, 1.89, 1.04, 1.9, 0.85, 12.56, 8.68, 3.47, 1.83, -0.3, 1.24, 1.14, 0.69, 0.23, 1.44, 1.08, 1.66]} \ No newline at end of file diff --git a/annotations_filtered/ja4l7-L7n6M_filtered.json b/annotations_filtered/ja4l7-L7n6M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..855cf58f1c2924635756a808483fac59a814d31d --- /dev/null +++ b/annotations_filtered/ja4l7-L7n6M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.53], [6.0, 8.29], [9.0, 12.9], [14.0, 16.07], [19.0, 37.22], [38.0, 38.57], [39.0, 40.83], [41.0, 42.63], [44.0, 46.84], [48.0, 54.11], [57.0, 74.83], [76.0, 78.53], [80.0, 80.69], [81.0, 83.25], [84.0, 86.27], [88.0, 88.65], [90.0, 90.15], [91.0, 92.25], [94.0, 94.74], [96.0, 99.35], [100.0, 100.25], [102.0, 103.08], [105.0, 104.57], [107.0, 110.94], [112.0, 113.27], [116.0, 119.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 65.2, 97.33, 98.99, 70.86, 0.0, 0.0, 0.0, 56.63, 46.36, 99.31, 96.17, 0.0, 100.0, 55.18, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 98.01, 0.0, 41.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 78.23], ["synthesizer", 3.8], ["speech", 2.93]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 23.86], ["music", 9.59], ["effects unit", 4.71]]], "duration": [0.53, 2.29, 3.9, 2.07, 18.22, 0.57, 1.83, 1.63, 2.84, 6.11, 17.83, 2.53, 0.69, 2.25, 2.27, 0.65, 0.15, 1.25, 0.74, 3.35, 0.25, 1.08, -0.43, 3.94, 1.27, 3.01]} \ No newline at end of file diff --git a/annotations_filtered/jaCofC2Bv-c_filtered.json b/annotations_filtered/jaCofC2Bv-c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c6f8e2b8694e8328818afe44fbe4a9c097ae0c4 --- /dev/null +++ b/annotations_filtered/jaCofC2Bv-c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.72], [4.0, 4.02], [8.0, 9.04], [11.0, 12.16], [13.0, 15.03], [18.0, 19.33], [21.0, 21.98], [29.0, 30.37], [35.0, 39.38], [40.0, 42.09], [43.0, 44.0], [49.0, 51.46], [52.0, 53.08], [54.0, 54.92], [56.0, 57.89], [59.0, 59.43], [61.0, 63.29], [64.0, 63.71], [64.0, 64.98], [69.0, 69.13], [78.0, 79.32], [82.0, 83.17], [84.0, 87.25], [88.0, 95.17], [96.0, 96.92], [99.0, 100.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0, 99.84, 77.2, 0.0, 71.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 46.02, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 78.58], ["speech", 12.59], ["thunk", 1.49]], null, null], "duration": [-0.28, 0.02, 1.04, 1.16, 2.03, 1.33, 0.98, 1.37, 4.38, 2.09, 1.0, 2.46, 1.08, 0.92, 1.89, 0.43, 2.29, -0.29, 0.98, 0.13, 1.32, 1.17, 3.25, 7.17, 0.92, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/jaM0sgoi0vw_filtered.json b/annotations_filtered/jaM0sgoi0vw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/jaM0sgoi0vw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/jaRbZJBLIQo_filtered.json b/annotations_filtered/jaRbZJBLIQo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38fb813c2bdfa171053cfa57bb733770f42f18fc --- /dev/null +++ b/annotations_filtered/jaRbZJBLIQo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.34], [8.0, 9.46], [14.0, 33.15], [38.0, 38.58], [41.0, 41.5], [43.0, 43.28], [48.0, 49.98], [57.0, 57.87], [61.0, 62.16], [73.0, 73.63], [78.0, 78.92], [89.0, 89.02], [90.0, 90.37], [101.0, 102.03]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 31.67], ["throbbing", 12.26], ["speech", 12.02]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.34, 1.46, 19.15, 0.58, 0.5, 0.28, 1.98, 0.87, 1.16, 0.63, 0.92, 0.02, 0.37, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/jaSSXV5AFHk_filtered.json b/annotations_filtered/jaSSXV5AFHk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a50400734df721ab07294453cbf865041e03c77a --- /dev/null +++ b/annotations_filtered/jaSSXV5AFHk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 49.98], [50.0, 59.51], [60.0, 67.78], [70.0, 72.1], [74.0, 74.41], [75.0, 77.03], [81.0, 83.17], [86.0, 91.2], [92.0, 94.64], [96.0, 96.85], [97.0, 97.43], [100.0, 100.68], [102.0, 102.76], [104.0, 106.32], [107.0, 108.35], [110.0, 112.6], [113.0, 113.97], [115.0, 116.45], [118.0, 120.43]], "keep_status": [false, false, true, false, false, false, true, true, true, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 33.9, 37.65, 56.86, 0.0, 39.34, 38.28, 41.1, 43.15, 0.0, 0.0, 0.0, 0.0, 49.45, 0.0, 37.44, 0.0, 0.0, 32.83], "audiomae_on_audioset": [null, [["music", 49.89], ["synthesizer", 18.67], ["musical instrument", 9.95]], [["music", 55.02], ["effects unit", 8.59], ["chorus effect", 6.33]], null, null, [["sidetone", 43.6], ["speech", 17.34], ["music", 12.73]], [["music", 48.39], ["musical instrument", 9.83], ["synthesizer", 9.27]], [["music", 32.94], ["hum", 19.89], ["mains hum", 9.05]], [["hum", 29.03], ["mains hum", 15.03], ["music", 11.26]], null, null, null, null, [["hum", 35.94], ["mains hum", 35.46], ["speech", 2.8]], null, [["music", 34.11], ["speech", 14.75], ["sidetone", 7.78]], null, null, [["hum", 32.38], ["gong", 18.74], ["mains hum", 12.63]]], "duration": [0.98, 9.51, 7.78, 2.1, 0.41, 2.03, 2.17, 5.2, 2.64, 0.85, 0.43, 0.68, 0.76, 2.32, 1.35, 2.6, 0.97, 1.45, 2.43]} \ No newline at end of file diff --git a/annotations_filtered/jagJeaLXRRQ_filtered.json b/annotations_filtered/jagJeaLXRRQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc9af6ec3f605c6c58b4f67e3936d28d70d5c866 --- /dev/null +++ b/annotations_filtered/jagJeaLXRRQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.18], [3.0, 3.82], [14.0, 14.18], [17.0, 19.68], [20.0, 30.08], [31.0, 31.41], [32.0, 33.57], [34.0, 34.65], [36.0, 37.1], [46.0, 58.36], [64.0, 65.18], [66.0, 66.36], [71.0, 71.49], [80.0, 88.15], [94.0, 94.63], [96.0, 102.69], [103.0, 107.67], [109.0, 110.91], [112.0, 112.18], [115.0, 116.16], [120.0, 120.07]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 99.95, 0.0, 0.0, 0.0, 0.0, 39.72, 0.0, 0.0, 0.0, 87.19, 0.0, 41.07, 48.65, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 17.19], ["hum", 14.15], ["hammer", 6.82]], null, null, null, null, null, [["radio", 19.17], ["speech", 17.32], ["bee, wasp, etc.", 11.08]], [["fly, housefly", 60.08], ["insect", 24.18], ["bee, wasp, etc.", 10.19]], null, null, null, null], "duration": [0.18, 0.82, 0.18, 2.68, 10.08, 0.41, 1.57, 0.65, 1.1, 12.36, 1.18, 0.36, 0.49, 8.15, 0.63, 6.69, 4.67, 1.91, 0.18, 1.16, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/jal6Pf2DFlg_filtered.json b/annotations_filtered/jal6Pf2DFlg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de28b379c41af7caa56c6de71237344c7964eeae --- /dev/null +++ b/annotations_filtered/jal6Pf2DFlg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.37], [12.0, 12.21], [13.0, 20.04], [21.0, 21.0], [23.0, 23.35], [26.0, 27.78], [32.0, 32.09], [33.0, 32.93], [46.0, 48.05], [50.0, 50.3], [53.0, 53.59], [54.0, 76.87], [81.0, 83.17], [85.0, 86.22], [89.0, 88.86], [91.0, 92.96], [97.0, 98.64], [101.0, 101.78], [104.0, 106.74], [110.0, 110.71], [113.0, 112.78], [114.0, 116.19], [116.0, 117.0], [118.0, 122.01], [123.0, 124.04], [126.0, 126.96], [132.0, 132.46], [135.0, 136.17], [140.0, 148.73], [150.0, 151.66], [154.0, 155.68], [158.0, 159.16], [163.0, 165.38]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.51, 0.0, 75.72, 0.0, 0.0, 0.0, 0.0, 0.0, 35.77, 0.0, 0.0, 56.63, 97.22, 0.0, 0.0, 0.0, 0.0, 0.0, 80.82, 0.0, 0.0, 96.54, 0.0, 98.19, 0.0, 0.0, 0.0, 0.0, 93.45, 0.0, 0.0, 0.0, 90.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 25.64], ["telephone", 24.79], ["busy signal", 16.86]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.37, 0.21, 7.04, 0.0, 0.35, 1.78, 0.09, -0.07, 2.05, 0.3, 0.59, 22.87, 2.17, 1.22, -0.14, 1.96, 1.64, 0.78, 2.74, 0.71, -0.22, 2.19, 1.0, 4.01, 1.04, 0.96, 0.46, 1.17, 8.73, 1.66, 1.68, 1.16, 2.38]} \ No newline at end of file diff --git a/annotations_filtered/javEwwHaNa4_filtered.json b/annotations_filtered/javEwwHaNa4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64aac5833db1a22377fe25f2da4b71030fcd4332 --- /dev/null +++ b/annotations_filtered/javEwwHaNa4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.4], [11.0, 13.58], [14.0, 18.59], [19.0, 33.56], [42.0, 45.4], [47.0, 48.9], [52.0, 59.83], [62.0, 75.17], [76.0, 81.84], [87.0, 103.82], [106.0, 110.89]], "keep_status": [false, false, false, false, true, false, false, false, false, true, true], "silence_prob": [71.43, 75.07, 69.34, 71.14, 34.35, 0.0, 31.73, 71.72, 71.0, 36.72, 34.75], "audiomae_on_audioset": [null, null, null, null, [["music", 32.53], ["didgeridoo", 5.94], ["speech", 4.73]], null, [["hum", 39.25], ["mains hum", 21.16], ["music", 17.45]], null, null, [["music", 44.92], ["guitar", 6.79], ["effects unit", 5.79]], [["music", 24.74], ["didgeridoo", 13.2], ["mosquito", 8.04]]], "duration": [2.4, 2.58, 4.59, 14.56, 3.4, 1.9, 7.83, 13.17, 5.84, 16.82, 4.89]} \ No newline at end of file diff --git a/annotations_filtered/jawZFND4Bfc_filtered.json b/annotations_filtered/jawZFND4Bfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ed3197a2c83bc74f07fa8912d5ebb9e01fedb83 --- /dev/null +++ b/annotations_filtered/jawZFND4Bfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 15.63], [16.0, 18.84], [24.0, 24.66], [31.0, 32.48], [34.0, 34.6], [37.0, 38.08], [46.0, 46.92], [47.0, 50.38], [51.0, 56.74], [63.0, 64.15], [64.0, 64.96], [69.0, 70.01], [80.0, 80.76], [81.0, 83.03], [84.0, 84.08], [86.0, 86.63], [90.0, 91.15], [92.0, 93.9], [108.0, 107.87], [111.0, 111.62], [125.0, 125.68], [142.0, 142.6], [143.0, 145.69], [151.0, 150.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.35, 98.27, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.72, 0.0], "audiomae_on_audioset": [[["music", 49.05], ["speech", 28.05], ["synthesizer", 2.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.63, 2.84, 0.66, 1.48, 0.6, 1.08, 0.92, 3.38, 5.74, 1.15, 0.96, 1.01, 0.76, 2.03, 0.08, 0.63, 1.15, 1.9, -0.13, 0.62, 0.68, 0.6, 2.69, -0.18]} \ No newline at end of file diff --git a/annotations_filtered/jb0Cjzd2lKU_filtered.json b/annotations_filtered/jb0Cjzd2lKU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f638340c455f371e0280930577e027819f12695 --- /dev/null +++ b/annotations_filtered/jb0Cjzd2lKU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.38], [4.0, 4.89], [6.0, 16.8], [18.0, 19.35], [21.0, 22.99], [23.0, 48.51], [50.0, 50.53], [52.0, 62.94], [65.0, 72.06]], "keep_status": [false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 31.62, 0.0, 0.0, 31.25, 0.0, 31.17, 30.01], "audiomae_on_audioset": [null, null, [["music", 52.13], ["electric shaver, electric razor", 18.09], ["speech", 7.85]], null, null, [["music", 25.62], ["electric shaver, electric razor", 22.0], ["hum", 18.33]], null, [["music", 23.66], ["hum", 18.55], ["mains hum", 17.46]], [["mains hum", 45.62], ["hum", 30.86], ["music", 7.05]]], "duration": [0.38, 0.89, 10.8, 1.35, 1.99, 25.51, 0.53, 10.94, 7.06]} \ No newline at end of file diff --git a/annotations_filtered/jbCyTUSQ6fY_filtered.json b/annotations_filtered/jbCyTUSQ6fY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..877f2a0eb13311e29684008e1c8cee425f2fd128 --- /dev/null +++ b/annotations_filtered/jbCyTUSQ6fY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.4], [10.0, 10.13], [34.0, 34.01], [41.0, 44.88], [48.0, 52.95], [54.0, 55.65], [60.0, 60.45], [62.0, 62.61], [73.0, 74.55], [79.0, 80.05], [87.0, 87.24], [88.0, 90.78], [94.0, 95.03], [96.0, 97.48], [106.0, 107.16], [111.0, 111.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 85.35, 81.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.55, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.4, 0.13, 0.01, 3.88, 4.95, 1.65, 0.45, 0.61, 1.55, 1.05, 0.24, 2.78, 1.03, 1.48, 1.16, 0.0]} \ No newline at end of file diff --git a/annotations_filtered/jbh5Q-eHULU_filtered.json b/annotations_filtered/jbh5Q-eHULU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39f9f715fedab4a9d74d0017e7530364b77ebd3c --- /dev/null +++ b/annotations_filtered/jbh5Q-eHULU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.67], [7.0, 10.56], [11.0, 17.47], [19.0, 20.07], [22.0, 27.8], [37.0, 42.48], [56.0, 57.82], [62.0, 62.99], [72.0, 74.63], [75.0, 77.14], [78.0, 77.82], [79.0, 79.07], [88.0, 89.02], [93.0, 93.53], [94.0, 95.3], [96.0, 97.7], [111.0, 111.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 97.54, 0.0, 65.67, 92.15, 0.0, 0.0, 98.8, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.67, 3.56, 6.47, 1.07, 5.8, 5.48, 1.82, 0.99, 2.63, 2.14, -0.18, 0.07, 1.02, 0.53, 1.3, 1.7, 0.15]} \ No newline at end of file diff --git a/annotations_filtered/jbvQvJV_97M_filtered.json b/annotations_filtered/jbvQvJV_97M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6a3f937cef5c7422ad173b25e40abcac764a719 --- /dev/null +++ b/annotations_filtered/jbvQvJV_97M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 38.48], [40.0, 41.07], [43.0, 43.85], [46.0, 46.89], [48.0, 48.59], [54.0, 54.5], [57.0, 57.86], [59.0, 60.05], [69.0, 71.04], [72.0, 85.09], [90.0, 90.95], [92.0, 92.47], [96.0, 122.61], [123.0, 124.5], [125.0, 127.87], [130.0, 132.7], [133.0, 144.44]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.98, 28.21, 0.0, 0.0, 28.62, 0.0, 28.43, 30.86, 29.49], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 39.96], ["music", 15.73], ["synthesizer", 5.07]], [["music", 42.95], ["hum", 17.24], ["mains hum", 10.58]], null, null, [["music", 30.96], ["hum", 16.89], ["mains hum", 10.45]], null, [["speech", 28.45], ["explosion", 25.07], ["burst, pop", 14.81]], [["music", 28.96], ["theremin", 16.47], ["didgeridoo", 7.62]], [["livestock, farm animals, working animals", 24.32], ["cattle, bovinae", 19.98], ["moo", 15.47]]], "duration": [1.48, 1.07, 0.85, 0.89, 0.59, 0.5, 0.86, 1.05, 2.04, 13.09, 0.95, 0.47, 26.61, 1.5, 2.87, 2.7, 11.44]} \ No newline at end of file diff --git a/annotations_filtered/jc2T3qbPJNI_filtered.json b/annotations_filtered/jc2T3qbPJNI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d884b6cdb1d5be09218621e1efaa1ade2d66f87 --- /dev/null +++ b/annotations_filtered/jc2T3qbPJNI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.58], [9.0, 8.56], [9.0, 9.04], [9.0, 9.07], [9.0, 30.54], [35.0, 56.57], [59.0, 61.16], [62.0, 66.23], [73.0, 73.36], [75.0, 75.09], [77.0, 78.21], [84.0, 84.28], [87.0, 86.97], [88.0, 88.84], [90.0, 92.4], [94.0, 95.39], [98.0, 108.65], [111.0, 124.53]], "keep_status": [false, false, false, false, true, false, true, true, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.54, 30.0, 32.56, 30.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.93, 0.0, 29.66, 29.82], "audiomae_on_audioset": [null, null, null, null, [["speech", 49.58], ["music", 14.47], ["whack, thwack", 4.74]], [["music", 67.57], ["synthesizer", 7.18], ["electronic music", 4.52]], [["music", 29.34], ["hum", 10.66], ["synthesizer", 10.57]], [["music", 53.04], ["throbbing", 6.48], ["hum", 6.45]], null, null, null, null, null, null, [["speech", 26.68], ["whale vocalization", 23.22], ["music", 10.08]], null, [["music", 64.8], ["musical instrument", 7.58], ["livestock, farm animals, working animals", 6.16]], [["whale vocalization", 11.76], ["music", 10.16], ["buzz", 8.28]]], "duration": [0.58, -0.44, 0.04, 0.07, 21.54, 21.57, 2.16, 4.23, 0.36, 0.09, 1.21, 0.28, -0.03, 0.84, 2.4, 1.39, 10.65, 13.53]} \ No newline at end of file diff --git a/annotations_filtered/jc6_XgtOQgI_filtered.json b/annotations_filtered/jc6_XgtOQgI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8014e5a725bee6e5439120e608b8beb36062cda4 --- /dev/null +++ b/annotations_filtered/jc6_XgtOQgI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.12], [27.0, 27.57], [30.0, 29.96], [33.0, 33.44], [37.0, 53.79], [55.0, 56.0], [56.0, 59.04], [59.0, 64.35]], "keep_status": [false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.3, 0.0, 38.21, 39.75], "audiomae_on_audioset": [null, null, null, null, [["speech", 70.78], ["mains hum", 6.27], ["hum", 4.66]], null, [["music", 22.33], ["moo", 19.55], ["cattle, bovinae", 18.9]], [["music", 38.59], ["horse", 9.33], ["clip-clop", 6.93]]], "duration": [1.12, 0.57, -0.04, 0.44, 16.79, 1.0, 3.04, 5.35]} \ No newline at end of file diff --git a/annotations_filtered/jcNFjpxU0E8_filtered.json b/annotations_filtered/jcNFjpxU0E8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55df4f022a6079cc861019be81a2fcb2c3fbd84b --- /dev/null +++ b/annotations_filtered/jcNFjpxU0E8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.89], [9.0, 11.06], [13.0, 13.36], [15.0, 14.99], [15.0, 16.5], [19.0, 28.66], [29.0, 29.46], [31.0, 31.35], [33.0, 33.49], [34.0, 35.46], [35.0, 35.51], [36.0, 35.92], [37.0, 45.37], [47.0, 51.04], [52.0, 60.15], [62.0, 65.74], [68.0, 75.09], [77.0, 78.51], [79.0, 79.56], [82.0, 83.71], [85.0, 86.44], [87.0, 87.94], [88.0, 92.3], [100.0, 101.11], [103.0, 103.42], [116.0, 118.44], [119.0, 121.1], [122.0, 123.13], [125.0, 125.04], [127.0, 128.58], [129.0, 129.81], [131.0, 132.63]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 33.24, 0.0, 0.0, 0.0, 31.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.53, 45.05, 35.29, 37.69, 40.93, 0.0, 0.0, 0.0, 0.0, 0.0, 35.85, 0.0, 0.0, 38.59, 34.42, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 14.77], ["fly, housefly", 9.52], ["speech", 7.09]], null, null, null, [["music", 58.17], ["musical instrument", 12.79], ["synthesizer", 6.92]], null, null, null, null, null, null, [["music", 49.67], ["brass instrument", 17.13], ["trumpet", 15.08]], [["insect", 36.87], ["fly, housefly", 29.34], ["bee, wasp, etc.", 11.12]], [["sidetone", 20.53], ["fly, housefly", 15.08], ["speech", 14.71]], [["stomach rumble", 8.56], ["insect", 8.05], ["patter", 7.49]], [["hum", 13.86], ["speech", 7.0], ["fly, housefly", 6.42]], null, null, null, null, null, [["fly, housefly", 32.81], ["insect", 24.55], ["speech", 19.98]], null, null, [["speech", 37.38], ["frog", 16.97], ["mains hum", 13.1]], [["fly, housefly", 31.09], ["insect", 18.65], ["bee, wasp, etc.", 13.05]], null, null, null, null, null], "duration": [1.89, 2.06, 0.36, -0.01, 1.5, 9.66, 0.46, 0.35, 0.49, 1.46, 0.51, -0.08, 8.37, 4.04, 8.15, 3.74, 7.09, 1.51, 0.56, 1.71, 1.44, 0.94, 4.3, 1.11, 0.42, 2.44, 2.1, 1.13, 0.04, 1.58, 0.81, 1.63]} \ No newline at end of file diff --git a/annotations_filtered/jcTv-BEwabk_filtered.json b/annotations_filtered/jcTv-BEwabk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..473b6bf556648f0801ff87a5b5487644b3617bf7 --- /dev/null +++ b/annotations_filtered/jcTv-BEwabk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.17], [8.0, 8.88], [19.0, 19.94], [23.0, 23.87], [27.0, 28.73], [31.0, 31.58], [34.0, 35.4], [37.0, 38.37], [40.0, 40.42], [44.0, 45.45], [47.0, 47.78], [52.0, 52.47], [54.0, 55.46], [57.0, 58.28], [62.0, 63.63], [64.0, 65.74], [69.0, 69.69], [71.0, 72.18], [73.0, 73.89], [75.0, 75.78], [76.0, 76.18], [77.0, 77.8], [79.0, 80.16], [81.0, 82.0], [85.0, 87.45], [90.0, 90.31], [94.0, 94.86], [101.0, 101.56], [105.0, 105.56], [109.0, 109.16], [111.0, 112.36], [113.0, 114.56], [118.0, 117.95], [119.0, 119.38], [122.0, 123.18], [124.0, 124.9], [126.0, 126.42], [128.0, 128.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.17, 0.88, 0.94, 0.87, 1.73, 0.58, 1.4, 1.37, 0.42, 1.45, 0.78, 0.47, 1.46, 1.28, 1.63, 1.74, 0.69, 1.18, 0.89, 0.78, 0.18, 0.8, 1.16, 1.0, 2.45, 0.31, 0.86, 0.56, 0.56, 0.16, 1.36, 1.56, -0.05, 0.38, 1.18, 0.9, 0.42, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/jcmTZfv5z-k_filtered.json b/annotations_filtered/jcmTZfv5z-k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1551a5c0614d23b66b664cd93c1debd0b4b1e27e --- /dev/null +++ b/annotations_filtered/jcmTZfv5z-k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 23.09]], "keep_status": [true], "silence_prob": [31.52], "audiomae_on_audioset": [[["hum", 23.23], ["music", 13.28], ["mains hum", 6.67]]], "duration": [22.09]} \ No newline at end of file diff --git a/annotations_filtered/jd3KM4imjr4_filtered.json b/annotations_filtered/jd3KM4imjr4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f2686d08f9fccef696689a160b43300aacca0d2 --- /dev/null +++ b/annotations_filtered/jd3KM4imjr4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 31.87], [34.0, 39.68], [49.0, 55.92], [59.0, 60.13], [63.0, 63.66], [64.0, 64.88], [73.0, 74.04], [80.0, 80.69], [81.0, 82.88], [84.0, 89.63], [90.0, 91.83], [93.0, 94.24], [97.0, 98.52]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [87.55, 81.71, 33.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.27, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["thunk", 18.76], ["fly, housefly", 12.48], ["livestock, farm animals, working animals", 11.24]], null, null, null, null, null, null, null, null, null, null], "duration": [15.87, 5.68, 6.92, 1.13, 0.66, 0.88, 1.04, 0.69, 1.88, 5.63, 1.83, 1.24, 1.52]} \ No newline at end of file diff --git a/annotations_filtered/jd4tpvAcKYA_filtered.json b/annotations_filtered/jd4tpvAcKYA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27efa9ac0c6587a76a369553dd13cd370e49c3ce --- /dev/null +++ b/annotations_filtered/jd4tpvAcKYA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.16], [7.0, 7.21], [8.0, 8.9], [9.0, 9.93], [10.0, 11.57], [12.0, 13.74], [17.0, 17.52], [22.0, 22.18], [24.0, 24.46], [25.0, 25.81], [27.0, 27.36], [28.0, 29.59], [32.0, 32.04], [33.0, 34.13], [35.0, 35.36], [36.0, 38.84], [40.0, 41.05], [44.0, 44.29], [48.0, 48.95], [53.0, 54.77], [56.0, 56.47], [60.0, 62.87], [64.0, 65.6], [68.0, 69.06], [71.0, 71.69], [74.0, 74.61], [76.0, 76.57], [78.0, 78.39], [80.0, 80.3], [81.0, 81.84], [83.0, 83.51], [90.0, 90.93], [91.0, 93.87], [95.0, 96.21], [97.0, 97.8], [99.0, 98.78], [100.0, 100.63], [106.0, 106.78], [109.0, 109.11], [113.0, 113.86], [114.0, 116.78], [121.0, 123.97], [127.0, 127.52], [130.0, 131.87], [135.0, 136.0], [137.0, 139.21], [140.0, 140.86], [142.0, 143.01], [149.0, 149.5], [151.0, 151.28], [152.0, 153.49], [154.0, 159.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.42, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.89, 99.84, 0.0, 0.0, 0.0, 94.07, 0.0, 0.0, 0.0, 0.0, 0.0, 97.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.16, 0.21, 0.9, 0.93, 1.57, 1.74, 0.52, 0.18, 0.46, 0.81, 0.36, 1.59, 0.04, 1.13, 0.36, 2.84, 1.05, 0.29, 0.95, 1.77, 0.47, 2.87, 1.6, 1.06, 0.69, 0.61, 0.57, 0.39, 0.3, 0.84, 0.51, 0.93, 2.87, 1.21, 0.8, -0.22, 0.63, 0.78, 0.11, 0.86, 2.78, 2.97, 0.52, 1.87, 1.0, 2.21, 0.86, 1.01, 0.5, 0.28, 1.49, 5.66]} \ No newline at end of file diff --git a/annotations_filtered/jdZ6RA_c6oE_filtered.json b/annotations_filtered/jdZ6RA_c6oE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36524b7f40f51cb1446c5ab103ef3e60b79fbd99 --- /dev/null +++ b/annotations_filtered/jdZ6RA_c6oE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.08], [5.0, 4.68], [9.0, 9.39], [11.0, 11.8], [39.0, 39.39], [45.0, 47.06], [48.0, 55.95], [59.0, 59.14], [60.0, 61.62], [63.0, 67.17]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 84.98, 38.68, 0.0, 0.0, 34.44], "audiomae_on_audioset": [null, null, null, null, null, null, [["crowd", 46.34], ["cheering", 20.22], ["speech", 15.31]], null, null, [["speech", 29.36], ["crowd", 11.16], ["sheep", 9.17]]], "duration": [1.08, -0.32, 0.39, 0.8, 0.39, 2.06, 7.95, 0.14, 1.62, 4.17]} \ No newline at end of file diff --git a/annotations_filtered/jdd1py-ilwc_filtered.json b/annotations_filtered/jdd1py-ilwc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ecb3d17d0606713bda21acb9e0e23355200d035 --- /dev/null +++ b/annotations_filtered/jdd1py-ilwc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.43], [23.0, 24.22], [25.0, 26.4], [31.0, 31.75], [33.0, 33.44], [37.0, 38.1], [41.0, 42.06], [45.0, 45.89], [47.0, 47.49], [52.0, 52.93], [62.0, 66.53], [77.0, 88.53], [89.0, 90.8], [94.0, 105.85], [113.0, 112.68], [114.0, 117.39], [122.0, 125.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [99.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.14, 37.24, 0.0, 46.05, 0.0, 77.7, 34.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 63.79], ["animal", 3.88], ["dog", 3.76]], [["music", 63.99], ["didgeridoo", 14.48], ["speech", 13.21]], null, [["music", 66.77], ["synthesizer", 5.17], ["ding", 3.02]], null, null, [["speech", 37.01], ["music", 28.57], ["musical instrument", 4.0]]], "duration": [3.43, 1.22, 1.4, 0.75, 0.44, 1.1, 1.06, 0.89, 0.49, 0.93, 4.53, 11.53, 1.8, 11.85, -0.32, 3.39, 3.17]} \ No newline at end of file diff --git a/annotations_filtered/jeYdR_r0iGo_filtered.json b/annotations_filtered/jeYdR_r0iGo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f567873396044dcbd5fc951f24938253f5018246 --- /dev/null +++ b/annotations_filtered/jeYdR_r0iGo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 21.37], [22.0, 23.97], [25.0, 27.5], [30.0, 31.28], [34.0, 34.69], [36.0, 36.02], [39.0, 39.34], [47.0, 48.07], [49.0, 58.06], [61.0, 61.45], [70.0, 104.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.97, 0.0, 97.54, 0.0, 0.0, 0.0, 0.0, 0.0, 50.51, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [5.37, 1.97, 2.5, 1.28, 0.69, 0.02, 0.34, 1.07, 9.06, 0.45, 34.19]} \ No newline at end of file diff --git a/annotations_filtered/jeoUH00woxs_filtered.json b/annotations_filtered/jeoUH00woxs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89dafb736c8d99cd4613a5ef6e5bbdc5f4827418 --- /dev/null +++ b/annotations_filtered/jeoUH00woxs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.81], [7.0, 8.95], [10.0, 11.42], [15.0, 15.53], [16.0, 16.19], [17.0, 19.85], [22.0, 22.49], [27.0, 27.46], [29.0, 30.23], [31.0, 32.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 81.89, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [1.81, 1.95, 1.42, 0.53, 0.19, 2.85, 0.49, 0.46, 1.23, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/jepTSaMF2ZM_filtered.json b/annotations_filtered/jepTSaMF2ZM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73e40e94dcf189750678535b0e8a8921fb68e03c --- /dev/null +++ b/annotations_filtered/jepTSaMF2ZM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.11], [6.0, 6.91], [14.0, 14.47], [36.0, 36.24], [38.0, 40.49], [41.0, 54.6], [57.0, 60.86], [73.0, 74.46], [76.0, 77.4], [78.0, 83.57], [89.0, 90.34], [91.0, 93.23], [95.0, 96.82], [100.0, 100.35], [105.0, 105.7], [106.0, 107.92], [110.0, 112.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 0.0, 0.0, 0.0, 100.0, 97.73, 70.02, 0.0, 0.0, 55.11, 0.0, 57.64, 0.0, 0.0, 0.0, 0.0, 47.08], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 53.28], ["synthesizer", 15.93], ["musical instrument", 3.89]]], "duration": [2.11, 0.91, 0.47, 0.24, 2.49, 13.6, 3.86, 1.46, 1.4, 5.57, 1.34, 2.23, 1.82, 0.35, 0.7, 1.92, 2.31]} \ No newline at end of file diff --git a/annotations_filtered/jf9d3cwVWBY_filtered.json b/annotations_filtered/jf9d3cwVWBY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b634a8366a7616ac4f2c4d63fd7cdc3d97e40d6f --- /dev/null +++ b/annotations_filtered/jf9d3cwVWBY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 46.67], [87.0, 87.56], [108.0, 109.95], [113.0, 113.0]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.67, 0.56, 1.95, 0.0]} \ No newline at end of file diff --git a/annotations_filtered/jfA6jr-y7_A_filtered.json b/annotations_filtered/jfA6jr-y7_A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca35ab9db77c57046493e65c128096d2b31acd13 --- /dev/null +++ b/annotations_filtered/jfA6jr-y7_A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.31], [18.0, 18.12], [24.0, 25.25], [37.0, 37.45], [52.0, 52.05], [57.0, 59.27], [62.0, 62.65], [64.0, 64.86], [68.0, 70.07], [75.0, 74.85], [79.0, 80.54], [81.0, 81.62], [83.0, 83.81], [88.0, 93.14], [94.0, 99.27], [104.0, 104.03], [112.0, 111.84], [112.0, 124.82], [129.0, 129.64], [138.0, 141.32], [141.0, 141.42]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 47.66, 0.0, 0.0, 42.86, 0.0, 0.0, 0.0, 0.0, 29.55, 29.71, 0.0, 0.0, 32.17, 0.0, 40.11, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["fart", 54.26], ["speech", 15.71], ["burping, eructation", 5.7]], null, null, [["sidetone", 26.36], ["speech", 23.34], ["music", 10.5]], null, null, null, null, [["music", 51.86], ["musical instrument", 8.85], ["synthesizer", 7.83]], [["music", 64.19], ["electronic music", 9.34], ["speech", 4.76]], null, null, [["music", 52.62], ["speech", 28.65], ["electronic music", 3.88]], null, [["speech", 87.95], ["inside, small room", 2.07], ["music", 1.24]], null], "duration": [1.31, 0.12, 1.25, 0.45, 0.05, 2.27, 0.65, 0.86, 2.07, -0.15, 1.54, 0.62, 0.81, 5.14, 5.27, 0.03, -0.16, 12.82, 0.64, 3.32, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/jfYvV2tBEz0_filtered.json b/annotations_filtered/jfYvV2tBEz0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d477ae79530ccfd3b556259c9ed1bd426bd1148a --- /dev/null +++ b/annotations_filtered/jfYvV2tBEz0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 16.82], [17.0, 52.17], [53.0, 58.92], [59.0, 60.18], [61.0, 62.06], [63.0, 86.58]], "keep_status": [false, false, false, false, false, false], "silence_prob": [56.93, 0.0, 99.85, 0.0, 0.0, 87.19], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [7.82, 35.17, 5.92, 1.18, 1.06, 23.58]} \ No newline at end of file diff --git a/annotations_filtered/jfgWw43Fcuw_filtered.json b/annotations_filtered/jfgWw43Fcuw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25f5995ebf969f91326cba2715fa17b19cfb8de7 --- /dev/null +++ b/annotations_filtered/jfgWw43Fcuw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[80.0, 80.54], [89.0, 98.37], [98.0, 98.98], [101.0, 101.55], [106.0, 125.66], [126.0, 127.26]], "keep_status": [false, true, false, false, false, false], "silence_prob": [0.0, 30.22, 0.0, 0.0, 28.83, 0.0], "audiomae_on_audioset": [null, [["speech", 42.62], ["music", 23.15], ["theremin", 2.74]], null, null, [["speech", 49.38], ["music", 20.14], ["sound effect", 3.3]], null], "duration": [0.54, 9.37, 0.98, 0.55, 19.66, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/jfhEIIK-jB8_filtered.json b/annotations_filtered/jfhEIIK-jB8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5590bc869c913da6ea6d685f474467c4b66cc652 --- /dev/null +++ b/annotations_filtered/jfhEIIK-jB8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.13], [4.0, 4.41], [8.0, 9.98], [17.0, 17.17], [19.0, 19.85], [34.0, 34.13], [35.0, 35.72], [39.0, 39.78], [41.0, 42.35], [43.0, 43.9], [45.0, 47.06], [54.0, 55.02], [58.0, 64.52], [70.0, 84.72], [87.0, 101.88], [105.0, 105.9], [107.0, 108.16], [109.0, 114.61], [118.0, 146.48], [149.0, 179.12], [185.0, 191.71], [201.0, 216.33], [219.0, 222.3], [223.0, 224.06], [225.0, 229.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.64, 0.0, 33.63, 29.63, 28.42, 0.0, 0.0, 28.5, 27.94, 0.0, 29.73, 28.67, 94.07, 0.0, 61.57], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 47.84], ["music", 34.05], ["thunk", 12.08]], [["music", 53.48], ["throbbing", 12.64], ["hum", 10.28]], [["music", 62.45], ["synthesizer", 10.71], ["musical instrument", 4.78]], null, null, [["music", 66.33], ["throbbing", 7.15], ["didgeridoo", 5.05]], [["music", 67.63], ["speech", 16.02], ["theremin", 2.3]], null, [["speech", 31.96], ["music", 23.1], ["buzz", 8.06]], [["music", 32.51], ["mains hum", 7.98], ["hum", 6.49]], null, null, null], "duration": [0.13, 0.41, 1.98, 0.17, 0.85, 0.13, 0.72, 0.78, 1.35, 0.9, 2.06, 1.02, 6.52, 14.72, 14.88, 0.9, 1.16, 5.61, 28.48, 30.12, 6.71, 15.33, 3.3, 1.06, 4.63]} \ No newline at end of file diff --git a/annotations_filtered/jgBGoS4a5rc_filtered.json b/annotations_filtered/jgBGoS4a5rc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da9a43b822d2cb18b028a9e75a351d34b7fa64b5 --- /dev/null +++ b/annotations_filtered/jgBGoS4a5rc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.45], [13.0, 17.05], [18.0, 19.14], [22.0, 21.69], [23.0, 26.5], [28.0, 28.41], [31.0, 31.82], [33.0, 32.93], [35.0, 35.09], [40.0, 41.72], [46.0, 46.36], [48.0, 51.16], [54.0, 55.27], [57.0, 58.09], [59.0, 58.82], [60.0, 60.35], [61.0, 70.77], [81.0, 81.65], [90.0, 90.49], [93.0, 95.5], [98.0, 99.13], [107.0, 107.77], [110.0, 110.93], [112.0, 112.02], [115.0, 116.16], [118.0, 119.31], [121.0, 122.5], [125.0, 127.06], [131.0, 131.4], [132.0, 132.27], [133.0, 133.12], [133.0, 134.13], [135.0, 135.9], [136.0, 154.65], [158.0, 159.8], [163.0, 165.08], [171.0, 174.72], [177.0, 182.49], [184.0, 184.67]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [47.27, 46.57, 0.0, 0.0, 56.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.68, 0.0, 0.0, 0.0, 0.0, 50.16, 0.0, 0.0, 52.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.74, 0.0, 0.0, 0.0, 0.0, 0.0, 33.32, 0.0, 32.38, 31.33, 30.98, 0.0], "audiomae_on_audioset": [[["music", 14.67], ["burping, eructation", 13.82], ["sine wave", 13.45]], [["speech", 55.06], ["gears", 3.85], ["mechanisms", 3.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 39.46], ["hum", 18.08], ["music", 12.13]], null, null, null, null, null, [["music", 51.59], ["speech", 16.0], ["synthesizer", 7.23]], null, [["music", 48.03], ["throbbing", 8.84], ["drum machine", 7.7]], [["music", 66.51], ["electronic music", 9.18], ["dubstep", 6.0]], [["music", 75.85], ["electronic music", 2.69], ["speech", 2.53]], null], "duration": [4.45, 4.05, 1.14, -0.31, 3.5, 0.41, 0.82, -0.07, 0.09, 1.72, 0.36, 3.16, 1.27, 1.09, -0.18, 0.35, 9.77, 0.65, 0.49, 2.5, 1.13, 0.77, 0.93, 0.02, 1.16, 1.31, 1.5, 2.06, 0.4, 0.27, 0.12, 1.13, 0.9, 18.65, 1.8, 2.08, 3.72, 5.49, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/jgOMHLuBup4_filtered.json b/annotations_filtered/jgOMHLuBup4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6f812359a390cc85c71b90200ca780c7eb09037 --- /dev/null +++ b/annotations_filtered/jgOMHLuBup4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.68], [23.0, 31.75], [33.0, 52.39], [53.0, 54.19], [55.0, 61.15], [62.0, 71.1], [72.0, 73.99], [77.0, 85.38], [87.0, 88.86], [97.0, 99.5], [101.0, 101.29], [103.0, 103.81], [107.0, 108.45]], "keep_status": [false, false, false, false, true, true, false, true, false, true, false, false, false], "silence_prob": [0.0, 49.92, 32.39, 0.0, 36.6, 35.4, 0.0, 33.56, 0.0, 32.99, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 39.53], ["throbbing", 23.88], ["hum", 21.56]], [["music", 36.94], ["throbbing", 32.45], ["speech", 11.92]], null, [["hum", 24.98], ["music", 20.63], ["throbbing", 15.94]], [["music", 21.49], ["speech", 20.47], ["throbbing", 14.41]], null, [["music", 26.23], ["speech", 20.26], ["throbbing", 11.48]], null, [["music", 39.13], ["speech", 14.44], ["musical instrument", 2.7]], null, null, null], "duration": [0.68, 8.75, 19.39, 1.19, 6.15, 9.1, 1.99, 8.38, 1.86, 2.5, 0.29, 0.81, 1.45]} \ No newline at end of file diff --git a/annotations_filtered/jgcD-DHpPR0_filtered.json b/annotations_filtered/jgcD-DHpPR0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9fe1fb1195497de97f0863f910e71166cd03d875 --- /dev/null +++ b/annotations_filtered/jgcD-DHpPR0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[83.0, 83.46], [86.0, 87.56], [90.0, 91.5], [93.0, 92.92], [96.0, 103.42], [105.0, 105.88], [108.0, 109.49], [112.0, 112.02], [114.0, 114.17], [115.0, 115.52], [117.0, 117.86], [119.0, 120.39], [121.0, 121.54], [127.0, 126.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.46, 1.56, 1.5, -0.08, 7.42, 0.88, 1.49, 0.02, 0.17, 0.52, 0.86, 1.39, 0.54, -0.31]} \ No newline at end of file diff --git a/annotations_filtered/jgk96izcJbw_filtered.json b/annotations_filtered/jgk96izcJbw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6741e8bcb89549bc509807bdda6aefb3c05a5059 --- /dev/null +++ b/annotations_filtered/jgk96izcJbw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.84], [10.0, 10.79], [15.0, 33.54], [34.0, 37.15], [41.0, 43.95], [45.0, 46.23], [47.0, 69.11], [72.0, 100.48], [102.0, 149.1]], "keep_status": [false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 42.53, 50.61, 77.36, 0.0, 31.45, 29.4, 0.0], "audiomae_on_audioset": [null, null, [["music", 38.53], ["speech", 10.23], ["hum", 8.81]], null, null, null, [["throbbing", 30.89], ["music", 29.81], ["hum", 14.54]], [["throbbing", 36.48], ["hum", 35.54], ["music", 16.35]], null], "duration": [0.84, 0.79, 18.54, 3.15, 2.95, 1.23, 22.11, 28.48, 47.1]} \ No newline at end of file diff --git a/annotations_filtered/jgosH8zc83Q_filtered.json b/annotations_filtered/jgosH8zc83Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34de6f5a7ee7c7ef80a1a06297011ed149ecd191 --- /dev/null +++ b/annotations_filtered/jgosH8zc83Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.16], [6.0, 7.16], [8.0, 8.51], [10.0, 11.84], [13.0, 13.02], [15.0, 17.64], [19.0, 20.09], [27.0, 27.51], [29.0, 29.52], [31.0, 31.16], [32.0, 35.58], [39.0, 39.63], [40.0, 41.42], [44.0, 44.04], [45.0, 44.93], [46.0, 46.3], [46.0, 46.77], [52.0, 52.84], [54.0, 54.95], [58.0, 59.29], [61.0, 61.48], [62.0, 62.7], [63.0, 63.95], [64.0, 64.91], [66.0, 65.87], [66.0, 67.56], [69.0, 69.85], [73.0, 87.56], [89.0, 90.12], [93.0, 93.31], [95.0, 95.3], [96.0, 96.92], [98.0, 98.78], [101.0, 101.93], [105.0, 105.46], [106.0, 106.73], [109.0, 111.43], [116.0, 116.46], [118.0, 118.72], [120.0, 120.19], [125.0, 125.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 67.51, 0.0, 0.0, 0.0, 0.0, 48.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["mains hum", 20.41], ["hum", 18.47], ["music", 8.15]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.88], ["foghorn", 5.62], ["brass instrument", 5.21]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 1.16, 0.51, 1.84, 0.02, 2.64, 1.09, 0.51, 0.52, 0.16, 3.58, 0.63, 1.42, 0.04, -0.07, 0.3, 0.77, 0.84, 0.95, 1.29, 0.48, 0.7, 0.95, 0.91, -0.13, 1.56, 0.85, 14.56, 1.12, 0.31, 0.3, 0.92, 0.78, 0.93, 0.46, 0.73, 2.43, 0.46, 0.72, 0.19, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/jgvj0XwxagY_filtered.json b/annotations_filtered/jgvj0XwxagY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc5da0f3aed60d4bb942639adc9e265aa322f170 --- /dev/null +++ b/annotations_filtered/jgvj0XwxagY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 72.12]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [69.12]} \ No newline at end of file diff --git a/annotations_filtered/jh_EME9M-mg_filtered.json b/annotations_filtered/jh_EME9M-mg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fb92a8487641ef380b35c8004bccbbc1b0c8646 --- /dev/null +++ b/annotations_filtered/jh_EME9M-mg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 39.09], [40.0, 40.61], [42.0, 57.0], [60.0, 60.96], [64.0, 65.62], [67.0, 69.9], [75.0, 84.97], [87.0, 87.35]], "keep_status": [true, false, false, false, false, true, true, false], "silence_prob": [43.9, 0.0, 68.8, 0.0, 0.0, 39.64, 37.02, 0.0], "audiomae_on_audioset": [[["speech", 35.25], ["animal", 7.72], ["fart", 4.48]], null, null, null, null, [["speech", 27.29], ["sidetone", 20.35], ["music", 6.27]], [["music", 33.96], ["pant", 17.45], ["beatboxing", 5.83]], null], "duration": [14.09, 0.61, 15.0, 0.96, 1.62, 2.9, 9.97, 0.35]} \ No newline at end of file diff --git a/annotations_filtered/ji4pvRXDMOY_filtered.json b/annotations_filtered/ji4pvRXDMOY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81b16fba88ff3c6619e402f36c8bec89819cca09 --- /dev/null +++ b/annotations_filtered/ji4pvRXDMOY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.19], [6.0, 6.93], [8.0, 8.97], [15.0, 21.09], [24.0, 28.61], [29.0, 29.52], [30.0, 32.24], [35.0, 35.26], [39.0, 40.76], [43.0, 42.9], [63.0, 63.8], [64.0, 64.07], [64.0, 64.29], [66.0, 66.11], [68.0, 67.88], [68.0, 68.74], [69.0, 77.65], [83.0, 82.92], [85.0, 91.99]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 38.71, 63.42, 0.0, 44.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.53, 0.0, 49.09], "audiomae_on_audioset": [null, null, null, [["music", 47.0], ["didgeridoo", 14.72], ["speech", 10.13]], null, null, [["boing", 28.93], ["baby laughter", 21.32], ["giggle", 12.68]], null, null, null, null, null, null, null, null, null, [["speech", 34.11], ["boing", 25.23], ["music", 9.88]], null, [["rumble", 21.45], ["hum", 13.83], ["music", 12.86]]], "duration": [1.19, 0.93, 0.97, 6.09, 4.61, 0.52, 2.24, 0.26, 1.76, -0.1, 0.8, 0.07, 0.29, 0.11, -0.12, 0.74, 8.65, -0.08, 6.99]} \ No newline at end of file diff --git a/annotations_filtered/ji9C_R6HLvg_filtered.json b/annotations_filtered/ji9C_R6HLvg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae8edea5dd07816d6da5825ea6871ff6cf6332cb --- /dev/null +++ b/annotations_filtered/ji9C_R6HLvg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.57], [7.0, 10.79], [12.0, 12.39], [13.0, 14.01], [17.0, 17.15], [28.0, 28.9], [38.0, 37.94], [39.0, 41.34], [43.0, 43.85], [45.0, 45.45], [47.0, 50.8], [63.0, 75.68], [77.0, 78.48], [80.0, 82.65], [84.0, 87.3], [88.0, 89.75], [92.0, 122.22], [129.0, 130.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 68.93, 0.0, 0.0, 0.0, 0.0, 0.0, 94.22, 0.0, 0.0, 31.19, 99.59, 0.0, 97.22, 99.4, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["sidetone", 34.79], ["speech", 31.8], ["music", 8.48]], null, null, null, null, null, null, null], "duration": [1.57, 3.79, 0.39, 1.01, 0.15, 0.9, -0.06, 2.34, 0.85, 0.45, 3.8, 12.68, 1.48, 2.65, 3.3, 1.75, 30.22, 1.22]} \ No newline at end of file diff --git a/annotations_filtered/jiHXahhmzjw_filtered.json b/annotations_filtered/jiHXahhmzjw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f5cec812587d2828a802d92df353876ae56d2fc --- /dev/null +++ b/annotations_filtered/jiHXahhmzjw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.6], [15.0, 16.34], [17.0, 17.34], [20.0, 21.42], [24.0, 39.24], [41.0, 46.33], [47.0, 47.06], [49.0, 49.55], [55.0, 55.71], [57.0, 58.04], [63.0, 63.22], [67.0, 68.23], [75.0, 75.57], [78.0, 78.22], [84.0, 85.55], [88.0, 89.43], [106.0, 106.91], [109.0, 110.61], [114.0, 114.51], [119.0, 119.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.64, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.6, 1.34, 0.34, 1.42, 15.24, 5.33, 0.06, 0.55, 0.71, 1.04, 0.22, 1.23, 0.57, 0.22, 1.55, 1.43, 0.91, 1.61, 0.51, 0.99]} \ No newline at end of file diff --git a/annotations_filtered/jiP6PiKJLUs_filtered.json b/annotations_filtered/jiP6PiKJLUs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9d6754adf65e30b7d5642989bad33fc710895de --- /dev/null +++ b/annotations_filtered/jiP6PiKJLUs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 22.65], [24.0, 24.6], [31.0, 31.78], [36.0, 36.73], [43.0, 43.09], [45.0, 46.33], [47.0, 50.5], [58.0, 74.98], [76.0, 76.15], [77.0, 76.84], [80.0, 82.65], [84.0, 87.17], [88.0, 92.45], [93.0, 96.43], [97.0, 110.34], [114.0, 122.94], [128.0, 128.61], [130.0, 130.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false], "silence_prob": [33.65, 0.0, 0.0, 0.0, 0.0, 0.0, 44.4, 36.64, 0.0, 0.0, 40.82, 100.0, 100.0, 93.6, 35.46, 31.98, 0.0, 0.0], "audiomae_on_audioset": [[["music", 64.51], ["theremin", 12.54], ["synthesizer", 4.52]], null, null, null, null, null, [["speech", 81.04], ["radio", 9.05], ["sidetone", 4.25]], [["music", 62.64], ["synthesizer", 9.44], ["musical instrument", 6.71]], null, null, [["dog", 12.99], ["speech", 11.71], ["animal", 9.97]], null, null, null, [["music", 34.64], ["speech", 20.0], ["theremin", 15.01]], [["speech", 27.23], ["theremin", 23.45], ["music", 9.03]], null, null], "duration": [12.65, 0.6, 0.78, 0.73, 0.09, 1.33, 3.5, 16.98, 0.15, -0.16, 2.65, 3.17, 4.45, 3.43, 13.34, 8.94, 0.61, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/jihDFIqNz1s_filtered.json b/annotations_filtered/jihDFIqNz1s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..432fd6ad32b078bb1b537f4a609e55192a903c85 --- /dev/null +++ b/annotations_filtered/jihDFIqNz1s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.62], [9.0, 10.0], [11.0, 17.64], [19.0, 20.9], [24.0, 24.46], [26.0, 26.6], [27.0, 28.98], [31.0, 31.02], [34.0, 37.44], [38.0, 40.54], [44.0, 47.51], [50.0, 50.45], [52.0, 52.96], [54.0, 54.82], [56.0, 57.25], [59.0, 59.95], [63.0, 64.03], [66.0, 66.19], [69.0, 69.45], [71.0, 71.27], [72.0, 72.86], [76.0, 77.11], [79.0, 79.29], [81.0, 82.04], [83.0, 84.15], [85.0, 85.7], [90.0, 95.3], [96.0, 97.01], [98.0, 100.53], [105.0, 105.09], [106.0, 107.4], [110.0, 112.33], [113.0, 113.51], [115.0, 115.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 88.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.09, 0.0, 99.16, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 1.0, 6.64, 1.9, 0.46, 0.6, 1.98, 0.02, 3.44, 2.54, 3.51, 0.45, 0.96, 0.82, 1.25, 0.95, 1.03, 0.19, 0.45, 0.27, 0.86, 1.11, 0.29, 1.04, 1.15, 0.7, 5.3, 1.01, 2.53, 0.09, 1.4, 2.33, 0.51, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/jj1lH26Ky08_filtered.json b/annotations_filtered/jj1lH26Ky08_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4af82a04941f63dff452add54fc7889e7902428e --- /dev/null +++ b/annotations_filtered/jj1lH26Ky08_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.51], [3.0, 3.91], [5.0, 5.37], [8.0, 8.45], [10.0, 11.15], [12.0, 12.83], [14.0, 14.37], [15.0, 15.62], [17.0, 18.81], [20.0, 20.68], [21.0, 21.73], [23.0, 26.62], [27.0, 67.05], [68.0, 70.38], [71.0, 71.83], [73.0, 92.99], [95.0, 96.85], [98.0, 101.43], [102.0, 102.46], [104.0, 116.09], [119.0, 121.05], [122.0, 125.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.07, 0.0, 73.51, 0.0, 49.22, 0.0, 90.25, 0.0, 73.06, 68.93, 49.04], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["telephone", 73.97], ["telephone bell ringing", 19.27], ["telephone dialing, dtmf", 1.9]], null, null, null, null, null, [["speech", 42.68], ["mains hum", 18.88], ["hum", 13.6]]], "duration": [0.51, 0.91, 0.37, 0.45, 1.15, 0.83, 0.37, 0.62, 1.81, 0.68, 0.73, 3.62, 40.05, 2.38, 0.83, 19.99, 1.85, 3.43, 0.46, 12.09, 2.05, 3.22]} \ No newline at end of file diff --git a/annotations_filtered/jj6ECLiWbxo_filtered.json b/annotations_filtered/jj6ECLiWbxo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6df9933e071c83df6b92cf51ca1e6d295db72034 --- /dev/null +++ b/annotations_filtered/jj6ECLiWbxo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.66], [8.0, 10.39], [13.0, 13.07], [15.0, 15.77], [17.0, 19.47], [22.0, 22.79], [27.0, 28.59], [31.0, 33.07], [33.0, 38.33], [41.0, 42.43], [55.0, 56.64], [59.0, 60.22], [61.0, 63.1], [63.0, 66.72], [67.0, 67.88]], "keep_status": [true, true, false, false, true, false, false, false, true, false, false, false, false, true, false], "silence_prob": [47.9, 48.19, 0.0, 0.0, 44.23, 0.0, 0.0, 51.34, 42.84, 0.0, 0.0, 0.0, 52.05, 43.1, 0.0], "audiomae_on_audioset": [[["hum", 27.28], ["music", 26.23], ["speech", 11.09]], [["music", 37.38], ["ambient music", 12.58], ["hum", 10.31]], null, null, [["music", 30.61], ["pulse", 13.23], ["hum", 11.05]], null, null, null, [["music", 27.68], ["speech", 17.64], ["didgeridoo", 10.28]], null, null, null, null, [["music", 46.3], ["speech", 11.62], ["singing bowl", 8.41]], null], "duration": [2.66, 2.39, 0.07, 0.77, 2.47, 0.79, 1.59, 2.07, 5.33, 1.43, 1.64, 1.22, 2.1, 3.72, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/jj7BRKHml8g_filtered.json b/annotations_filtered/jj7BRKHml8g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46beaa99bb65d6dbd11e4e9b5eb3c497d6c1bfa1 --- /dev/null +++ b/annotations_filtered/jj7BRKHml8g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[53.0, 53.89], [55.0, 70.26], [76.0, 84.69]], "keep_status": [false, false, false], "silence_prob": [0.0, 31.12, 30.04], "audiomae_on_audioset": [null, [["music", 68.82], ["electronic music", 6.51], ["synthesizer", 3.32]], [["music", 80.05], ["throbbing", 4.61], ["didgeridoo", 3.05]]], "duration": [0.89, 15.26, 8.69]} \ No newline at end of file diff --git a/annotations_filtered/jjDuR4d7Iik_filtered.json b/annotations_filtered/jjDuR4d7Iik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a97d5984ed55b29ee34a89ebe227dc233d071db7 --- /dev/null +++ b/annotations_filtered/jjDuR4d7Iik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.84], [26.0, 27.46], [31.0, 32.63], [56.0, 56.51], [64.0, 63.78], [69.0, 74.12], [77.0, 77.6], [81.0, 81.31], [84.0, 86.9], [92.0, 93.14], [104.0, 104.04], [109.0, 109.14], [112.0, 112.68], [116.0, 116.14], [116.0, 117.51], [118.0, 119.52], [126.0, 126.87], [144.0, 150.2], [151.0, 152.81], [155.0, 155.76], [158.0, 158.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 54.56, 0.0, 0.0, 97.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.47, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.84, 1.46, 1.63, 0.51, -0.22, 5.12, 0.6, 0.31, 2.9, 1.14, 0.04, 0.14, 0.68, 0.14, 1.51, 1.52, 0.87, 6.2, 1.81, 0.76, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/jjPq-r91oB4_filtered.json b/annotations_filtered/jjPq-r91oB4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfd79ff37842787eef01675c63aa1c8703337f7f --- /dev/null +++ b/annotations_filtered/jjPq-r91oB4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.86], [16.0, 20.39], [21.0, 23.31], [25.0, 27.7], [51.0, 51.49], [54.0, 56.29], [82.0, 83.22], [84.0, 85.67], [86.0, 87.03], [94.0, 97.11], [102.0, 103.79], [106.0, 107.94], [120.0, 119.92], [126.0, 127.62], [129.0, 130.17], [151.0, 160.27], [162.0, 169.26], [171.0, 171.76], [176.0, 176.01], [177.0, 182.63], [190.0, 192.11]], "keep_status": [true, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [30.05, 32.43, 85.9, 34.26, 0.0, 32.13, 0.0, 0.0, 0.0, 80.29, 0.0, 0.0, 0.0, 0.0, 0.0, 43.64, 40.97, 0.0, 0.0, 37.86, 38.94], "audiomae_on_audioset": [[["siren", 24.5], ["emergency vehicle", 23.1], ["police car (siren)", 19.24]], [["whack, thwack", 27.43], ["breaking", 12.65], ["speech", 8.08]], null, [["speech", 28.18], ["music", 13.29], ["hum", 6.45]], null, [["music", 50.83], ["vehicle", 6.44], ["hum", 5.47]], null, null, null, null, null, null, null, null, null, [["music", 52.27], ["theremin", 19.52], ["ambient music", 6.42]], [["music", 56.12], ["ambient music", 16.09], ["theremin", 11.56]], null, null, [["speech", 29.51], ["music", 24.56], ["didgeridoo", 10.16]], [["music", 32.45], ["hum", 13.65], ["throbbing", 7.54]]], "duration": [2.86, 4.39, 2.31, 2.7, 0.49, 2.29, 1.22, 1.67, 1.03, 3.11, 1.79, 1.94, -0.08, 1.62, 1.17, 9.27, 7.26, 0.76, 0.01, 5.63, 2.11]} \ No newline at end of file diff --git a/annotations_filtered/jjpQORCD0ZU_filtered.json b/annotations_filtered/jjpQORCD0ZU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..628739a49b26e470f896d3d010a73ebfefef2907 --- /dev/null +++ b/annotations_filtered/jjpQORCD0ZU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.39], [7.0, 6.88], [8.0, 8.48], [11.0, 11.45], [13.0, 13.17], [18.0, 18.93], [20.0, 20.98], [22.0, 21.86], [30.0, 30.81], [36.0, 36.14], [39.0, 39.04], [40.0, 40.59], [48.0, 48.0], [51.0, 51.71], [52.0, 52.79], [55.0, 55.9], [58.0, 57.86], [64.0, 64.17], [66.0, 65.82], [67.0, 67.14], [73.0, 73.26], [75.0, 76.55], [79.0, 79.95], [106.0, 107.96], [109.0, 110.25], [118.0, 118.98], [121.0, 122.52], [126.0, 126.99], [128.0, 128.85], [129.0, 130.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.39, -0.12, 0.48, 0.45, 0.17, 0.93, 0.98, -0.14, 0.81, 0.14, 0.04, 0.59, 0.0, 0.71, 0.79, 0.9, -0.14, 0.17, -0.18, 0.14, 0.26, 1.55, 0.95, 1.96, 1.25, 0.98, 1.52, 0.99, 0.85, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/jjwg2PeDUxM_filtered.json b/annotations_filtered/jjwg2PeDUxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39ad2b7c5a1c82eb4dfe3e2f3b70c9ac345fa691 --- /dev/null +++ b/annotations_filtered/jjwg2PeDUxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.5], [9.0, 10.57], [12.0, 17.37], [23.0, 31.51], [32.0, 33.45], [36.0, 36.73], [38.0, 38.69], [40.0, 42.58], [43.0, 53.32], [54.0, 54.43], [55.0, 55.34], [57.0, 58.19], [62.0, 66.04], [70.0, 70.04], [71.0, 72.03], [74.0, 74.14], [75.0, 75.66], [78.0, 77.68], [78.0, 82.92], [94.0, 102.93], [103.0, 103.82], [104.0, 109.85], [115.0, 127.3], [128.0, 138.25], [141.0, 140.63], [141.0, 142.37], [143.0, 143.29], [145.0, 145.67], [147.0, 149.49], [153.0, 153.94], [154.0, 154.53], [155.0, 173.16], [173.0, 174.07], [175.0, 183.61]], "keep_status": [true, false, true, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [33.15, 0.0, 33.54, 30.06, 0.0, 0.0, 0.0, 31.22, 29.34, 0.0, 0.0, 0.0, 28.91, 0.0, 0.0, 0.0, 0.0, 0.0, 28.59, 29.32, 0.0, 28.85, 30.99, 28.76, 0.0, 0.0, 0.0, 0.0, 29.05, 0.0, 0.0, 28.93, 0.0, 29.51], "audiomae_on_audioset": [[["didgeridoo", 38.71], ["mains hum", 14.13], ["hum", 12.75]], null, [["music", 20.2], ["throbbing", 15.75], ["speech", 15.18]], [["speech", 23.88], ["hum", 12.54], ["music", 11.59]], null, null, null, [["oink", 12.49], ["beatboxing", 10.08], ["pig", 8.59]], [["speech", 61.24], ["music", 10.87], ["hum", 3.56]], null, null, null, [["music", 48.92], ["speech", 20.21], ["didgeridoo", 14.43]], null, null, null, null, null, [["speech", 40.53], ["buzz", 27.1], ["electric shaver, electric razor", 4.11]], [["music", 53.44], ["throbbing", 6.63], ["electronic music", 4.22]], null, [["speech", 59.31], ["music", 9.22], ["whack, thwack", 6.53]], [["didgeridoo", 22.67], ["music", 22.42], ["hum", 20.31]], [["music", 34.56], ["throbbing", 15.91], ["hum", 9.36]], null, null, null, null, [["music", 62.45], ["speech", 10.79], ["electronic music", 2.45]], null, null, [["music", 49.41], ["speech", 7.41], ["livestock, farm animals, working animals", 7.12]], null, [["grunt", 67.45], ["speech", 5.01], ["groan", 4.99]]], "duration": [4.5, 1.57, 5.37, 8.51, 1.45, 0.73, 0.69, 2.58, 10.32, 0.43, 0.34, 1.19, 4.04, 0.04, 1.03, 0.14, 0.66, -0.32, 4.92, 8.93, 0.82, 5.85, 12.3, 10.25, -0.37, 1.37, 0.29, 0.67, 2.49, 0.94, 0.53, 18.16, 1.07, 8.61]} \ No newline at end of file diff --git a/annotations_filtered/jk2mjuWhQ_0_filtered.json b/annotations_filtered/jk2mjuWhQ_0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8e6ec14b217b264ce0a9d9acdf7128bbea4fefe --- /dev/null +++ b/annotations_filtered/jk2mjuWhQ_0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.08], [7.0, 15.13], [16.0, 16.9], [19.0, 21.61], [22.0, 31.26], [37.0, 60.61], [61.0, 62.28], [63.0, 72.23], [73.0, 73.67], [75.0, 84.0], [86.0, 88.72], [89.0, 91.34], [93.0, 93.92], [95.0, 113.88], [115.0, 121.02], [124.0, 131.77]], "keep_status": [true, false, false, false, true, false, false, false, false, false, true, false, false, false, true, true], "silence_prob": [37.37, 36.14, 0.0, 43.93, 35.27, 32.71, 0.0, 36.1, 0.0, 35.54, 33.42, 32.56, 0.0, 33.36, 35.42, 38.86], "audiomae_on_audioset": [[["music", 19.21], ["throbbing", 15.1], ["hum", 13.81]], [["hum", 50.91], ["music", 18.94], ["throbbing", 10.16]], null, [["music", 42.79], ["throbbing", 17.85], ["hum", 14.72]], [["hum", 22.08], ["mains hum", 18.18], ["music", 11.14]], [["music", 79.19], ["hum", 4.37], ["throbbing", 3.76]], null, [["hum", 54.28], ["mains hum", 17.5], ["speech", 8.13]], null, [["music", 36.98], ["speech", 18.74], ["hum", 17.92]], [["mains hum", 28.98], ["hum", 21.65], ["speech", 15.14]], [["music", 64.13], ["speech", 9.54], ["throbbing", 2.23]], null, [["music", 63.93], ["hum", 5.11], ["coin (dropping)", 4.59]], [["hum", 21.84], ["music", 15.86], ["mains hum", 14.43]], [["hum", 29.94], ["music", 27.26], ["mains hum", 12.57]]], "duration": [2.08, 8.13, 0.9, 2.61, 9.26, 23.61, 1.28, 9.23, 0.67, 9.0, 2.72, 2.34, 0.92, 18.88, 6.02, 7.77]} \ No newline at end of file diff --git a/annotations_filtered/jk3Z-MVoUg4_filtered.json b/annotations_filtered/jk3Z-MVoUg4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e04434ae451e069906792fd16cf9f2e6f87fec12 --- /dev/null +++ b/annotations_filtered/jk3Z-MVoUg4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 26.15], [26.0, 65.84], [67.0, 101.95], [104.0, 104.16], [104.0, 106.69]], "keep_status": [true, false, false, false, true], "silence_prob": [31.42, 0.0, 0.0, 0.0, 31.44], "audiomae_on_audioset": [[["music", 27.41], ["hum", 14.31], ["mains hum", 9.39]], null, null, null, [["music", 47.36], ["fly, housefly", 5.72], ["mosquito", 3.74]]], "duration": [4.15, 39.84, 34.95, 0.16, 2.69]} \ No newline at end of file diff --git a/annotations_filtered/jkHrHAKwPZk_filtered.json b/annotations_filtered/jkHrHAKwPZk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c40e064c0a746c8f13c2ee2a257785a0bcc5d52 --- /dev/null +++ b/annotations_filtered/jkHrHAKwPZk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.67], [8.0, 8.75], [11.0, 11.4], [13.0, 14.12], [17.0, 17.79], [19.0, 20.41]], "keep_status": [true, false, false, false, false, false], "silence_prob": [29.95, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["throbbing", 35.26], ["hum", 23.34], ["speech", 10.14]], null, null, null, null, null], "duration": [3.67, 0.75, 0.4, 1.12, 0.79, 1.41]} \ No newline at end of file diff --git a/annotations_filtered/jki2_TXdG_Q_filtered.json b/annotations_filtered/jki2_TXdG_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9725e255ae5900ee00c54cca6b6c5c0c3832075 --- /dev/null +++ b/annotations_filtered/jki2_TXdG_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.08], [3.0, 4.26], [9.0, 9.39], [12.0, 13.71], [18.0, 22.1], [32.0, 34.28], [38.0, 38.4], [41.0, 44.32], [44.0, 44.36], [86.0, 86.29], [91.0, 112.55], [114.0, 114.4], [117.0, 122.71], [125.0, 127.75], [128.0, 128.76], [130.0, 131.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.99, 39.89, 0.0, 35.22, 0.0, 0.0, 31.4, 0.0, 98.27, 99.68, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["humming", 86.94], ["vocal music", 3.72], ["music", 2.59]], null, [["music", 64.63], ["guitar", 5.56], ["plucked string instrument", 2.85]], null, null, [["music", 62.3], ["carnatic music", 15.54], ["middle eastern music", 3.67]], null, null, null, null, null], "duration": [0.08, 1.26, 0.39, 1.71, 4.1, 2.28, 0.4, 3.32, 0.36, 0.29, 21.55, 0.4, 5.71, 2.75, 0.76, 1.48]} \ No newline at end of file diff --git a/annotations_filtered/jkmyjHYMH0Q_filtered.json b/annotations_filtered/jkmyjHYMH0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29984b95c4b20cc53ad42dff92d8feb69f7b05c7 --- /dev/null +++ b/annotations_filtered/jkmyjHYMH0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[120.0, 121.68], [123.0, 127.92], [147.0, 147.92], [158.0, 158.65], [169.0, 170.28], [171.0, 173.89]], "keep_status": [false, true, false, false, false, true], "silence_prob": [0.0, 30.88, 0.0, 0.0, 0.0, 40.14], "audiomae_on_audioset": [null, [["music", 45.89], ["synthesizer", 13.2], ["speech", 8.65]], null, null, null, [["music", 32.52], ["sonar", 14.73], ["synthesizer", 13.09]]], "duration": [1.68, 4.92, 0.92, 0.65, 1.28, 2.89]} \ No newline at end of file diff --git a/annotations_filtered/jlCEAJXSwJc_filtered.json b/annotations_filtered/jlCEAJXSwJc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef749447f645e36e855442aafdac83bc9e61fece --- /dev/null +++ b/annotations_filtered/jlCEAJXSwJc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[134.0, 133.95]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [-0.05]} \ No newline at end of file diff --git a/annotations_filtered/jlFLcKaBLz0_filtered.json b/annotations_filtered/jlFLcKaBLz0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cfd394db124a036b580fc74903cc90a4a85e7cb3 --- /dev/null +++ b/annotations_filtered/jlFLcKaBLz0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.08], [7.0, 7.82], [10.0, 15.26], [17.0, 20.04], [20.0, 21.9], [28.0, 27.9], [29.0, 28.78], [29.0, 31.77], [33.0, 33.25], [36.0, 40.02], [40.0, 42.53], [43.0, 49.96], [51.0, 52.69], [54.0, 55.32], [56.0, 57.3], [60.0, 60.0], [63.0, 63.27], [66.0, 67.58], [70.0, 70.38], [72.0, 72.42], [83.0, 84.7], [88.0, 91.81], [93.0, 100.38], [112.0, 113.98], [116.0, 120.6], [121.0, 121.78], [122.0, 122.99], [124.0, 125.59]], "keep_status": [true, false, true, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [37.02, 0.0, 36.31, 78.38, 0.0, 0.0, 0.0, 57.56, 0.0, 52.1, 35.73, 39.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.11, 41.54, 0.0, 36.81, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["sine wave", 31.88], ["chirp tone", 19.39], ["singing bowl", 11.5]], null, [["dog", 28.38], ["bow-wow", 12.11], ["animal", 10.73]], null, null, null, null, null, null, null, [["radio", 21.42], ["speech", 20.08], ["sidetone", 14.65]], [["animal", 18.84], ["hum", 15.27], ["mains hum", 8.65]], null, null, null, null, null, null, null, null, null, [["hiccup", 72.64], ["fly, housefly", 7.63], ["insect", 3.79]], [["hum", 18.04], ["bow-wow", 11.67], ["noise", 9.58]], null, [["fly, housefly", 43.59], ["insect", 23.4], ["mosquito", 5.47]], null, null, null], "duration": [2.08, 0.82, 5.26, 3.04, 1.9, -0.1, -0.22, 2.77, 0.25, 4.02, 2.53, 6.96, 1.69, 1.32, 1.3, 0.0, 0.27, 1.58, 0.38, 0.42, 1.7, 3.81, 7.38, 1.98, 4.6, 0.78, 0.99, 1.59]} \ No newline at end of file diff --git a/annotations_filtered/jlYY8xkTXOQ_filtered.json b/annotations_filtered/jlYY8xkTXOQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5970e6d5efc5417c70719ece489842f2161d7031 --- /dev/null +++ b/annotations_filtered/jlYY8xkTXOQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.29], [7.0, 8.53], [10.0, 9.96], [14.0, 14.18], [15.0, 15.7], [16.0, 16.77], [19.0, 19.3], [20.0, 20.44], [22.0, 21.95], [22.0, 23.16], [23.0, 23.46], [24.0, 24.26], [28.0, 27.85], [30.0, 30.54], [32.0, 32.36], [34.0, 34.28], [36.0, 36.51], [38.0, 38.38], [39.0, 40.46], [42.0, 41.88], [43.0, 44.76], [48.0, 48.42], [51.0, 51.63], [54.0, 54.04], [58.0, 58.13], [60.0, 60.32], [65.0, 65.48], [67.0, 70.56], [71.0, 71.74], [72.0, 72.47], [74.0, 74.07], [75.0, 78.07], [80.0, 81.57], [83.0, 84.48], [85.0, 85.67], [86.0, 86.81], [87.0, 88.74], [89.0, 89.95], [91.0, 92.5], [93.0, 95.49], [97.0, 97.73], [98.0, 99.3], [101.0, 101.26], [105.0, 106.62], [107.0, 121.05], [126.0, 127.36], [129.0, 129.34], [131.0, 131.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.56, 0.0, 0.0, 0.0, 96.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.09, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.29, 1.53, -0.04, 0.18, 0.7, 0.77, 0.3, 0.44, -0.05, 1.16, 0.46, 0.26, -0.15, 0.54, 0.36, 0.28, 0.51, 0.38, 1.46, -0.12, 1.76, 0.42, 0.63, 0.04, 0.13, 0.32, 0.48, 3.56, 0.74, 0.47, 0.07, 3.07, 1.57, 1.48, 0.67, 0.81, 1.74, 0.95, 1.5, 2.49, 0.73, 1.3, 0.26, 1.62, 14.05, 1.36, 0.34, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/jlcZPO2FhGE_filtered.json b/annotations_filtered/jlcZPO2FhGE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12949b5a1c72a506e8155ad8dc60ce8c67552834 --- /dev/null +++ b/annotations_filtered/jlcZPO2FhGE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.01], [4.0, 9.76], [10.0, 24.92], [27.0, 26.96], [27.0, 28.21], [30.0, 34.16], [35.0, 39.85], [41.0, 41.62], [45.0, 46.58], [47.0, 48.39], [55.0, 56.08], [57.0, 58.06], [59.0, 59.7], [61.0, 62.92], [64.0, 64.15], [68.0, 68.03], [70.0, 71.52], [72.0, 72.28], [76.0, 84.62], [85.0, 86.88], [88.0, 93.36], [94.0, 95.1], [99.0, 102.79], [106.0, 105.98], [106.0, 107.1], [112.0, 112.95], [114.0, 114.64], [115.0, 116.58], [117.0, 118.07], [119.0, 120.06], [121.0, 121.22], [122.0, 122.98]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [88.46, 54.7, 46.4, 0.0, 0.0, 34.76, 40.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.83, 0.0, 38.97, 0.0, 44.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 33.08], ["speech", 17.2], ["ping", 8.39]], null, null, [["music", 56.05], ["didgeridoo", 21.42], ["speech", 3.91]], [["music", 48.24], ["didgeridoo", 9.73], ["hum", 8.04]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 30.36], ["music", 29.5], ["musical instrument", 4.38]], null, [["music", 60.15], ["didgeridoo", 16.78], ["musical instrument", 8.86]], null, [["music", 21.39], ["throbbing", 9.43], ["hum", 9.08]], null, null, null, null, null, null, null, null, null], "duration": [2.01, 5.76, 14.92, -0.04, 1.21, 4.16, 4.85, 0.62, 1.58, 1.39, 1.08, 1.06, 0.7, 1.92, 0.15, 0.03, 1.52, 0.28, 8.62, 1.88, 5.36, 1.1, 3.79, -0.02, 1.1, 0.95, 0.64, 1.58, 1.07, 1.06, 0.22, 0.98]} \ No newline at end of file diff --git a/annotations_filtered/jm73CCe1e4o_filtered.json b/annotations_filtered/jm73CCe1e4o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..341a2dca29394b2972b157ac453a1fbc502993b9 --- /dev/null +++ b/annotations_filtered/jm73CCe1e4o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.51], [27.0, 28.95], [50.0, 50.41], [57.0, 58.77], [63.0, 63.69], [100.0, 102.96], [105.0, 105.48], [107.0, 110.61], [114.0, 120.7]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 54.43, 97.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.51, 1.95, 0.41, 1.77, 0.69, 2.96, 0.48, 3.61, 6.7]} \ No newline at end of file diff --git a/annotations_filtered/jmC2y7EsXqk_filtered.json b/annotations_filtered/jmC2y7EsXqk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17e9fea5205700744703478d66e77e2c18a3b823 --- /dev/null +++ b/annotations_filtered/jmC2y7EsXqk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 12.45], [13.0, 12.53], [14.0, 32.05], [32.0, 35.68], [40.0, 42.58], [45.0, 46.01], [49.0, 49.35], [50.0, 63.09], [63.0, 63.15]], "keep_status": [false, false, false, true, false, false, false, false, false], "silence_prob": [31.8, 0.0, 32.68, 37.22, 75.55, 0.0, 0.0, 58.3, 0.0], "audiomae_on_audioset": [[["music", 65.51], ["synthesizer", 3.9], ["sampler", 3.46]], null, [["music", 55.52], ["speech", 12.68], ["sidetone", 6.55]], [["music", 23.76], ["thunk", 21.46], ["whack, thwack", 10.09]], null, null, null, null, null], "duration": [5.45, -0.47, 18.05, 3.68, 2.58, 1.01, 0.35, 13.09, 0.15]} \ No newline at end of file diff --git a/annotations_filtered/jmFpZsBB53s_filtered.json b/annotations_filtered/jmFpZsBB53s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16645defc3c5906fa642e64bd03b2a38af56b69a --- /dev/null +++ b/annotations_filtered/jmFpZsBB53s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 33.42], [36.0, 37.17], [37.0, 38.37], [40.0, 40.41], [41.0, 43.53], [44.0, 44.37], [45.0, 46.72], [54.0, 59.17], [63.0, 63.66], [67.0, 69.3], [80.0, 83.98], [85.0, 85.97], [95.0, 101.56], [104.0, 104.55], [106.0, 105.95], [110.0, 110.47], [116.0, 117.54]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [99.95, 0.0, 0.0, 0.0, 60.05, 0.0, 0.0, 36.72, 0.0, 36.53, 46.29, 0.0, 97.33, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["groan", 77.97], ["speech", 7.46], ["whack, thwack", 5.36]], null, [["music", 16.45], ["speech", 7.53], ["animal", 2.52]], [["boing", 27.81], ["thunk", 18.54], ["music", 8.17]], null, null, null, null, null, null], "duration": [2.42, 1.17, 1.37, 0.41, 2.53, 0.37, 1.72, 5.17, 0.66, 2.3, 3.98, 0.97, 6.56, 0.55, -0.05, 0.47, 1.54]} \ No newline at end of file diff --git a/annotations_filtered/jmOvg7JKjVI_filtered.json b/annotations_filtered/jmOvg7JKjVI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b643857e403017a36dee116a1f0d289b17392db8 --- /dev/null +++ b/annotations_filtered/jmOvg7JKjVI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.67], [5.0, 5.95], [9.0, 11.15], [12.0, 14.34], [15.0, 17.78], [20.0, 20.6], [23.0, 25.12], [26.0, 28.9], [37.0, 37.91], [42.0, 43.71], [47.0, 47.88], [51.0, 52.12], [57.0, 57.15], [63.0, 63.76], [80.0, 79.83], [89.0, 89.5], [98.0, 98.83], [103.0, 106.24], [110.0, 114.94], [117.0, 118.23], [120.0, 121.47]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 86.82, 91.81, 97.33, 0.0, 39.58, 40.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.51, 89.9, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["sidetone", 17.3], ["speech", 16.73], ["busy signal", 7.35]], [["speech", 43.55], ["sidetone", 27.7], ["hum", 4.83]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.33, 0.95, 2.15, 2.34, 2.78, 0.6, 2.12, 2.9, 0.91, 1.71, 0.88, 1.12, 0.15, 0.76, -0.17, 0.5, 0.83, 3.24, 4.94, 1.23, 1.47]} \ No newline at end of file diff --git a/annotations_filtered/jmgV3OFn0aE_filtered.json b/annotations_filtered/jmgV3OFn0aE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c17d023ac3e09395da16caa7f3c4181b52c4d62 --- /dev/null +++ b/annotations_filtered/jmgV3OFn0aE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 24.17], [25.0, 29.81], [30.0, 33.0], [33.0, 44.1], [52.0, 51.78], [52.0, 53.74], [54.0, 55.41], [57.0, 57.4], [58.0, 59.54], [61.0, 62.88], [65.0, 66.36], [67.0, 68.3], [71.0, 71.83], [74.0, 75.46], [76.0, 78.6], [79.0, 80.77], [81.0, 81.57], [82.0, 86.73], [88.0, 90.46], [91.0, 92.53], [94.0, 94.8], [96.0, 96.75], [97.0, 97.5], [99.0, 98.83], [99.0, 99.81], [102.0, 103.05], [104.0, 106.27], [107.0, 110.27], [110.0, 112.92], [114.0, 118.86], [120.0, 120.11], [121.0, 121.85], [123.0, 123.85], [131.0, 133.76], [135.0, 137.32], [138.0, 138.81], [141.0, 142.26], [144.0, 145.12], [147.0, 148.05]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.0, 56.48, 46.79, 62.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.35, 0.0, 0.0, 40.52, 99.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.22, 65.2, 52.22, 85.72, 0.0, 0.0, 0.0, 99.78, 35.21, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 78.22], ["dog", 2.57], ["animal", 2.21]], null, [["speech", 56.86], ["baby laughter", 6.2], ["hum", 3.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 55.59], ["dial tone", 8.1], ["busy signal", 5.72]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 50.77], ["speech", 40.32], ["sine wave", 1.91]], null, null, null, null], "duration": [3.17, 4.81, 3.0, 11.1, -0.22, 1.74, 1.41, 0.4, 1.54, 1.88, 1.36, 1.3, 0.83, 1.46, 2.6, 1.77, 0.57, 4.73, 2.46, 1.53, 0.8, 0.75, 0.5, -0.17, 0.81, 1.05, 2.27, 3.27, 2.92, 4.86, 0.11, 0.85, 0.85, 2.76, 2.32, 0.81, 1.26, 1.12, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/jmjcKSMwC1Y_filtered.json b/annotations_filtered/jmjcKSMwC1Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da1bd95360aa69a70c4f06428623a75dec34958d --- /dev/null +++ b/annotations_filtered/jmjcKSMwC1Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.38], [4.0, 5.05], [7.0, 7.15], [13.0, 15.5], [17.0, 19.87], [20.0, 20.44], [20.0, 20.49], [21.0, 22.25], [24.0, 30.45], [33.0, 33.29], [34.0, 36.0], [37.0, 38.58], [41.0, 42.84], [44.0, 46.92], [48.0, 48.88], [50.0, 52.24], [54.0, 55.02], [58.0, 58.43], [59.0, 61.33], [63.0, 66.29], [69.0, 70.51], [72.0, 76.03], [78.0, 78.44], [80.0, 81.38], [86.0, 88.3], [90.0, 98.05], [99.0, 102.71], [104.0, 112.75], [120.0, 120.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 99.99, 0.0, 0.0, 0.0, 99.98, 0.0, 99.91, 0.0, 0.0, 99.92, 0.0, 99.98, 0.0, 0.0, 99.78, 99.76, 0.0, 99.82, 0.0, 0.0, 99.96, 98.01, 94.95, 71.29, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.38, 1.05, 0.15, 2.5, 2.87, 0.44, 0.49, 1.25, 6.45, 0.29, 2.0, 1.58, 1.84, 2.92, 0.88, 2.24, 1.02, 0.43, 2.33, 3.29, 1.51, 4.03, 0.44, 1.38, 2.3, 8.05, 3.71, 8.75, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/jmmawolzwCs_filtered.json b/annotations_filtered/jmmawolzwCs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7da9e3285259efa3857c0f44e786d3381500a36c --- /dev/null +++ b/annotations_filtered/jmmawolzwCs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.7], [5.0, 8.16], [9.0, 23.06], [24.0, 27.3], [28.0, 29.05], [31.0, 35.28], [36.0, 49.37], [52.0, 52.3], [54.0, 60.08], [61.0, 63.36], [64.0, 65.84], [67.0, 88.08], [89.0, 101.68], [103.0, 120.41], [121.0, 127.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.65, 95.23, 99.97, 0.0, 100.0, 99.82, 0.0, 100.0, 100.0, 0.0, 100.0, 99.62, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.7, 3.16, 14.06, 3.3, 1.05, 4.28, 13.37, 0.3, 6.08, 2.36, 1.84, 21.08, 12.68, 17.41, 6.14]} \ No newline at end of file diff --git a/annotations_filtered/jmpuAz59EbQ_filtered.json b/annotations_filtered/jmpuAz59EbQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87c2560aef9493f5aa34b52b4e4a7b416cec2e8f --- /dev/null +++ b/annotations_filtered/jmpuAz59EbQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.91], [13.0, 13.39], [16.0, 16.7], [18.0, 20.22], [31.0, 32.68], [45.0, 47.39], [49.0, 50.38], [54.0, 54.63], [61.0, 61.62], [63.0, 63.91], [65.0, 65.1], [68.0, 69.67], [72.0, 72.62], [73.0, 73.8], [74.0, 74.51], [76.0, 79.24], [86.0, 87.3], [89.0, 91.77], [93.0, 93.6], [96.0, 106.0]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 96.66, 0.0, 44.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.14, 0.0, 35.26, 0.0, 41.93], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 19.57], ["music", 9.37], ["dog", 3.47]], null, null, null, null, null, null, null, null, null, [["animal", 16.79], ["livestock, farm animals, working animals", 16.13], ["howl", 8.16]], null, [["drum machine", 24.37], ["music", 8.05], ["synthesizer", 5.46]], null, [["speech", 51.9], ["fart", 11.17], ["sidetone", 3.81]]], "duration": [0.91, 0.39, 0.7, 2.22, 1.68, 2.39, 1.38, 0.63, 0.62, 0.91, 0.1, 1.67, 0.62, 0.8, 0.51, 3.24, 1.3, 2.77, 0.6, 10.0]} \ No newline at end of file diff --git a/annotations_filtered/jmuC1ebmYQg_filtered.json b/annotations_filtered/jmuC1ebmYQg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cf304acbb46e3aa9414929e87a0a76d7bf789d8 --- /dev/null +++ b/annotations_filtered/jmuC1ebmYQg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.35], [5.0, 13.14], [15.0, 15.82], [18.0, 22.3], [39.0, 39.58], [43.0, 43.58], [45.0, 46.31], [47.0, 47.24], [54.0, 54.46], [55.0, 56.81], [59.0, 59.58], [60.0, 61.4], [62.0, 62.94], [67.0, 69.94], [72.0, 73.47], [74.0, 79.64], [85.0, 86.7], [90.0, 90.15], [93.0, 93.83], [94.0, 94.07], [95.0, 96.01], [97.0, 97.53], [98.0, 110.42], [111.0, 112.97], [116.0, 117.37], [119.0, 119.38], [124.0, 127.57], [128.0, 130.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 74.29, 0.0, 79.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.16, 0.0, 34.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.67, 0.0, 0.0, 0.0, 77.53, 62.47], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.58], ["speech", 14.92], ["scratching (performance technique)", 2.69]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.35, 8.14, 0.82, 4.3, 0.58, 0.58, 1.31, 0.24, 0.46, 1.81, 0.58, 1.4, 0.94, 2.94, 1.47, 5.64, 1.7, 0.15, 0.83, 0.07, 1.01, 0.53, 12.42, 1.97, 1.37, 0.38, 3.57, 2.89]} \ No newline at end of file diff --git a/annotations_filtered/jn2weAEOp4Q_filtered.json b/annotations_filtered/jn2weAEOp4Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2da178375405fa97058280a6ab0b332c76be6ae4 --- /dev/null +++ b/annotations_filtered/jn2weAEOp4Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 50.31], [50.0, 50.99], [54.0, 56.12], [57.0, 65.18], [66.0, 68.88]], "keep_status": [false, false, true, true, true], "silence_prob": [31.01, 0.0, 30.34, 29.77, 31.36], "audiomae_on_audioset": [[["music", 46.4], ["speech", 29.95], ["throbbing", 3.54]], null, [["explosion", 13.6], ["eruption", 9.21], ["noise", 8.99]], [["music", 31.76], ["speech", 23.93], ["hum", 8.41]], [["music", 33.82], ["speech", 23.98], ["fly, housefly", 5.28]]], "duration": [5.31, 0.99, 2.12, 8.18, 2.88]} \ No newline at end of file diff --git a/annotations_filtered/jn4Vhkmb4Lw_filtered.json b/annotations_filtered/jn4Vhkmb4Lw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e5d81dfc2564fd5d78bdaf7eebae46d86351bed2 --- /dev/null +++ b/annotations_filtered/jn4Vhkmb4Lw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 23.92], [24.0, 27.94], [39.0, 47.16], [49.0, 51.24], [54.0, 55.48], [57.0, 57.94], [59.0, 66.01], [69.0, 107.59]], "keep_status": [false, false, true, true, false, false, false, false], "silence_prob": [42.37, 34.88, 38.7, 34.06, 0.0, 0.0, 34.85, 0.0], "audiomae_on_audioset": [[["music", 62.98], ["musical instrument", 6.84], ["guitar", 6.81]], [["fly, housefly", 40.81], ["insect", 35.53], ["music", 6.62]], [["speech", 34.78], ["music", 16.91], ["mains hum", 10.1]], [["hum", 39.24], ["music", 11.27], ["throbbing", 10.56]], null, null, [["music", 49.51], ["hum", 14.06], ["throbbing", 11.01]], null], "duration": [15.92, 3.94, 8.16, 2.24, 1.48, 0.94, 7.01, 38.59]} \ No newline at end of file diff --git a/annotations_filtered/jn8SVc374U0_filtered.json b/annotations_filtered/jn8SVc374U0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bee3bcaedf5bac2c4fde53965b17d4fa89a03cb2 --- /dev/null +++ b/annotations_filtered/jn8SVc374U0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[62.0, 62.99], [63.0, 63.1], [64.0, 87.94]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 35.82], "audiomae_on_audioset": [null, null, [["music", 30.38], ["hum", 24.08], ["mains hum", 22.24]]], "duration": [0.99, 0.1, 23.94]} \ No newline at end of file diff --git a/annotations_filtered/jnA7jmNVYFs_filtered.json b/annotations_filtered/jnA7jmNVYFs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b54a78969da0033c9d417b9e5f13c6dd70b9ffb8 --- /dev/null +++ b/annotations_filtered/jnA7jmNVYFs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.04], [0.0, 0.14], [3.0, 2.73], [4.0, 4.14], [8.0, 12.46], [13.0, 13.29], [14.0, 14.17], [16.0, 17.2], [21.0, 21.63], [23.0, 24.34], [26.0, 25.78], [26.0, 25.95], [54.0, 55.36], [56.0, 55.97], [60.0, 61.47], [66.0, 66.41], [73.0, 74.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.04, 0.14, -0.27, 0.14, 4.46, 0.29, 0.17, 1.2, 0.63, 1.34, -0.22, -0.05, 1.36, -0.03, 1.47, 0.41, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/jn_D02Tvr4k_filtered.json b/annotations_filtered/jn_D02Tvr4k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb7e6ce3625fa7e0c6a0d1389dac7fcc92a5fa93 --- /dev/null +++ b/annotations_filtered/jn_D02Tvr4k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.33], [5.0, 5.93], [7.0, 7.21], [10.0, 12.7], [14.0, 15.67], [17.0, 17.95], [19.0, 19.33], [21.0, 22.2], [25.0, 26.3], [27.0, 29.42], [31.0, 31.99], [34.0, 34.65], [37.0, 37.47], [39.0, 39.43], [40.0, 42.15], [44.0, 46.63], [48.0, 47.9], [51.0, 51.83], [57.0, 59.37], [63.0, 66.26], [68.0, 70.39], [75.0, 79.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.97, 99.62, 0.0, 0.0, 76.86, 58.38, 100.0, 91.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.33, 0.93, 0.21, 2.7, 1.67, 0.95, 0.33, 1.2, 1.3, 2.42, 0.99, 0.65, 0.47, 0.43, 2.15, 2.63, -0.1, 0.83, 2.37, 3.26, 2.39, 4.91]} \ No newline at end of file diff --git a/annotations_filtered/jniUBhuJSuw_filtered.json b/annotations_filtered/jniUBhuJSuw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..058e1fec6ce0cc6ffd01367eb1a56a07089951b5 --- /dev/null +++ b/annotations_filtered/jniUBhuJSuw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 22.71], [24.0, 29.71], [31.0, 32.04], [33.0, 41.57], [42.0, 48.07], [49.0, 75.39], [78.0, 92.6], [94.0, 122.96], [123.0, 123.94], [126.0, 127.63]], "keep_status": [false, false, false, false, false, false, true, false, false, false], "silence_prob": [54.36, 37.12, 0.0, 31.4, 32.57, 31.18, 31.72, 35.62, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 51.11], ["synthesizer", 14.15], ["effects unit", 9.66]], null, [["music", 61.98], ["theremin", 5.01], ["musical instrument", 4.84]], [["music", 46.87], ["theremin", 24.24], ["didgeridoo", 8.49]], [["music", 60.37], ["theremin", 16.01], ["didgeridoo", 7.32]], [["music", 54.9], ["musical instrument", 8.09], ["brass instrument", 4.02]], [["music", 73.69], ["theremin", 17.73], ["musical instrument", 1.94]], null, null], "duration": [21.71, 5.71, 1.04, 8.57, 6.07, 26.39, 14.6, 28.96, 0.94, 1.63]} \ No newline at end of file diff --git a/annotations_filtered/jnoCeqeNM3g_filtered.json b/annotations_filtered/jnoCeqeNM3g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8985f6d33c02f9c427f99eda4ee44f5fddcbbe2d --- /dev/null +++ b/annotations_filtered/jnoCeqeNM3g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.45], [3.0, 3.54], [8.0, 8.58], [9.0, 9.58], [11.0, 11.21], [37.0, 38.58], [40.0, 41.25], [42.0, 45.32], [48.0, 48.61], [52.0, 52.32], [60.0, 60.98], [99.0, 99.05], [101.0, 101.85], [103.0, 103.94], [112.0, 112.04], [114.0, 115.11], [127.0, 127.35], [132.0, 134.33], [138.0, 137.86], [139.0, 139.77], [140.0, 140.48], [141.0, 141.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.09, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 44.02], ["hum", 13.93], ["mains hum", 6.14]], null, null, null, null], "duration": [0.45, 0.54, 0.58, 0.58, 0.21, 1.58, 1.25, 3.32, 0.61, 0.32, 0.98, 0.05, 0.85, 0.94, 0.04, 1.11, 0.35, 2.33, -0.14, 0.77, 0.48, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/jo-aQkgNMKQ_filtered.json b/annotations_filtered/jo-aQkgNMKQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..921b78ec8a45848bbf824e58168b0ac389bca388 --- /dev/null +++ b/annotations_filtered/jo-aQkgNMKQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.62], [10.0, 10.98], [11.0, 14.69], [19.0, 38.55], [40.0, 39.99], [41.0, 41.76], [42.0, 44.59], [47.0, 47.93], [50.0, 51.61], [55.0, 56.54], [58.0, 58.56], [62.0, 62.94], [66.0, 66.83], [67.0, 67.59], [69.0, 69.85], [70.0, 70.55], [80.0, 80.06], [82.0, 83.05], [88.0, 89.72], [92.0, 92.42], [95.0, 95.96], [97.0, 98.9], [106.0, 106.54], [111.0, 111.5], [115.0, 117.96], [119.0, 122.0], [124.0, 125.0], [126.0, 126.84], [130.0, 131.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 57.97, 54.7, 0.0, 0.0, 95.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.86, 74.92, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 0.98, 3.69, 19.55, -0.01, 0.76, 2.59, 0.93, 1.61, 1.54, 0.56, 0.94, 0.83, 0.59, 0.85, 0.55, 0.06, 1.05, 1.72, 0.42, 0.96, 1.9, 0.54, 0.5, 2.96, 3.0, 1.0, 0.84, 1.53]} \ No newline at end of file diff --git a/annotations_filtered/joAodEzeK34_filtered.json b/annotations_filtered/joAodEzeK34_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53c646158ec96bb59b9f3e70131b73cdc9839ea9 --- /dev/null +++ b/annotations_filtered/joAodEzeK34_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 31.8], [34.0, 37.37], [40.0, 52.68], [55.0, 59.91], [64.0, 68.42], [69.0, 75.96], [78.0, 87.29], [88.0, 88.7], [90.0, 94.39], [96.0, 96.69]], "keep_status": [false, true, false, false, true, true, true, false, true, false], "silence_prob": [31.16, 32.34, 31.28, 31.98, 31.08, 30.67, 31.23, 0.0, 32.12, 0.0], "audiomae_on_audioset": [[["speech", 55.29], ["music", 13.02], ["mains hum", 6.45]], [["speech", 43.58], ["music", 23.31], ["musical instrument", 2.03]], [["hum", 31.76], ["throbbing", 22.29], ["music", 18.65]], [["music", 69.68], ["throbbing", 5.45], ["hum", 2.62]], [["music", 38.27], ["hum", 8.08], ["mains hum", 5.48]], [["theremin", 26.88], ["music", 25.26], ["synthesizer", 9.23]], [["speech", 23.83], ["music", 21.41], ["cacophony", 4.6]], null, [["throbbing", 24.88], ["hum", 20.9], ["music", 9.41]], null], "duration": [12.8, 3.37, 12.68, 4.91, 4.42, 6.96, 9.29, 0.7, 4.39, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/jocnzvDLA60_filtered.json b/annotations_filtered/jocnzvDLA60_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8515df0ea53a06e86d0665ed0cd9a152ee75744 --- /dev/null +++ b/annotations_filtered/jocnzvDLA60_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.28]], "keep_status": [true], "silence_prob": [47.39], "audiomae_on_audioset": [[["hum", 27.87], ["mains hum", 12.3], ["music", 12.09]]], "duration": [2.28]} \ No newline at end of file diff --git a/annotations_filtered/jojFdN-oysU_filtered.json b/annotations_filtered/jojFdN-oysU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e53897332db113ec72177cd6566f319f07b6dfc --- /dev/null +++ b/annotations_filtered/jojFdN-oysU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 41.72], [42.0, 45.87], [52.0, 52.29], [53.0, 98.24], [103.0, 103.82], [105.0, 116.06], [128.0, 130.79]], "keep_status": [false, false, false, false, false, true, true], "silence_prob": [29.71, 32.03, 0.0, 0.0, 0.0, 29.18, 30.45], "audiomae_on_audioset": [[["music", 71.34], ["throbbing", 10.16], ["electronic music", 3.54]], [["livestock, farm animals, working animals", 43.81], ["cattle, bovinae", 35.45], ["moo", 18.13]], null, null, null, [["music", 45.25], ["didgeridoo", 9.0], ["speech", 3.69]], [["music", 31.74], ["theremin", 24.36], ["mains hum", 11.85]]], "duration": [12.72, 3.87, 0.29, 45.24, 0.82, 11.06, 2.79]} \ No newline at end of file diff --git a/annotations_filtered/jot1h4tgY6M_filtered.json b/annotations_filtered/jot1h4tgY6M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c585eac9b7755f6dba94c443d928e68f9e51b257 --- /dev/null +++ b/annotations_filtered/jot1h4tgY6M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.31], [4.0, 4.06], [7.0, 8.8], [15.0, 16.41], [22.0, 24.07], [30.0, 30.38], [32.0, 33.61], [46.0, 46.68], [48.0, 49.91], [63.0, 63.15], [64.0, 64.4], [85.0, 88.32], [91.0, 91.07], [93.0, 93.09], [94.0, 98.86], [156.0, 163.14], [168.0, 174.95], [175.0, 175.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 49.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.88, 0.0, 0.0, 99.16, 33.17, 47.82, 0.0], "audiomae_on_audioset": [null, null, null, null, [["theremin", 39.77], ["music", 37.62], ["singing bowl", 1.88]], null, null, null, null, null, null, null, null, null, null, [["speech", 42.87], ["breaking", 23.29], ["glass", 20.99]], [["animal", 26.16], ["explosion", 17.41], ["eruption", 5.74]], null], "duration": [0.31, 0.06, 1.8, 1.41, 2.07, 0.38, 1.61, 0.68, 1.91, 0.15, 0.4, 3.32, 0.07, 0.09, 4.86, 7.14, 6.95, 0.02]} \ No newline at end of file diff --git a/annotations_filtered/jowNLHQCAAY_filtered.json b/annotations_filtered/jowNLHQCAAY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af9201a65e3d62613279ee11aee205d51eb9f1b3 --- /dev/null +++ b/annotations_filtered/jowNLHQCAAY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.85], [6.0, 6.69], [8.0, 10.13], [11.0, 12.48], [13.0, 14.01], [15.0, 15.5], [21.0, 20.7], [24.0, 24.66], [26.0, 26.69], [33.0, 36.96], [38.0, 38.97], [40.0, 41.2], [45.0, 45.66], [47.0, 47.8], [57.0, 60.13], [62.0, 63.39], [65.0, 66.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.85, 0.69, 2.13, 1.48, 1.01, 0.5, -0.3, 0.66, 0.69, 3.96, 0.97, 1.2, 0.66, 0.8, 3.13, 1.39, 1.21]} \ No newline at end of file diff --git a/annotations_filtered/jpEfgrff8z0_filtered.json b/annotations_filtered/jpEfgrff8z0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c97f90fe567006b5b7f2c5f9e258e0d7764fd814 --- /dev/null +++ b/annotations_filtered/jpEfgrff8z0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 4.72], [23.0, 23.38], [32.0, 35.94], [51.0, 51.31], [54.0, 54.09], [61.0, 61.8], [64.0, 63.78], [74.0, 73.99], [81.0, 85.06], [94.0, 95.07], [98.0, 103.28], [135.0, 136.56], [140.0, 140.17], [148.0, 149.52], [174.0, 177.5]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [99.98, 0.0, 98.86, 0.0, 0.0, 0.0, 0.0, 0.0, 31.02, 0.0, 65.67, 0.0, 0.0, 0.0, 32.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 19.37], ["music", 15.54], ["speech", 15.19]], null, null, null, null, null, [["music", 40.03], ["speech", 32.56], ["thunk", 10.13]]], "duration": [4.72, 0.38, 3.94, 0.31, 0.09, 0.8, -0.22, -0.01, 4.06, 1.07, 5.28, 1.56, 0.17, 1.52, 3.5]} \ No newline at end of file diff --git a/annotations_filtered/jpIVQIuoX1g_filtered.json b/annotations_filtered/jpIVQIuoX1g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..503b42cf4dbe37eebd88901c6684107bd980e01d --- /dev/null +++ b/annotations_filtered/jpIVQIuoX1g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.8], [9.0, 9.1], [11.0, 16.24], [17.0, 21.15], [24.0, 23.99], [25.0, 26.76], [31.0, 31.53], [34.0, 102.9], [105.0, 107.22]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 92.48, 93.76, 0.0, 0.0, 0.0, 0.0, 77.87], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.8, 0.1, 5.24, 4.15, -0.01, 1.76, 0.53, 68.9, 2.22]} \ No newline at end of file diff --git a/annotations_filtered/jpPCVq8UmX4_filtered.json b/annotations_filtered/jpPCVq8UmX4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1bea9b52c62341ff2b6c544a8c5d12a573f761b8 --- /dev/null +++ b/annotations_filtered/jpPCVq8UmX4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.02], [3.0, 3.6], [5.0, 5.54], [7.0, 8.01], [12.0, 11.7], [14.0, 14.08], [15.0, 15.99], [19.0, 19.58], [20.0, 20.7], [21.0, 21.54], [24.0, 25.03], [26.0, 26.0], [28.0, 30.08], [38.0, 38.08], [39.0, 63.61], [70.0, 70.53], [78.0, 78.87], [80.0, 79.86], [83.0, 83.98], [86.0, 104.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.56, 0.0, 36.03, 0.0, 0.0, 0.0, 0.0, 40.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 34.13], ["music", 14.5], ["hum", 6.34]], null, [["music", 66.76], ["carnatic music", 2.86], ["musical instrument", 2.81]], null, null, null, null, [["speech", 22.11], ["bee, wasp, etc.", 17.82], ["fly, housefly", 15.29]]], "duration": [0.02, 0.6, 0.54, 1.01, -0.3, 0.08, 0.99, 0.58, 0.7, 0.54, 1.03, 0.0, 2.08, 0.08, 24.61, 0.53, 0.87, -0.14, 0.98, 18.06]} \ No newline at end of file diff --git a/annotations_filtered/jpTj6qTyIwY_filtered.json b/annotations_filtered/jpTj6qTyIwY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..640d0e5ef69ab8fa73b4697a232d15ab657bb457 --- /dev/null +++ b/annotations_filtered/jpTj6qTyIwY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.74], [16.0, 16.63], [17.0, 17.9], [19.0, 19.62], [28.0, 36.95], [37.0, 47.92], [48.0, 52.2], [55.0, 64.5], [66.0, 67.24], [70.0, 76.5], [77.0, 78.38], [81.0, 81.84], [83.0, 87.2], [90.0, 102.93], [105.0, 104.72], [105.0, 105.31], [106.0, 113.53], [116.0, 133.74], [135.0, 135.55], [139.0, 141.34], [143.0, 143.8], [144.0, 156.34]], "keep_status": [false, false, false, false, false, true, true, true, false, false, false, false, true, false, false, false, true, true, false, false, false, false], "silence_prob": [52.05, 0.0, 0.0, 0.0, 36.6, 39.4, 42.72, 40.19, 0.0, 45.4, 0.0, 0.0, 35.99, 36.04, 0.0, 0.0, 34.58, 40.43, 0.0, 36.62, 0.0, 35.37], "audiomae_on_audioset": [null, null, null, null, [["music", 69.91], ["hum", 5.26], ["throbbing", 3.66]], [["hum", 27.91], ["speech", 19.81], ["mains hum", 12.1]], [["music", 25.18], ["hum", 22.7], ["speech", 9.51]], [["speech", 24.87], ["music", 22.35], ["sheep", 4.47]], null, [["speech", 41.93], ["music", 33.44], ["sidetone", 3.88]], null, null, [["didgeridoo", 25.15], ["groan", 17.71], ["music", 14.87]], [["livestock, farm animals, working animals", 33.01], ["cattle, bovinae", 30.35], ["moo", 24.11]], null, null, [["music", 29.43], ["fly, housefly", 11.49], ["cattle, bovinae", 8.38]], [["speech", 42.2], ["cattle, bovinae", 8.57], ["livestock, farm animals, working animals", 6.31]], null, [["whale vocalization", 88.98], ["moo", 1.33], ["livestock, farm animals, working animals", 0.85]], null, [["music", 50.17], ["speech", 26.75], ["musical instrument", 1.28]]], "duration": [4.74, 0.63, 0.9, 0.62, 8.95, 10.92, 4.2, 9.5, 1.24, 6.5, 1.38, 0.84, 4.2, 12.93, -0.28, 0.31, 7.53, 17.74, 0.55, 2.34, 0.8, 12.34]} \ No newline at end of file diff --git a/annotations_filtered/jpoR10Zh0ig_filtered.json b/annotations_filtered/jpoR10Zh0ig_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c146f91cef5b4512bd4e8793b08f5de78abc97d --- /dev/null +++ b/annotations_filtered/jpoR10Zh0ig_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.67], [6.0, 6.59], [8.0, 10.12], [12.0, 14.18], [16.0, 16.88], [19.0, 19.26], [21.0, 22.17], [24.0, 34.4], [37.0, 37.79], [40.0, 41.07], [45.0, 45.99], [48.0, 48.84], [50.0, 51.63], [56.0, 57.6], [61.0, 61.42], [62.0, 62.11], [63.0, 64.05], [66.0, 66.6], [67.0, 69.01], [71.0, 72.91], [74.0, 74.51], [75.0, 76.28], [79.0, 80.47], [88.0, 88.3], [94.0, 95.45], [97.0, 97.43], [98.0, 99.23], [108.0, 111.06], [117.0, 117.9], [121.0, 122.32], [123.0, 124.24], [126.0, 126.91], [128.0, 128.85], [132.0, 132.07], [133.0, 134.0], [139.0, 138.99], [145.0, 158.75], [160.0, 161.3], [163.0, 163.78], [165.0, 166.23], [167.0, 171.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.95, 66.51, 0.0, 0.0, 0.0, 53.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.01, 0.0, 0.0, 0.0, 79.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.67, 0.59, 2.12, 2.18, 0.88, 0.26, 1.17, 10.4, 0.79, 1.07, 0.99, 0.84, 1.63, 1.6, 0.42, 0.11, 1.05, 0.6, 2.01, 1.91, 0.51, 1.28, 1.47, 0.3, 1.45, 0.43, 1.23, 3.06, 0.9, 1.32, 1.24, 0.91, 0.85, 0.07, 1.0, -0.01, 13.75, 1.3, 0.78, 1.23, 4.83]} \ No newline at end of file diff --git a/annotations_filtered/jq2tARSds7M_filtered.json b/annotations_filtered/jq2tARSds7M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d75d295e014cb9db94bd17449c917eb304290c2 --- /dev/null +++ b/annotations_filtered/jq2tARSds7M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.14], [9.0, 26.43], [34.0, 36.88], [53.0, 53.97], [55.0, 56.15], [59.0, 70.7], [72.0, 74.58], [79.0, 85.28], [90.0, 90.64], [91.0, 92.43], [113.0, 119.26], [121.0, 120.82], [123.0, 123.52], [125.0, 125.27], [126.0, 128.82], [130.0, 130.76]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.26, 41.68, 0.0, 0.0, 65.91, 98.36, 41.14, 0.0, 0.0, 42.35, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, [["thunk", 13.98], ["animal", 13.87], ["electric shaver, electric razor", 10.38]], [["speech", 81.1], ["fart", 5.57], ["music", 0.73]], null, null, null, null, [["speech", 47.87], ["hum", 10.19], ["mains hum", 7.07]], null, null, [["music", 64.81], ["synthesizer", 5.16], ["throbbing", 3.58]], null, null, null, null, null], "duration": [0.14, 17.43, 2.88, 0.97, 1.15, 11.7, 2.58, 6.28, 0.64, 1.43, 6.26, -0.18, 0.52, 0.27, 2.82, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/jq_tO6NAlPI_filtered.json b/annotations_filtered/jq_tO6NAlPI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..958f09e3f3d437cbc7364f020e633fbc1de93e81 --- /dev/null +++ b/annotations_filtered/jq_tO6NAlPI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 17.54], [21.0, 31.29], [34.0, 35.77], [38.0, 39.63], [43.0, 43.97], [46.0, 48.39], [51.0, 51.49], [53.0, 54.41], [55.0, 56.64], [66.0, 66.82], [67.0, 66.85], [75.0, 75.17], [87.0, 90.63], [106.0, 111.45], [116.0, 119.3], [124.0, 125.51], [126.0, 127.67], [131.0, 140.16], [174.0, 178.51], [179.0, 179.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.52, 85.54, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.28, 32.19, 31.37, 0.0, 0.0, 30.52, 30.29, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 45.95], ["boing", 18.1], ["didgeridoo", 13.41]], [["music", 57.83], ["speech", 18.45], ["musical instrument", 2.7]], [["music", 60.21], ["didgeridoo", 17.0], ["boing", 5.39]], null, null, [["music", 90.58], ["didgeridoo", 1.97], ["electronic music", 1.28]], [["music", 61.35], ["boing", 9.33], ["didgeridoo", 3.69]], null], "duration": [2.54, 10.29, 1.77, 1.63, 0.97, 2.39, 0.49, 1.41, 1.64, 0.82, -0.15, 0.17, 3.63, 5.45, 3.3, 1.51, 1.67, 9.16, 4.51, 0.41]} \ No newline at end of file diff --git a/annotations_filtered/jqpkvCebSmU_filtered.json b/annotations_filtered/jqpkvCebSmU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09226084c53d3dc14f670445c75080e208911350 --- /dev/null +++ b/annotations_filtered/jqpkvCebSmU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 18.79], [20.0, 61.69], [62.0, 80.84], [82.0, 82.21], [87.0, 91.57], [92.0, 92.65]], "keep_status": [false, false, false, false, false, false], "silence_prob": [64.07, 0.0, 83.16, 0.0, 67.13, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [6.79, 41.69, 18.84, 0.21, 4.57, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/jqyhGCHT-v0_filtered.json b/annotations_filtered/jqyhGCHT-v0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad9da603ee94d881da3fc488a70feb4746f64338 --- /dev/null +++ b/annotations_filtered/jqyhGCHT-v0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.06], [6.0, 7.11], [10.0, 10.07], [23.0, 23.65], [26.0, 26.55], [32.0, 32.43], [37.0, 37.47], [45.0, 47.24], [51.0, 55.86], [56.0, 57.18], [58.0, 61.53], [62.0, 63.41], [64.0, 65.03], [72.0, 72.69]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.4, 43.71, 0.0, 62.78, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 34.24], ["speech", 23.63], ["theremin", 4.71]], null, null, null, null, null], "duration": [1.06, 1.11, 0.07, 0.65, 0.55, 0.43, 0.47, 2.24, 4.86, 1.18, 3.53, 1.41, 1.03, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/jqzTeVVmTvc_filtered.json b/annotations_filtered/jqzTeVVmTvc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..517139ccb57e5af66684dbe575dd08e2b23fffd6 --- /dev/null +++ b/annotations_filtered/jqzTeVVmTvc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.58], [8.0, 8.94], [12.0, 15.06], [16.0, 31.72], [32.0, 33.56], [34.0, 153.57]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.95, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.58, 0.94, 3.06, 15.72, 1.56, 119.57]} \ No newline at end of file diff --git a/annotations_filtered/jr60kvuKw3w_filtered.json b/annotations_filtered/jr60kvuKw3w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..03664c088a475ba32108786c53f4cf1684e560c5 --- /dev/null +++ b/annotations_filtered/jr60kvuKw3w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 21.17], [23.0, 23.58], [26.0, 45.17], [47.0, 55.31], [59.0, 60.71]], "keep_status": [false, false, true, true, false], "silence_prob": [75.72, 0.0, 32.21, 30.18, 0.0], "audiomae_on_audioset": [null, null, [["music", 52.21], ["speech", 5.63], ["quack", 3.75]], [["hum", 20.33], ["throbbing", 10.67], ["static", 10.27]], null], "duration": [2.17, 0.58, 19.17, 8.31, 1.71]} \ No newline at end of file diff --git a/annotations_filtered/jr7HNZg0ljU_filtered.json b/annotations_filtered/jr7HNZg0ljU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..578e72d9f45bf3595558435381c4af3da1042f7b --- /dev/null +++ b/annotations_filtered/jr7HNZg0ljU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.13], [19.0, 19.4], [20.0, 22.94], [26.0, 26.64], [37.0, 37.35], [38.0, 39.68], [41.0, 43.12], [44.0, 45.69], [46.0, 47.34], [48.0, 49.92], [51.0, 54.48], [58.0, 57.52], [59.0, 59.21], [60.0, 61.59], [63.0, 63.07], [64.0, 64.83], [67.0, 68.28], [69.0, 74.58], [75.0, 77.18], [79.0, 80.92], [81.0, 83.07], [89.0, 89.99], [100.0, 101.06], [103.0, 103.57], [105.0, 105.09], [110.0, 109.97], [113.0, 113.83], [119.0, 120.06], [122.0, 127.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 96.17, 0.0, 0.0, 0.0, 86.82, 0.0, 0.0, 0.0, 46.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.9, 69.34, 0.0, 57.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["hum", 27.03], ["music", 23.52], ["mains hum", 14.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.13, 0.4, 2.94, 0.64, 0.35, 1.68, 2.12, 1.69, 1.34, 1.92, 3.48, -0.48, 0.21, 1.59, 0.07, 0.83, 1.28, 5.58, 2.18, 1.92, 2.07, 0.99, 1.06, 0.57, 0.09, -0.03, 0.83, 1.06, 5.38]} \ No newline at end of file diff --git a/annotations_filtered/jr8BKtgMJA0_filtered.json b/annotations_filtered/jr8BKtgMJA0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef13a962bb5590da2b1e36fe402512d901bebdfb --- /dev/null +++ b/annotations_filtered/jr8BKtgMJA0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.56], [9.0, 9.15], [11.0, 18.76], [19.0, 18.94], [19.0, 19.92], [21.0, 20.88], [21.0, 22.2], [23.0, 24.27], [25.0, 26.87], [32.0, 32.9], [34.0, 35.83], [37.0, 38.3], [39.0, 40.29], [40.0, 40.85], [42.0, 44.63], [47.0, 48.32], [51.0, 52.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 29.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.01, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 54.75], ["music", 16.57], ["gong", 15.34]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.12], ["music", 28.61], ["musical instrument", 4.17]], null, null], "duration": [0.56, 0.15, 7.76, -0.06, 0.92, -0.12, 1.2, 1.27, 1.87, 0.9, 1.83, 1.3, 1.29, 0.85, 2.63, 1.32, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/jrIc1SlA7O8_filtered.json b/annotations_filtered/jrIc1SlA7O8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6fbe82a0688ed42716b1e054b66a3937fa2fef3 --- /dev/null +++ b/annotations_filtered/jrIc1SlA7O8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.26], [7.0, 6.54], [7.0, 6.57], [7.0, 6.61], [7.0, 6.64], [7.0, 12.12], [22.0, 22.27], [23.0, 23.35], [24.0, 24.85], [25.0, 26.28], [27.0, 27.77], [29.0, 29.81], [32.0, 32.39], [36.0, 35.58], [38.0, 39.73], [41.0, 42.04], [44.0, 46.11], [48.0, 49.27], [50.0, 54.23], [56.0, 58.9]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [47.23, 0.0, 0.0, 0.0, 0.0, 41.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.68, 0.0, 35.1, 35.12], "audiomae_on_audioset": [[["hum", 27.49], ["throbbing", 19.86], ["music", 17.1]], null, null, null, null, [["music", 41.74], ["speech", 22.52], ["hum", 10.62]], null, null, null, null, null, null, null, null, null, null, [["music", 71.25], ["didgeridoo", 6.15], ["throbbing", 3.08]], null, [["music", 34.09], ["hum", 28.73], ["mains hum", 13.09]], [["music", 62.76], ["theremin", 4.32], ["musical instrument", 2.92]]], "duration": [3.26, -0.46, -0.43, -0.39, -0.36, 5.12, 0.27, 0.35, 0.85, 1.28, 0.77, 0.81, 0.39, -0.42, 1.73, 1.04, 2.11, 1.27, 4.23, 2.9]} \ No newline at end of file diff --git a/annotations_filtered/jrLVuKks6lE_filtered.json b/annotations_filtered/jrLVuKks6lE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fc4d10521f5a7ff9a122516743ed974c0c66353 --- /dev/null +++ b/annotations_filtered/jrLVuKks6lE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 24.9], [28.0, 46.75], [47.0, 48.79], [49.0, 49.57], [55.0, 65.62], [66.0, 66.88], [71.0, 70.92], [76.0, 79.83], [82.0, 82.24], [92.0, 104.45], [107.0, 107.77], [115.0, 120.92], [124.0, 125.1], [128.0, 129.2], [132.0, 132.44]], "keep_status": [true, true, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [38.49, 32.52, 0.0, 0.0, 31.34, 0.0, 0.0, 32.72, 0.0, 48.61, 0.0, 43.96, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 44.17], ["hum", 15.93], ["mains hum", 7.46]], [["music", 42.26], ["buzz", 11.68], ["fly, housefly", 7.71]], null, null, [["cattle, bovinae", 37.37], ["livestock, farm animals, working animals", 32.08], ["moo", 24.44]], null, null, [["music", 49.75], ["didgeridoo", 15.73], ["theremin", 9.03]], null, [["hum", 28.13], ["music", 23.89], ["mains hum", 11.42]], null, [["music", 62.47], ["synthesizer", 7.66], ["throbbing", 4.48]], null, null, null], "duration": [11.9, 18.75, 1.79, 0.57, 10.62, 0.88, -0.08, 3.83, 0.24, 12.45, 0.77, 5.92, 1.1, 1.2, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/jrPvugl_NVA_filtered.json b/annotations_filtered/jrPvugl_NVA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c88f64643a6e571c7cf668b0636c38cf159ee3b --- /dev/null +++ b/annotations_filtered/jrPvugl_NVA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.02], [5.0, 5.19], [5.0, 5.78], [9.0, 9.83], [10.0, 14.99], [15.0, 15.69], [17.0, 20.75], [21.0, 22.27], [24.0, 24.88], [25.0, 25.47], [26.0, 26.4], [41.0, 41.66], [42.0, 42.06], [46.0, 51.26], [52.0, 52.17], [54.0, 54.51], [58.0, 62.63], [64.0, 65.58], [67.0, 67.2], [76.0, 86.32], [87.0, 88.3], [89.0, 89.4], [90.0, 97.21], [100.0, 101.02], [102.0, 102.22], [102.0, 109.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 79.24, 0.0, 62.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.41, 0.0, 0.0, 99.97, 0.0, 0.0, 90.25, 0.0, 0.0, 85.17, 0.0, 0.0, 89.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.02, 0.19, 0.78, 0.83, 4.99, 0.69, 3.75, 1.27, 0.88, 0.47, 0.4, 0.66, 0.06, 5.26, 0.17, 0.51, 4.63, 1.58, 0.2, 10.32, 1.3, 0.4, 7.21, 1.02, 0.22, 7.78]} \ No newline at end of file diff --git a/annotations_filtered/jr_bZ2gzRIY_filtered.json b/annotations_filtered/jr_bZ2gzRIY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26629dedca0d8bd591ffc9d6d12078d6a52ceb6e --- /dev/null +++ b/annotations_filtered/jr_bZ2gzRIY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.17], [14.0, 14.25], [17.0, 18.37], [20.0, 20.34], [22.0, 22.6], [27.0, 29.2], [33.0, 34.65], [35.0, 36.24], [38.0, 41.12], [54.0, 54.72], [56.0, 56.83], [57.0, 58.16], [61.0, 62.18], [72.0, 72.39], [74.0, 75.03], [77.0, 77.25], [78.0, 78.75], [81.0, 82.14], [84.0, 84.54], [86.0, 87.69], [88.0, 88.6], [89.0, 90.26], [90.0, 92.11], [93.0, 93.31], [97.0, 97.14], [101.0, 101.26], [107.0, 107.74], [108.0, 111.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 96.54, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.27, 0.0, 0.0, 0.0, 0.0, 99.65], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.17, 0.25, 1.37, 0.34, 0.6, 2.2, 1.65, 1.24, 3.12, 0.72, 0.83, 1.16, 1.18, 0.39, 1.03, 0.25, 0.75, 1.14, 0.54, 1.69, 0.6, 1.26, 2.11, 0.31, 0.14, 0.26, 0.74, 3.33]} \ No newline at end of file diff --git a/annotations_filtered/jrf263yJwic_filtered.json b/annotations_filtered/jrf263yJwic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0281f1c711d81af7259b72fe3a41d957f23b24f2 --- /dev/null +++ b/annotations_filtered/jrf263yJwic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.37], [3.0, 4.29], [12.0, 13.02], [22.0, 23.73], [25.0, 27.04], [29.0, 31.41], [33.0, 34.77], [36.0, 35.92], [36.0, 37.05], [39.0, 39.66], [45.0, 46.55], [49.0, 52.07], [53.0, 56.08], [57.0, 59.91], [71.0, 71.54], [73.0, 73.97], [80.0, 83.81], [85.0, 87.74], [88.0, 90.1], [92.0, 94.53], [95.0, 96.06], [97.0, 97.21], [103.0, 102.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 92.48, 91.64, 0.0, 0.0, 0.0, 0.0, 0.0, 84.25, 54.23, 88.46, 0.0, 0.0, 66.39, 65.09, 73.82, 77.87, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.37, 1.29, 1.02, 1.73, 2.04, 2.41, 1.77, -0.08, 1.05, 0.66, 1.55, 3.07, 3.08, 2.91, 0.54, 0.97, 3.81, 2.74, 2.1, 2.53, 1.06, 0.21, -0.26]} \ No newline at end of file diff --git a/annotations_filtered/jri0U57iWWM_filtered.json b/annotations_filtered/jri0U57iWWM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2d0e33921792efaeb8361e7ece0d5249283e26d --- /dev/null +++ b/annotations_filtered/jri0U57iWWM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.74], [12.0, 15.36], [17.0, 23.31], [24.0, 25.88], [29.0, 31.48], [34.0, 36.34], [38.0, 41.07], [43.0, 49.2], [50.0, 54.13], [61.0, 61.74], [69.0, 69.7], [76.0, 76.0], [77.0, 77.79], [115.0, 128.61], [133.0, 133.62], [140.0, 139.68], [141.0, 141.54], [145.0, 145.89], [146.0, 146.08], [146.0, 147.73], [153.0, 152.85], [168.0, 168.51]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 60.6, 47.62, 0.0, 62.58, 55.39, 48.31, 40.86, 37.06, 0.0, 0.0, 0.0, 0.0, 30.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 36.22], ["mains hum", 24.61], ["rumble", 6.32]], null, null, null, [["hum", 18.14], ["music", 14.46], ["mains hum", 5.43]], [["music", 68.1], ["theremin", 6.78], ["whistling", 3.88]], [["music", 61.85], ["guitar", 11.54], ["musical instrument", 9.76]], null, null, null, null, [["music", 85.31], ["didgeridoo", 4.05], ["musical instrument", 2.79]], null, null, null, null, null, null, null, null], "duration": [0.74, 3.36, 6.31, 1.88, 2.48, 2.34, 3.07, 6.2, 4.13, 0.74, 0.7, 0.0, 0.79, 13.61, 0.62, -0.32, 0.54, 0.89, 0.08, 1.73, -0.15, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/js-kku6X7yU_filtered.json b/annotations_filtered/js-kku6X7yU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7aaba8a341f1e78129e02c19ebeab38dcb220169 --- /dev/null +++ b/annotations_filtered/js-kku6X7yU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.45], [9.0, 9.68], [12.0, 11.87], [14.0, 14.99], [19.0, 20.09], [22.0, 23.95], [27.0, 28.65], [30.0, 31.11], [32.0, 32.02], [33.0, 40.12], [40.0, 40.15], [43.0, 48.83], [52.0, 52.88], [56.0, 56.73], [57.0, 58.18], [59.0, 60.08], [62.0, 62.53], [65.0, 68.34], [73.0, 73.94], [75.0, 76.22], [77.0, 81.84], [83.0, 84.03], [85.0, 90.42], [91.0, 92.4], [93.0, 94.15], [95.0, 96.11], [98.0, 98.44], [108.0, 108.8], [116.0, 116.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.9, 0.0, 65.67, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 99.87, 0.0, 89.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 81.13], ["fart", 4.61], ["music", 2.27]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 0.68, -0.13, 0.99, 1.09, 1.95, 1.65, 1.11, 0.02, 7.12, 0.15, 5.83, 0.88, 0.73, 1.18, 1.08, 0.53, 3.34, 0.94, 1.22, 4.84, 1.03, 5.42, 1.4, 1.15, 1.11, 0.44, 0.8, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/js11RqXLkZg_filtered.json b/annotations_filtered/js11RqXLkZg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10f102616a04dfce4fb5d58746f7d9fc0ed14c0b --- /dev/null +++ b/annotations_filtered/js11RqXLkZg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 13.58], [14.0, 29.07], [32.0, 33.39], [35.0, 37.1], [41.0, 42.47], [45.0, 46.01], [47.0, 49.23], [50.0, 52.86], [55.0, 56.98], [62.0, 64.5], [65.0, 68.0], [69.0, 74.38], [75.0, 79.56], [81.0, 84.82], [86.0, 86.78], [88.0, 89.85], [91.0, 95.3], [98.0, 100.67], [102.0, 106.19], [107.0, 109.16], [111.0, 121.66], [123.0, 126.81], [128.0, 129.22], [130.0, 132.7], [135.0, 139.08]], "keep_status": [false, false, false, true, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 46.57, 0.0, 0.0, 69.07, 40.07, 0.0, 98.99, 38.67, 99.91, 67.0, 53.22, 0.0, 0.0, 96.04, 51.28, 99.87, 98.51, 97.22, 72.16, 0.0, 93.45, 60.6], "audiomae_on_audioset": [null, null, null, [["sidetone", 24.88], ["speech", 17.51], ["music", 12.72]], null, null, null, [["music", 44.89], ["musical instrument", 6.47], ["hum", 6.27]], null, null, [["didgeridoo", 15.87], ["cattle, bovinae", 12.13], ["moo", 11.79]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.42, 15.07, 1.39, 2.1, 1.47, 1.01, 2.23, 2.86, 1.98, 2.5, 3.0, 5.38, 4.56, 3.82, 0.78, 1.85, 4.3, 2.67, 4.19, 2.16, 10.66, 3.81, 1.22, 2.7, 4.08]} \ No newline at end of file diff --git a/annotations_filtered/jsGX_I6mFvc_filtered.json b/annotations_filtered/jsGX_I6mFvc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61129ebd345e523a7a001b239c0adf140dced6b7 --- /dev/null +++ b/annotations_filtered/jsGX_I6mFvc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.78], [7.0, 25.96], [29.0, 29.34], [29.0, 29.74], [31.0, 34.1], [34.0, 38.82], [41.0, 41.52], [42.0, 43.23], [44.0, 44.22], [46.0, 46.99], [50.0, 50.85], [53.0, 52.95], [54.0, 88.7], [89.0, 105.68], [107.0, 116.4]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 44.6, 0.0, 0.0, 99.92, 75.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.0, 50.86], "audiomae_on_audioset": [null, [["music", 30.3], ["hum", 22.63], ["theremin", 11.58]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.22, 18.96, 0.34, 0.74, 3.1, 4.82, 0.52, 1.23, 0.22, 0.99, 0.85, -0.05, 34.7, 16.68, 9.4]} \ No newline at end of file diff --git a/annotations_filtered/jsL4-BxsZjA_filtered.json b/annotations_filtered/jsL4-BxsZjA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9f15b5ae476d8df28a8ff69bab9b8c4c2db7008 --- /dev/null +++ b/annotations_filtered/jsL4-BxsZjA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.35], [17.0, 17.83], [21.0, 21.47], [24.0, 25.64], [27.0, 29.25], [31.0, 35.82], [37.0, 41.67], [42.0, 47.82], [49.0, 51.38], [53.0, 57.72], [60.0, 62.19], [63.0, 68.62], [69.0, 68.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 96.04, 99.85, 100.0, 100.0, 99.99, 90.95, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.35, 0.83, 0.47, 1.64, 2.25, 4.82, 4.67, 5.82, 2.38, 4.72, 2.19, 5.62, -0.18]} \ No newline at end of file diff --git a/annotations_filtered/jsLOtv4yqIM_filtered.json b/annotations_filtered/jsLOtv4yqIM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28cc3df387b17c68228b089a693ecdf67672f680 --- /dev/null +++ b/annotations_filtered/jsLOtv4yqIM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.18], [4.0, 22.37], [23.0, 23.7], [25.0, 26.18], [28.0, 28.95], [30.0, 29.93], [30.0, 31.56], [34.0, 40.19], [42.0, 43.63], [46.0, 47.58], [50.0, 51.48], [54.0, 55.56], [57.0, 57.92], [59.0, 60.52], [62.0, 66.39], [67.0, 72.89], [73.0, 74.24], [75.0, 79.15], [81.0, 80.77], [81.0, 82.11], [84.0, 84.03], [85.0, 85.36], [86.0, 100.94], [102.0, 105.46], [106.0, 106.89], [108.0, 116.92], [117.0, 118.35]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.05, 0.0, 0.0, 0.0, 0.0, 0.0, 37.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.62, 40.61, 0.0, 42.3, 0.0, 0.0, 0.0, 0.0, 86.27, 99.95, 0.0, 99.05, 0.0], "audiomae_on_audioset": [null, [["music", 62.51], ["sidetone", 8.22], ["musical instrument", 7.01]], null, null, null, null, null, [["throbbing", 31.89], ["hum", 22.23], ["sidetone", 9.86]], null, null, null, null, null, null, null, [["speech", 27.03], ["radio", 16.89], ["sidetone", 15.47]], null, [["dial tone", 20.89], ["radio", 12.36], ["sidetone", 7.35]], null, null, null, null, null, null, null, null, null], "duration": [1.18, 18.37, 0.7, 1.18, 0.95, -0.07, 1.56, 6.19, 1.63, 1.58, 1.48, 1.56, 0.92, 1.52, 4.39, 5.89, 1.24, 4.15, -0.23, 1.11, 0.03, 0.36, 14.94, 3.46, 0.89, 8.92, 1.35]} \ No newline at end of file diff --git a/annotations_filtered/jsLUidiYm0w_filtered.json b/annotations_filtered/jsLUidiYm0w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee74d66ca4e08d48405d5f6aed436b51e60c7215 --- /dev/null +++ b/annotations_filtered/jsLUidiYm0w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.26], [8.0, 8.51], [18.0, 18.06], [24.0, 23.97], [27.0, 27.99], [35.0, 35.58], [36.0, 37.02], [41.0, 41.86], [51.0, 51.98], [52.0, 55.31], [61.0, 61.72], [62.0, 62.75], [63.0, 62.83], [63.0, 63.0], [69.0, 68.96], [96.0, 96.48], [98.0, 99.59], [117.0, 117.73], [118.0, 118.5], [120.0, 120.07], [126.0, 125.81], [129.0, 129.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.26, 0.51, 0.06, -0.03, 0.99, 0.58, 1.02, 0.86, 0.98, 3.31, 0.72, 0.75, -0.17, 0.0, -0.04, 0.48, 1.59, 0.73, 0.5, 0.07, -0.19, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/jsUGvhq2MLM_filtered.json b/annotations_filtered/jsUGvhq2MLM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f2b2cf476a0d51839d24e78ddd42dc2807621ff --- /dev/null +++ b/annotations_filtered/jsUGvhq2MLM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 18.0], [18.0, 19.14], [20.0, 25.37], [26.0, 26.92], [27.0, 32.49], [34.0, 41.59], [44.0, 47.06], [52.0, 55.68], [56.0, 60.13], [62.0, 65.37], [66.0, 66.92], [67.0, 86.51], [91.0, 93.65], [101.0, 104.13], [107.0, 111.74], [112.0, 122.98], [126.0, 142.15], [146.0, 147.07], [149.0, 162.38], [163.0, 167.68]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, true, true, true, false, false, false, false, false], "silence_prob": [30.35, 0.0, 30.38, 0.0, 30.55, 30.14, 40.55, 59.15, 63.53, 71.14, 0.0, 48.56, 41.09, 48.35, 41.48, 51.07, 32.94, 0.0, 32.18, 32.03], "audiomae_on_audioset": [[["music", 86.1], ["musical instrument", 1.23], ["singing", 1.2]], null, [["music", 38.15], ["moo", 12.18], ["cattle, bovinae", 10.04]], null, [["music", 78.48], ["theremin", 1.52], ["funk", 1.25]], [["music", 71.37], ["didgeridoo", 8.41], ["theremin", 2.11]], [["music", 21.43], ["snicker", 18.44], ["chuckle, chortle", 14.97]], null, null, null, null, [["music", 58.47], ["speech", 18.73], ["inside, small room", 4.95]], [["music", 21.09], ["didgeridoo", 18.38], ["tabla", 9.68]], [["speech", 23.02], ["music", 20.87], ["didgeridoo", 4.28]], [["speech", 24.72], ["sidetone", 17.91], ["didgeridoo", 10.0]], null, [["music", 79.56], ["musical instrument", 2.92], ["synthesizer", 1.77]], null, [["music", 82.73], ["swing music", 2.61], ["musical instrument", 2.3]], [["music", 57.6], ["musical instrument", 10.86], ["brass instrument", 4.85]]], "duration": [14.0, 1.14, 5.37, 0.92, 5.49, 7.59, 3.06, 3.68, 4.13, 3.37, 0.92, 19.51, 2.65, 3.13, 4.74, 10.98, 16.15, 1.07, 13.38, 4.68]} \ No newline at end of file diff --git a/annotations_filtered/jsZkkqLDFmg_filtered.json b/annotations_filtered/jsZkkqLDFmg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41b0c88944852a5ddbfccaa33ddff8b7f5572980 --- /dev/null +++ b/annotations_filtered/jsZkkqLDFmg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.83], [7.0, 22.45], [23.0, 27.63], [29.0, 35.01], [36.0, 38.13], [40.0, 40.93], [42.0, 42.11], [44.0, 44.83], [46.0, 46.28], [48.0, 50.68], [52.0, 54.62], [55.0, 55.76], [56.0, 57.35], [61.0, 62.78], [66.0, 70.6], [71.0, 72.32], [74.0, 74.43], [80.0, 81.43], [82.0, 83.44], [86.0, 86.39], [89.0, 89.46], [91.0, 91.56], [94.0, 95.2], [96.0, 97.58], [99.0, 100.21], [100.0, 101.12], [104.0, 103.71], [105.0, 105.93], [109.0, 110.81], [113.0, 113.24], [115.0, 115.5], [118.0, 118.2], [119.0, 119.69], [129.0, 130.18], [132.0, 146.42], [148.0, 149.5], [150.0, 154.01], [154.0, 157.84], [159.0, 160.69], [162.0, 163.59], [164.0, 167.17], [168.0, 169.75], [171.0, 171.54], [172.0, 174.09], [175.0, 176.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.97, 53.59, 34.01, 42.79, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 86.09, 0.0, 0.0, 0.0, 37.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.23, 0.0, 100.0, 89.9, 0.0, 0.0, 99.91, 0.0, 0.0, 87.92, 0.0], "audiomae_on_audioset": [null, null, [["speech", 79.11], ["beatboxing", 4.46], ["fart", 2.47]], [["ping", 65.26], ["bouncing", 3.78], ["chop", 3.35]], null, null, null, null, null, null, null, null, null, null, [["sidetone", 49.04], ["sine wave", 18.6], ["dial tone", 16.33]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 30.69], ["sine wave", 27.0], ["dial tone", 13.18]], null, null, null, null, null, null, null, null, null, null], "duration": [2.83, 15.45, 4.63, 6.01, 2.13, 0.93, 0.11, 0.83, 0.28, 2.68, 2.62, 0.76, 1.35, 1.78, 4.6, 1.32, 0.43, 1.43, 1.44, 0.39, 0.46, 0.56, 1.2, 1.58, 1.21, 1.12, -0.29, 0.93, 1.81, 0.24, 0.5, 0.2, 0.69, 1.18, 14.42, 1.5, 4.01, 3.84, 1.69, 1.59, 3.17, 1.75, 0.54, 2.09, 1.84]} \ No newline at end of file diff --git a/annotations_filtered/jsbjmWo3c38_filtered.json b/annotations_filtered/jsbjmWo3c38_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58a0f66b299d93738408ef49873be4f4b26512c9 --- /dev/null +++ b/annotations_filtered/jsbjmWo3c38_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 23.92], [25.0, 32.12], [37.0, 37.94], [41.0, 56.17], [58.0, 64.98], [67.0, 72.54], [74.0, 79.32], [81.0, 81.38], [83.0, 87.08], [90.0, 101.11]], "keep_status": [true, false, false, true, true, true, true, false, true, false], "silence_prob": [46.15, 30.68, 0.0, 30.28, 29.69, 30.16, 34.18, 0.0, 33.61, 30.66], "audiomae_on_audioset": [[["music", 46.71], ["synthesizer", 5.98], ["hum", 4.36]], [["speech", 56.75], ["music", 18.04], ["sidetone", 5.35]], null, [["music", 27.84], ["hum", 17.39], ["mains hum", 10.17]], [["music", 54.81], ["electronic music", 5.96], ["synthesizer", 4.8]], [["music", 46.66], ["noise", 7.29], ["cacophony", 6.34]], [["music", 41.15], ["hum", 8.08], ["mains hum", 5.6]], null, [["music", 21.47], ["speech", 9.23], ["vehicle", 2.32]], [["speech", 62.17], ["music", 11.0], ["didgeridoo", 4.95]]], "duration": [9.92, 7.12, 0.94, 15.17, 6.98, 5.54, 5.32, 0.38, 4.08, 11.11]} \ No newline at end of file diff --git a/annotations_filtered/jsyzJJFZzsg_filtered.json b/annotations_filtered/jsyzJJFZzsg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a523935cc8def32ada980c19f86f6ef1c5eab0ec --- /dev/null +++ b/annotations_filtered/jsyzJJFZzsg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.43], [10.0, 15.94], [25.0, 26.03], [27.0, 40.05], [65.0, 75.73], [77.0, 81.8], [83.0, 86.51], [87.0, 90.26]], "keep_status": [false, false, false, true, false, false, false, false], "silence_prob": [0.0, 54.5, 0.0, 40.64, 46.83, 67.13, 70.72, 66.03], "audiomae_on_audioset": [null, null, null, [["music", 52.1], ["cello", 4.96], ["double bass", 3.89]], [["music", 56.54], ["theremin", 14.67], ["musical instrument", 4.03]], null, null, null], "duration": [0.43, 5.94, 1.03, 13.05, 10.73, 4.8, 3.51, 3.26]} \ No newline at end of file diff --git a/annotations_filtered/jsz79bztNJI_filtered.json b/annotations_filtered/jsz79bztNJI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eecbd5d2acea0166c2bc1b5993ee6bfec98c4418 --- /dev/null +++ b/annotations_filtered/jsz79bztNJI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 21.14], [22.0, 22.65], [23.0, 59.88], [61.0, 81.38]], "keep_status": [true, false, false, true], "silence_prob": [28.55, 0.0, 0.0, 28.65], "audiomae_on_audioset": [[["vehicle", 23.88], ["buzz", 15.71], ["electric shaver, electric razor", 12.69]], null, null, [["music", 33.59], ["mains hum", 15.96], ["hum", 8.54]]], "duration": [18.14, 0.65, 36.88, 20.38]} \ No newline at end of file diff --git a/annotations_filtered/jszED6T4Gik_filtered.json b/annotations_filtered/jszED6T4Gik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb62f1e5fba9b89fc523492c8de6da9046d71161 --- /dev/null +++ b/annotations_filtered/jszED6T4Gik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.91], [4.0, 6.35], [7.0, 8.23], [10.0, 9.98], [14.0, 14.42], [21.0, 21.56], [29.0, 29.37], [31.0, 31.09], [36.0, 36.09], [42.0, 42.92], [53.0, 52.86], [54.0, 54.87], [64.0, 68.64], [70.0, 71.27], [80.0, 82.61], [86.0, 93.83], [99.0, 98.86], [99.0, 117.24], [118.0, 118.79], [119.0, 120.21], [121.0, 121.93], [123.0, 130.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.91, 92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.76, 0.0, 56.25, 95.64, 0.0, 80.82, 0.0, 0.0, 0.0, 90.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.91, 2.35, 1.23, -0.02, 0.42, 0.56, 0.37, 0.09, 0.09, 0.92, -0.14, 0.87, 4.64, 1.27, 2.61, 7.83, -0.14, 18.24, 0.79, 1.21, 0.93, 7.23]} \ No newline at end of file diff --git a/annotations_filtered/jt2BPBAWiEQ_filtered.json b/annotations_filtered/jt2BPBAWiEQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9eb22cf7620b93323fbd5f1ac7991f54aa5526c4 --- /dev/null +++ b/annotations_filtered/jt2BPBAWiEQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.55], [15.0, 15.63], [19.0, 20.49], [34.0, 36.61], [56.0, 59.24], [61.0, 61.26], [62.0, 62.83], [70.0, 74.31], [79.0, 78.95], [80.0, 80.99], [85.0, 88.38], [90.0, 91.15], [92.0, 95.4]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 49.54, 50.21, 0.0, 0.0, 46.26, 0.0, 0.0, 34.6, 0.0, 35.77], "audiomae_on_audioset": [null, null, null, [["hum", 33.27], ["throbbing", 25.51], ["music", 20.51]], null, null, null, [["music", 42.14], ["throbbing", 11.67], ["boing", 3.53]], null, null, [["hum", 25.93], ["speech", 18.82], ["mains hum", 10.99]], null, [["speech", 54.35], ["hum", 12.72], ["throbbing", 4.78]]], "duration": [1.55, 0.63, 1.49, 2.61, 3.24, 0.26, 0.83, 4.31, -0.05, 0.99, 3.38, 1.15, 3.4]} \ No newline at end of file diff --git a/annotations_filtered/jtQcr7lJXB0_filtered.json b/annotations_filtered/jtQcr7lJXB0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..118f5ed1ffd0fbd85c52aed5037bcfdfe9b354b7 --- /dev/null +++ b/annotations_filtered/jtQcr7lJXB0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.81], [5.0, 6.34], [9.0, 9.98], [12.0, 13.27], [17.0, 17.68], [20.0, 21.49], [23.0, 23.06], [26.0, 26.65], [29.0, 29.46], [30.0, 32.8], [34.0, 37.03], [38.0, 38.43], [41.0, 41.67], [46.0, 46.04], [58.0, 58.02], [60.0, 60.32], [62.0, 62.82], [66.0, 68.22], [71.0, 71.9], [75.0, 75.15], [80.0, 80.94], [87.0, 88.08], [89.0, 91.69], [94.0, 94.56], [99.0, 99.03], [105.0, 105.53], [107.0, 107.89], [110.0, 110.46], [115.0, 115.23], [117.0, 122.64], [124.0, 125.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 99.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 1.34, 0.98, 1.27, 0.68, 1.49, 0.06, 0.65, 0.46, 2.8, 3.03, 0.43, 0.67, 0.04, 0.02, 0.32, 0.82, 2.22, 0.9, 0.15, 0.94, 1.08, 2.69, 0.56, 0.03, 0.53, 0.89, 0.46, 0.23, 5.64, 1.76]} \ No newline at end of file diff --git a/annotations_filtered/jtSnHOkSJxM_filtered.json b/annotations_filtered/jtSnHOkSJxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/jtSnHOkSJxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/ju9K6nk07iE_filtered.json b/annotations_filtered/ju9K6nk07iE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4c09bcaeb2618060424021e71116d9ff14393be --- /dev/null +++ b/annotations_filtered/ju9K6nk07iE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.77], [19.0, 27.68], [32.0, 44.19], [46.0, 49.82], [51.0, 182.36], [182.0, 186.87], [188.0, 188.32], [191.0, 192.13], [194.0, 199.3], [201.0, 205.11], [206.0, 212.33], [214.0, 218.98], [221.0, 223.13], [225.0, 226.83]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.94, 35.67, 38.47, 0.0, 62.47, 0.0, 0.0, 90.25, 93.13, 87.55, 82.79, 79.59, 0.0], "audiomae_on_audioset": [null, [["music", 71.36], ["theremin", 9.08], ["musical instrument", 2.44]], [["music", 42.62], ["theremin", 8.84], ["piano", 6.32]], [["music", 45.59], ["theremin", 16.92], ["cello", 3.22]], null, null, null, null, null, null, null, null, null, null], "duration": [1.77, 8.68, 12.19, 3.82, 131.36, 4.87, 0.32, 1.13, 5.3, 4.11, 6.33, 4.98, 2.13, 1.83]} \ No newline at end of file diff --git a/annotations_filtered/jusrkQ2Zg8o_filtered.json b/annotations_filtered/jusrkQ2Zg8o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2741eeab8d3c86ff1ecf5a7807ff9f99df6e36c0 --- /dev/null +++ b/annotations_filtered/jusrkQ2Zg8o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.36], [1.0, 1.54], [6.0, 9.58], [11.0, 14.0], [16.0, 17.09], [19.0, 19.55], [21.0, 22.32], [29.0, 42.3], [43.0, 47.16], [50.0, 76.74]], "keep_status": [false, false, false, true, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 50.51, 43.2, 0.0, 0.0, 0.0, 55.96, 31.02, 31.28], "audiomae_on_audioset": [null, null, null, [["music", 27.4], ["hum", 20.26], ["mains hum", 10.28]], null, null, null, null, [["speech", 29.69], ["gunshot, gunfire", 21.36], ["fusillade", 4.81]], [["music", 50.69], ["throbbing", 16.83], ["hum", 9.21]]], "duration": [0.36, 0.54, 3.58, 3.0, 1.09, 0.55, 1.32, 13.3, 4.16, 26.74]} \ No newline at end of file diff --git a/annotations_filtered/jutOpRQ7Osg_filtered.json b/annotations_filtered/jutOpRQ7Osg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d0dfb1665afffb6f3cad8fbbc4d627a90677f50 --- /dev/null +++ b/annotations_filtered/jutOpRQ7Osg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.0], [14.0, 15.38], [16.0, 16.46], [18.0, 21.96], [27.0, 30.7], [32.0, 35.46], [39.0, 45.42], [46.0, 47.09], [48.0, 49.0], [49.0, 49.4], [50.0, 50.48], [57.0, 58.31], [60.0, 63.09], [70.0, 71.0], [72.0, 72.71], [78.0, 78.46], [80.0, 80.43], [81.0, 82.61], [84.0, 85.46], [90.0, 91.23], [93.0, 94.59], [98.0, 99.47], [100.0, 101.06], [103.0, 104.19], [107.0, 107.38], [110.0, 111.81], [113.0, 114.79], [123.0, 123.89], [147.0, 148.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 57.25, 51.71, 73.97, 71.43, 0.0, 0.0, 0.0, 0.0, 0.0, 77.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 1.38, 0.46, 3.96, 3.7, 3.46, 6.42, 1.09, 1.0, 0.4, 0.48, 1.31, 3.09, 1.0, 0.71, 0.46, 0.43, 1.61, 1.46, 1.23, 1.59, 1.47, 1.06, 1.19, 0.38, 1.81, 1.79, 0.89, 1.15]} \ No newline at end of file diff --git a/annotations_filtered/juw328OfWnM_filtered.json b/annotations_filtered/juw328OfWnM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..807c97e1cd351d046789ece7baf4e1e579f3287a --- /dev/null +++ b/annotations_filtered/juw328OfWnM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.99], [8.0, 10.64], [12.0, 13.85], [17.0, 17.32], [20.0, 20.38], [22.0, 25.2], [26.0, 28.07], [31.0, 32.95], [34.0, 35.99], [38.0, 39.28], [43.0, 43.5], [53.0, 53.89], [56.0, 57.7], [61.0, 62.36], [68.0, 68.96], [73.0, 74.34], [78.0, 81.68], [85.0, 86.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 83.52, 0.0, 0.0, 0.0, 85.72, 62.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.99, 2.64, 1.85, 0.32, 0.38, 3.2, 2.07, 1.95, 1.99, 1.28, 0.5, 0.89, 1.7, 1.36, 0.96, 1.34, 3.68, 1.16]} \ No newline at end of file diff --git a/annotations_filtered/jv2MsLBMi9U_filtered.json b/annotations_filtered/jv2MsLBMi9U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4ed1700c8df768ca856ff94ed8dfa3633ac9a82 --- /dev/null +++ b/annotations_filtered/jv2MsLBMi9U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.65], [6.0, 6.88], [8.0, 8.4], [11.0, 11.21], [13.0, 13.64], [15.0, 15.96], [17.0, 17.19], [19.0, 18.67], [20.0, 20.71], [22.0, 25.1], [26.0, 26.55], [27.0, 28.43], [30.0, 30.92], [34.0, 33.99], [37.0, 37.72], [40.0, 48.44], [52.0, 53.92], [55.0, 56.32], [57.0, 58.75], [65.0, 64.86], [65.0, 65.45], [71.0, 73.85], [82.0, 82.14], [85.0, 85.83], [88.0, 87.98], [90.0, 92.1], [97.0, 100.85], [102.0, 108.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.65, 0.88, 0.4, 0.21, 0.64, 0.96, 0.19, -0.33, 0.71, 3.1, 0.55, 1.43, 0.92, -0.01, 0.72, 8.44, 1.92, 1.32, 1.75, -0.14, 0.45, 2.85, 0.14, 0.83, -0.02, 2.1, 3.85, 6.06]} \ No newline at end of file diff --git a/annotations_filtered/jv6-p4kphmc_filtered.json b/annotations_filtered/jv6-p4kphmc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59975c974620a2320a328ceeb4cabfa661be0865 --- /dev/null +++ b/annotations_filtered/jv6-p4kphmc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.18], [16.0, 19.09], [21.0, 21.68], [23.0, 23.4], [24.0, 26.45], [28.0, 34.79], [36.0, 37.79], [39.0, 58.38], [59.0, 60.69], [61.0, 69.74], [75.0, 76.06], [79.0, 81.48], [82.0, 87.27], [89.0, 89.36], [96.0, 97.95], [100.0, 101.26], [102.0, 102.68], [107.0, 107.25], [108.0, 108.24], [109.0, 109.59], [111.0, 116.83], [118.0, 120.38], [121.0, 125.88], [129.0, 130.11], [131.0, 131.85], [133.0, 133.78], [134.0, 135.18]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 85.72, 0.0, 0.0, 42.11, 85.9, 0.0, 96.54, 0.0, 87.19, 0.0, 51.23, 51.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.63, 42.22, 63.1, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 21.62], ["hum", 20.74], ["music", 14.27]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.83], ["musical instrument", 6.72], ["speech", 3.94]], null, null, null, null, null], "duration": [1.18, 3.09, 0.68, 0.4, 2.45, 6.79, 1.79, 19.38, 1.69, 8.74, 1.06, 2.48, 5.27, 0.36, 1.95, 1.26, 0.68, 0.25, 0.24, 0.59, 5.83, 2.38, 4.88, 1.11, 0.85, 0.78, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/jvBp6TqoHWw_filtered.json b/annotations_filtered/jvBp6TqoHWw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95e81567ed467e6a5a615beb33e98cd609e28daf --- /dev/null +++ b/annotations_filtered/jvBp6TqoHWw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.51], [3.0, 3.79], [5.0, 5.19], [11.0, 14.2], [15.0, 18.62], [22.0, 22.25], [24.0, 25.44], [27.0, 27.36], [30.0, 31.36], [34.0, 34.38], [34.0, 34.42], [34.0, 35.26], [44.0, 44.46], [48.0, 48.03], [50.0, 50.38], [51.0, 51.12], [52.0, 52.51], [55.0, 55.36], [56.0, 63.53], [65.0, 65.45], [75.0, 74.97], [76.0, 76.65], [87.0, 87.83], [89.0, 89.43], [89.0, 89.46], [90.0, 90.46], [93.0, 97.26], [100.0, 102.52], [109.0, 110.44], [111.0, 111.37], [112.0, 111.97], [115.0, 117.14], [118.0, 119.26], [120.0, 120.83], [123.0, 129.78], [131.0, 132.0], [132.0, 133.83], [135.0, 136.11], [138.0, 137.64], [140.0, 140.81], [143.0, 143.82], [144.0, 146.42], [150.0, 152.66], [154.0, 154.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 95.23, 72.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.91, 87.0, 0.0, 0.0, 0.0, 45.24, 0.0, 0.0, 38.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.39, 39.4, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 36.97], ["music", 32.79], ["sidetone", 3.99]], null, null, [["music", 50.79], ["thunk", 18.93], ["musical instrument", 4.15]], null, null, null, null, null, null, null, [["music", 38.54], ["trombone", 12.03], ["brass instrument", 6.25]], null], "duration": [0.51, 0.79, 0.19, 3.2, 3.62, 0.25, 1.44, 0.36, 1.36, 0.38, 0.42, 1.26, 0.46, 0.03, 0.38, 0.12, 0.51, 0.36, 7.53, 0.45, -0.03, 0.65, 0.83, 0.43, 0.46, 0.46, 4.26, 2.52, 1.44, 0.37, -0.03, 2.14, 1.26, 0.83, 6.78, 1.0, 1.83, 1.11, -0.36, 0.81, 0.82, 2.42, 2.66, 0.35]} \ No newline at end of file diff --git a/annotations_filtered/jvZk0rzVeBw_filtered.json b/annotations_filtered/jvZk0rzVeBw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..312c3e66730f1e52a081aa3f66881bf89058a157 --- /dev/null +++ b/annotations_filtered/jvZk0rzVeBw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.16], [6.0, 7.99], [12.0, 14.52], [16.0, 17.49], [18.0, 19.45], [21.0, 21.79], [25.0, 25.17], [28.0, 29.66], [31.0, 32.66], [38.0, 38.64], [41.0, 43.66], [46.0, 47.28], [48.0, 49.77], [54.0, 55.31], [58.0, 58.78], [61.0, 63.02], [65.0, 65.42], [68.0, 68.55], [70.0, 71.31], [76.0, 78.31], [83.0, 84.3], [85.0, 93.45], [96.0, 98.83], [99.0, 102.41], [104.0, 106.19], [107.0, 107.7], [109.0, 111.2], [114.0, 114.88]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [33.49, 0.0, 35.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.93, 0.0, 0.0, 0.0, 0.0, 36.79, 0.0, 0.0, 0.0, 32.96, 0.0, 36.11, 34.56, 33.46, 37.74, 0.0, 35.95, 0.0], "audiomae_on_audioset": [[["music", 68.38], ["synthesizer", 3.94], ["musical instrument", 3.83]], null, [["music", 48.75], ["speech", 3.82], ["animal", 2.91]], null, null, null, null, null, null, null, [["music", 67.81], ["musical instrument", 4.96], ["guitar", 4.15]], null, null, null, null, [["music", 51.39], ["didgeridoo", 8.3], ["musical instrument", 4.88]], null, null, null, [["speech", 37.86], ["music", 31.23], ["singing bowl", 4.86]], null, [["music", 61.84], ["synthesizer", 10.36], ["theremin", 4.23]], [["music", 79.22], ["grunt", 3.95], ["didgeridoo", 1.53]], [["music", 43.47], ["speech", 19.38], ["synthesizer", 5.0]], [["music", 61.37], ["theremin", 13.11], ["musical instrument", 5.75]], null, [["music", 71.75], ["musical instrument", 5.36], ["synthesizer", 3.8]], null], "duration": [2.16, 1.99, 2.52, 1.49, 1.45, 0.79, 0.17, 1.66, 1.66, 0.64, 2.66, 1.28, 1.77, 1.31, 0.78, 2.02, 0.42, 0.55, 1.31, 2.31, 1.3, 8.45, 2.83, 3.41, 2.19, 0.7, 2.2, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/jw41pJtU6eY_filtered.json b/annotations_filtered/jw41pJtU6eY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4368565fa9b51676405d837136c904a3c3dd8de --- /dev/null +++ b/annotations_filtered/jw41pJtU6eY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.65], [7.0, 7.91], [8.0, 8.82], [10.0, 18.71], [21.0, 21.46], [24.0, 24.43], [25.0, 26.77], [27.0, 30.23], [34.0, 39.53], [40.0, 41.89], [46.0, 50.03], [51.0, 52.07], [53.0, 53.74], [56.0, 57.06], [63.0, 63.85], [67.0, 68.79], [71.0, 78.63], [84.0, 85.65], [88.0, 93.83], [96.0, 99.55], [104.0, 107.28], [109.0, 109.31], [112.0, 121.63]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.34, 0.0, 0.0, 0.0, 41.1, 31.39, 0.0, 32.32, 0.0, 0.0, 0.0, 0.0, 0.0, 32.0, 0.0, 37.49, 34.09, 43.38, 0.0, 34.78], "audiomae_on_audioset": [null, null, null, [["music", 66.07], ["throbbing", 9.4], ["synthesizer", 9.17]], null, null, null, [["music", 30.05], ["didgeridoo", 14.88], ["foghorn", 13.71]], [["music", 37.98], ["theremin", 12.63], ["synthesizer", 9.71]], null, [["music", 39.83], ["speech", 39.69], ["eruption", 2.57]], null, null, null, null, null, [["music", 50.59], ["theremin", 6.52], ["throbbing", 5.69]], null, [["music", 53.25], ["didgeridoo", 4.89], ["hum", 4.12]], [["music", 35.27], ["brass instrument", 21.68], ["trombone", 18.08]], [["speech", 23.37], ["music", 16.68], ["synthesizer", 7.17]], null, [["music", 48.94], ["throbbing", 20.82], ["timpani", 3.81]]], "duration": [0.65, 0.91, 0.82, 8.71, 0.46, 0.43, 1.77, 3.23, 5.53, 1.89, 4.03, 1.07, 0.74, 1.06, 0.85, 1.79, 7.63, 1.65, 5.83, 3.55, 3.28, 0.31, 9.63]} \ No newline at end of file diff --git a/annotations_filtered/jwjCPSUGPXU_filtered.json b/annotations_filtered/jwjCPSUGPXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd04fc0b908ee03dd9e7bb51ca9c35abb44e8706 --- /dev/null +++ b/annotations_filtered/jwjCPSUGPXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.28], [10.0, 11.69], [16.0, 17.58], [21.0, 22.38], [23.0, 24.58], [25.0, 27.04], [32.0, 32.58], [34.0, 34.4], [40.0, 40.74], [48.0, 49.5], [52.0, 52.56], [54.0, 56.03], [61.0, 60.69], [70.0, 72.23], [75.0, 78.44]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 44.84, 0.0, 0.0, 0.0, 0.0, 0.0, 42.44, 0.0, 36.27, 57.01], "audiomae_on_audioset": [null, null, null, null, null, [["sidetone", 29.39], ["music", 17.39], ["hum", 10.42]], null, null, null, null, null, [["whale vocalization", 30.24], ["music", 13.29], ["frog", 6.99]], null, [["grunt", 34.34], ["speech", 9.8], ["animal", 6.29]], null], "duration": [0.28, 1.69, 1.58, 1.38, 1.58, 2.04, 0.58, 0.4, 0.74, 1.5, 0.56, 2.03, -0.31, 2.23, 3.44]} \ No newline at end of file diff --git a/annotations_filtered/jwnPI-d36vU_filtered.json b/annotations_filtered/jwnPI-d36vU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34e027c639309c03de8dd9e1e645b2a2d15295a2 --- /dev/null +++ b/annotations_filtered/jwnPI-d36vU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 30.25], [31.0, 32.22], [33.0, 34.57], [36.0, 37.54], [38.0, 41.99], [43.0, 44.09], [45.0, 63.42], [64.0, 69.65], [70.0, 71.69], [72.0, 74.63], [77.0, 78.36], [80.0, 97.71], [98.0, 98.52], [101.0, 108.73], [110.0, 115.28], [118.0, 120.7], [122.0, 121.98], [122.0, 122.12], [122.0, 132.53], [133.0, 134.6], [136.0, 136.11], [141.0, 142.06], [144.0, 152.49]], "keep_status": [true, false, false, false, false, false, true, true, false, false, false, true, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [31.9, 0.0, 0.0, 0.0, 34.16, 0.0, 37.13, 39.01, 0.0, 34.98, 0.0, 31.04, 0.0, 30.18, 37.43, 36.57, 0.0, 0.0, 40.36, 0.0, 0.0, 0.0, 62.17], "audiomae_on_audioset": [[["music", 17.98], ["sound effect", 7.57], ["roar", 6.03]], null, null, null, [["noise", 77.11], ["music", 7.52], ["synthesizer", 1.63]], null, [["music", 38.95], ["didgeridoo", 10.51], ["noise", 9.83]], [["whale vocalization", 29.69], ["music", 25.91], ["speech", 7.88]], null, [["thunk", 42.94], ["whack, thwack", 15.0], ["music", 13.4]], null, [["music", 20.3], ["hum", 16.83], ["livestock, farm animals, working animals", 10.39]], null, [["music", 13.58], ["electric shaver, electric razor", 7.24], ["whack, thwack", 6.96]], [["hum", 28.71], ["music", 18.65], ["throbbing", 10.2]], [["speech", 43.58], ["music", 25.39], ["fart", 7.2]], null, null, [["speech", 44.61], ["music", 35.73], ["hum", 3.48]], null, null, null, null], "duration": [3.25, 1.22, 1.57, 1.54, 3.99, 1.09, 18.42, 5.65, 1.69, 2.63, 1.36, 17.71, 0.52, 7.73, 5.28, 2.7, -0.02, 0.12, 10.53, 1.6, 0.11, 1.06, 8.49]} \ No newline at end of file diff --git a/annotations_filtered/jwrWJXtNYWU_filtered.json b/annotations_filtered/jwrWJXtNYWU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bff0ac16f288b476cdb82d186fc020be7b84677c --- /dev/null +++ b/annotations_filtered/jwrWJXtNYWU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.97], [8.0, 9.61], [10.0, 10.61], [17.0, 17.24], [25.0, 24.76], [28.0, 28.48]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.97, 1.61, 0.61, 0.24, -0.24, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/jx6Rgn1ioAk_filtered.json b/annotations_filtered/jx6Rgn1ioAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f34c8b8ed1940346c53ca8522b5fd08ad353aec3 --- /dev/null +++ b/annotations_filtered/jx6Rgn1ioAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.6], [11.0, 18.23]], "keep_status": [false, false], "silence_prob": [0.0, 31.37], "audiomae_on_audioset": [null, [["music", 81.63], ["musical instrument", 3.47], ["singing", 3.18]]], "duration": [0.6, 7.23]} \ No newline at end of file diff --git a/annotations_filtered/jx757TP9spg_filtered.json b/annotations_filtered/jx757TP9spg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e5af9a688310232e1584c7af92904f097d8c6dd --- /dev/null +++ b/annotations_filtered/jx757TP9spg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.44], [15.0, 15.62], [26.0, 26.33], [27.0, 27.28], [31.0, 33.22], [36.0, 44.51], [45.0, 45.69], [56.0, 56.76], [62.0, 62.46], [84.0, 85.4], [91.0, 96.52], [97.0, 99.23], [99.0, 100.84], [102.0, 102.2], [103.0, 103.69], [106.0, 108.63], [109.0, 110.91], [112.0, 114.0], [118.0, 118.17], [127.0, 139.14], [142.0, 145.02], [147.0, 147.8], [152.0, 155.68], [158.0, 158.57], [159.0, 160.05], [162.0, 163.12], [164.0, 166.31], [166.0, 166.45]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.68, 33.59, 0.0, 0.0, 0.0, 0.0, 97.92, 88.28, 0.0, 0.0, 0.0, 82.25, 0.0, 100.0, 0.0, 99.56, 99.68, 0.0, 96.77, 0.0, 0.0, 0.0, 32.91, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 42.31], ["music", 18.06], ["boing", 4.33]], [["speech", 51.23], ["whack, thwack", 8.92], ["fart", 6.48]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["beatboxing", 26.52], ["inside, small room", 6.9], ["speech", 6.46]], null], "duration": [1.44, 0.62, 0.33, 0.28, 2.22, 8.51, 0.69, 0.76, 0.46, 1.4, 5.52, 2.23, 1.84, 0.2, 0.69, 2.63, 1.91, 2.0, 0.17, 12.14, 3.02, 0.8, 3.68, 0.57, 1.05, 1.12, 2.31, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/jyDUZd-Orlc_filtered.json b/annotations_filtered/jyDUZd-Orlc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba04fcb6c4968a359bec10154a7ed616f3404682 --- /dev/null +++ b/annotations_filtered/jyDUZd-Orlc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.42], [15.0, 20.49], [21.0, 26.08], [27.0, 27.26], [30.0, 68.22], [69.0, 82.98], [84.0, 86.46], [92.0, 92.94], [95.0, 96.23], [98.0, 106.2], [107.0, 107.45], [108.0, 109.36], [110.0, 113.66], [115.0, 160.42], [161.0, 161.25], [162.0, 162.99], [163.0, 175.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [99.4, 67.13, 92.31, 0.0, 0.0, 28.91, 30.12, 0.0, 0.0, 28.65, 0.0, 0.0, 29.12, 0.0, 0.0, 0.0, 41.91], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 73.13], ["music", 11.7], ["electronic music", 1.35]], [["music", 55.89], ["throbbing", 9.53], ["speech", 4.94]], null, null, [["speech", 46.06], ["music", 40.55], ["hum", 3.02]], null, null, [["music", 27.55], ["speech", 18.95], ["hum", 13.48]], null, null, null, [["music", 33.02], ["gasp", 11.33], ["groan", 10.0]]], "duration": [4.42, 5.49, 5.08, 0.26, 38.22, 13.98, 2.46, 0.94, 1.23, 8.2, 0.45, 1.36, 3.66, 45.42, 0.25, 0.99, 12.85]} \ No newline at end of file diff --git a/annotations_filtered/jyNtMzHeJ6I_filtered.json b/annotations_filtered/jyNtMzHeJ6I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1294b72e7b253889550d8c08c77dc42a3e6439ee --- /dev/null +++ b/annotations_filtered/jyNtMzHeJ6I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 9.09], [16.0, 16.97], [26.0, 26.7], [29.0, 30.27], [33.0, 34.42], [35.0, 36.9], [41.0, 43.28], [43.0, 43.46], [43.0, 47.12], [49.0, 50.08], [51.0, 51.83], [60.0, 61.16], [64.0, 64.5], [66.0, 67.76], [69.0, 74.38], [77.0, 77.82], [79.0, 79.93], [82.0, 82.46], [85.0, 95.44], [98.0, 99.45], [102.0, 102.74], [103.0, 110.0], [113.0, 116.72], [119.0, 120.73], [122.0, 123.08], [129.0, 130.67], [134.0, 135.45], [138.0, 138.01], [141.0, 141.71], [150.0, 150.42], [154.0, 154.99], [161.0, 161.4], [167.0, 172.35], [173.0, 175.24]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [53.72, 0.0, 0.0, 0.0, 0.0, 0.0, 96.42, 0.0, 46.22, 0.0, 0.0, 0.0, 0.0, 0.0, 32.24, 0.0, 0.0, 0.0, 30.53, 0.0, 0.0, 29.95, 86.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.57, 63.85], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 45.33], ["hum", 15.34], ["music", 9.02]], null, null, null, null, null, [["speech", 38.53], ["music", 18.76], ["thunk", 3.15]], null, null, null, [["music", 70.5], ["hip hop music", 4.92], ["electronic music", 4.55]], null, null, [["music", 77.46], ["electronic music", 4.33], ["hip hop music", 2.73]], null, null, null, null, null, null, null, null, null, null, [["speech", 67.21], ["sidetone", 5.21], ["music", 3.99]], null], "duration": [7.09, 0.97, 0.7, 1.27, 1.42, 1.9, 2.28, 0.46, 4.12, 1.08, 0.83, 1.16, 0.5, 1.76, 5.38, 0.82, 0.93, 0.46, 10.44, 1.45, 0.74, 7.0, 3.72, 1.73, 1.08, 1.67, 1.45, 0.01, 0.71, 0.42, 0.99, 0.4, 5.35, 2.24]} \ No newline at end of file diff --git a/annotations_filtered/jyO1ILQAGsU_filtered.json b/annotations_filtered/jyO1ILQAGsU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..287a5083b2800d66b4b94bd4d10a5a9176087d15 --- /dev/null +++ b/annotations_filtered/jyO1ILQAGsU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.29], [9.0, 14.74], [15.0, 16.95], [19.0, 19.3], [20.0, 20.68], [22.0, 23.58], [32.0, 41.89], [43.0, 43.55], [46.0, 47.14], [48.0, 48.71], [50.0, 50.67], [57.0, 58.46], [61.0, 61.25], [62.0, 62.73], [67.0, 68.07], [73.0, 73.7], [75.0, 76.03], [87.0, 87.88], [97.0, 97.75], [103.0, 103.45], [107.0, 107.77], [109.0, 109.61], [113.0, 113.78], [115.0, 118.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [93.29, 98.19, 0.0, 0.0, 0.0, 0.0, 58.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.87], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.29, 5.74, 1.95, 0.3, 0.68, 1.58, 9.89, 0.55, 1.14, 0.71, 0.67, 1.46, 0.25, 0.73, 1.07, 0.7, 1.03, 0.88, 0.75, 0.45, 0.77, 0.61, 0.78, 3.25]} \ No newline at end of file diff --git a/annotations_filtered/jyZU7lfGjyk_filtered.json b/annotations_filtered/jyZU7lfGjyk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6119a69b1a330704e0b617b0f1e3ed6ffd92fde1 --- /dev/null +++ b/annotations_filtered/jyZU7lfGjyk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.64], [9.0, 139.11]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [0.64, 130.11]} \ No newline at end of file diff --git a/annotations_filtered/jypAc6XYFfA_filtered.json b/annotations_filtered/jypAc6XYFfA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d11ffd1b76ac30754270cb23058b39f15b390ad --- /dev/null +++ b/annotations_filtered/jypAc6XYFfA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.43], [7.0, 8.11], [17.0, 20.31], [23.0, 23.95], [28.0, 29.3], [33.0, 39.95], [40.0, 51.53], [53.0, 54.46], [57.0, 57.81], [61.0, 64.23], [65.0, 68.67], [70.0, 78.88], [81.0, 84.65], [85.0, 85.72], [86.0, 102.05], [106.0, 112.62], [115.0, 116.23]], "keep_status": [true, false, true, false, false, false, true, false, false, true, false, false, true, false, false, true, false], "silence_prob": [45.3, 0.0, 43.77, 0.0, 0.0, 39.41, 44.43, 0.0, 0.0, 43.08, 43.82, 41.4, 32.87, 0.0, 34.65, 34.08, 0.0], "audiomae_on_audioset": [[["hum", 20.99], ["mains hum", 17.67], ["speech", 12.99]], null, [["speech", 18.92], ["rumble", 17.02], ["hum", 7.17]], null, null, [["speech", 58.7], ["music", 9.64], ["didgeridoo", 9.54]], [["hum", 35.68], ["mains hum", 29.23], ["throbbing", 4.19]], null, null, [["music", 14.19], ["hum", 13.34], ["sine wave", 7.57]], [["sine wave", 61.98], ["chirp tone", 14.44], ["singing bowl", 8.59]], [["hum", 36.9], ["music", 21.9], ["mains hum", 20.86]], [["music", 44.92], ["musical instrument", 6.49], ["hum", 4.61]], null, [["speech", 34.52], ["throbbing", 29.07], ["hum", 15.25]], [["music", 33.06], ["hum", 18.28], ["throbbing", 10.28]], null], "duration": [3.43, 1.11, 3.31, 0.95, 1.3, 6.95, 11.53, 1.46, 0.81, 3.23, 3.67, 8.88, 3.65, 0.72, 16.05, 6.62, 1.23]} \ No newline at end of file diff --git a/annotations_filtered/jz4VT9zHLTU_filtered.json b/annotations_filtered/jz4VT9zHLTU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7e837af219639edca178fff8a06802b12582a33 --- /dev/null +++ b/annotations_filtered/jz4VT9zHLTU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.81], [7.0, 8.92], [11.0, 11.84]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.81, 1.92, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/jzEhVsME8p4_filtered.json b/annotations_filtered/jzEhVsME8p4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fba31ee8aa209948376f64ed97eacc4003e2571a --- /dev/null +++ b/annotations_filtered/jzEhVsME8p4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.04], [8.0, 8.14], [11.0, 11.28], [13.0, 14.25], [19.0, 19.9], [25.0, 28.24], [34.0, 34.47], [35.0, 35.02], [36.0, 36.78], [38.0, 38.2], [42.0, 45.01], [46.0, 46.53], [48.0, 48.9], [50.0, 50.18], [51.0, 62.82], [63.0, 63.69], [64.0, 66.29], [68.0, 71.0], [73.0, 74.85], [76.0, 76.35], [79.0, 80.79], [85.0, 85.43], [93.0, 93.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 91.13, 0.0, 0.0, 0.0, 0.0, 46.57, 0.0, 0.0, 0.0, 40.77, 0.0, 41.16, 31.2, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 36.95], ["music", 25.64], ["synthesizer", 10.93]], null, null, null, [["music", 57.2], ["didgeridoo", 7.48], ["synthesizer", 7.29]], null, [["music", 43.87], ["speech", 29.49], ["throbbing", 10.06]], [["music", 65.26], ["timpani", 3.78], ["theremin", 3.37]], null, null, null, null, null], "duration": [1.04, 0.14, 0.28, 1.25, 0.9, 3.24, 0.47, 0.02, 0.78, 0.2, 3.01, 0.53, 0.9, 0.18, 11.82, 0.69, 2.29, 3.0, 1.85, 0.35, 1.79, 0.43, 0.36]} \ No newline at end of file diff --git a/annotations_filtered/jzhXtCHYrAM_filtered.json b/annotations_filtered/jzhXtCHYrAM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b624f04b1f0e96d700f49e85623e9ceb72f9c9f3 --- /dev/null +++ b/annotations_filtered/jzhXtCHYrAM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 16.98], [20.0, 22.06], [23.0, 26.76], [28.0, 37.61], [38.0, 38.69], [40.0, 48.05], [50.0, 50.62], [54.0, 54.36], [55.0, 56.03], [58.0, 59.44], [60.0, 61.25], [63.0, 62.73], [65.0, 66.09], [68.0, 67.71], [69.0, 68.82], [70.0, 70.68], [73.0, 73.01], [76.0, 77.41], [78.0, 80.77], [92.0, 94.32], [96.0, 97.23], [100.0, 108.26], [111.0, 113.83], [119.0, 121.05], [130.0, 130.64], [145.0, 148.71], [153.0, 154.3], [156.0, 159.41], [164.0, 166.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [93.45, 90.25, 95.23, 92.31, 0.0, 92.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 89.19, 0.0, 99.92, 81.89, 95.51, 0.0, 99.76, 0.0, 96.54, 39.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 36.19], ["moo", 34.27], ["livestock, farm animals, working animals", 24.83]]], "duration": [5.98, 2.06, 3.76, 9.61, 0.69, 8.05, 0.62, 0.36, 1.03, 1.44, 1.25, -0.27, 1.09, -0.29, -0.18, 0.68, 0.01, 1.41, 2.77, 2.32, 1.23, 8.26, 2.83, 2.05, 0.64, 3.71, 1.3, 3.41, 2.82]} \ No newline at end of file diff --git a/annotations_filtered/jzxMo2UKUKM_filtered.json b/annotations_filtered/jzxMo2UKUKM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef9cee8507871329c8e2e4985401d3109005672 --- /dev/null +++ b/annotations_filtered/jzxMo2UKUKM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 81.57], [83.0, 83.61], [88.0, 90.0], [92.0, 117.12], [123.0, 126.22], [133.0, 136.22], [141.0, 143.65], [144.0, 146.13], [148.0, 149.07]], "keep_status": [false, false, true, true, true, false, true, true, false], "silence_prob": [0.0, 0.0, 29.79, 28.87, 28.99, 31.08, 30.92, 32.06, 0.0], "audiomae_on_audioset": [null, null, [["music", 24.07], ["speech", 21.76], ["mains hum", 10.93]], [["music", 29.78], ["hum", 17.72], ["mains hum", 14.57]], [["sound effect", 13.48], ["explosion", 11.14], ["cacophony", 10.47]], [["music", 47.0], ["hum", 13.44], ["throbbing", 10.68]], [["music", 35.33], ["hum", 14.81], ["throbbing", 13.01]], [["noise", 26.38], ["hum", 16.36], ["music", 11.65]], null], "duration": [72.57, 0.61, 2.0, 25.12, 3.22, 3.22, 2.65, 2.13, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/k-RHqxyYzMo_filtered.json b/annotations_filtered/k-RHqxyYzMo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8455a92819428ecf831da1cef5d8b86798589a7 --- /dev/null +++ b/annotations_filtered/k-RHqxyYzMo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 35.11], [40.0, 125.96]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [30.11, 85.96]} \ No newline at end of file diff --git a/annotations_filtered/k-Rg51azVlg_filtered.json b/annotations_filtered/k-Rg51azVlg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6751aa85269a38f309e3df6e4ba9a68971583743 --- /dev/null +++ b/annotations_filtered/k-Rg51azVlg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.39], [13.0, 14.98], [18.0, 17.95], [20.0, 23.94], [26.0, 38.43], [40.0, 49.99], [53.0, 56.89], [59.0, 58.78], [61.0, 68.82], [69.0, 70.29], [71.0, 71.64], [72.0, 75.57], [76.0, 79.51], [80.0, 80.67], [82.0, 85.5], [86.0, 86.91], [91.0, 99.01], [101.0, 101.19], [102.0, 103.49], [107.0, 108.06]], "keep_status": [false, false, false, true, true, true, true, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.13, 30.25, 32.24, 29.85, 0.0, 33.41, 0.0, 0.0, 87.92, 99.52, 0.0, 33.38, 0.0, 35.47, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 33.2], ["cacophony", 31.3], ["noise", 3.42]], [["hum", 20.05], ["mains hum", 11.04], ["music", 10.48]], [["speech", 25.82], ["music", 16.57], ["mains hum", 14.09]], [["whale vocalization", 21.25], ["vehicle", 14.6], ["car", 9.57]], null, [["music", 69.32], ["sound effect", 5.76], ["breaking", 3.13]], null, null, null, null, null, [["speech", 31.61], ["cheering", 17.58], ["crowd", 14.4]], null, [["sidetone", 53.52], ["speech", 39.06], ["music", 2.65]], null, null, null], "duration": [0.39, 1.98, -0.05, 3.94, 12.43, 9.99, 3.89, -0.22, 7.82, 1.29, 0.64, 3.57, 3.51, 0.67, 3.5, 0.91, 8.01, 0.19, 1.49, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/k-WW7ULn8RA_filtered.json b/annotations_filtered/k-WW7ULn8RA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11bd1876e27879cce2c4bb2114b21c07e524a420 --- /dev/null +++ b/annotations_filtered/k-WW7ULn8RA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 49.15], [56.0, 60.32], [62.0, 64.94], [67.0, 68.79], [72.0, 74.06], [78.0, 80.76], [83.0, 92.35], [94.0, 94.36], [97.0, 98.04], [100.0, 100.08], [109.0, 109.86]], "keep_status": [false, true, true, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 38.43, 36.43, 0.0, 52.86, 45.85, 49.5, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 40.92], ["music", 23.61], ["hum", 4.72]], [["music", 26.13], ["speech", 25.06], ["sidetone", 15.8]], null, null, [["music", 22.31], ["hum", 17.34], ["mains hum", 17.07]], [["music", 46.77], ["fly, housefly", 13.78], ["insect", 5.92]], null, null, null, null], "duration": [0.15, 4.32, 2.94, 1.79, 2.06, 2.76, 9.35, 0.36, 1.04, 0.08, 0.86]} \ No newline at end of file diff --git a/annotations_filtered/k-WrZcFJo2k_filtered.json b/annotations_filtered/k-WrZcFJo2k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..483993a8d7a899a31efa1cd5f3a151c30fdfa474 --- /dev/null +++ b/annotations_filtered/k-WrZcFJo2k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 32.56], [35.0, 35.01], [39.0, 39.85], [46.0, 46.82], [47.0, 48.47], [55.0, 56.59], [60.0, 65.1], [68.0, 70.04], [70.0, 72.39], [79.0, 78.87], [82.0, 87.39], [93.0, 95.1], [96.0, 96.97], [105.0, 105.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.76, 92.97, 59.15, 0.0, 60.42, 81.71, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.56, 0.01, 0.85, 0.82, 1.47, 1.59, 5.1, 2.04, 2.39, -0.13, 5.39, 2.1, 0.97, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/k-m4QOtv-rQ_filtered.json b/annotations_filtered/k-m4QOtv-rQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06b0803b15e75b116b8ed673a1f7fbdcaa1226b4 --- /dev/null +++ b/annotations_filtered/k-m4QOtv-rQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 15.09], [23.0, 23.58], [24.0, 24.9], [25.0, 27.16], [28.0, 28.02], [38.0, 38.01], [69.0, 68.72], [86.0, 89.31], [89.0, 89.45], [103.0, 105.24], [111.0, 111.52], [118.0, 118.37], [121.0, 120.99], [127.0, 128.19], [129.0, 130.0], [132.0, 132.46], [137.0, 138.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [63.1, 0.0, 0.0, 86.09, 0.0, 0.0, 0.0, 38.16, 0.0, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["cattle, bovinae", 38.8], ["livestock, farm animals, working animals", 33.96], ["moo", 22.16]], null, null, null, null, null, null, null, null, null], "duration": [4.09, 0.58, 0.9, 2.16, 0.02, 0.01, -0.28, 3.31, 0.45, 2.24, 0.52, 0.37, -0.01, 1.19, 1.0, 0.46, 1.5]} \ No newline at end of file diff --git a/annotations_filtered/k-mbJhVl2Xc_filtered.json b/annotations_filtered/k-mbJhVl2Xc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d316b9ba2e93620945840cd23c1f13be22dbf43 --- /dev/null +++ b/annotations_filtered/k-mbJhVl2Xc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 36.1], [37.0, 39.38], [45.0, 59.8], [60.0, 61.3], [62.0, 63.39], [64.0, 68.74], [69.0, 71.12], [72.0, 73.62], [74.0, 74.56], [82.0, 82.78], [93.0, 94.93]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [31.95, 32.52, 34.92, 0.0, 0.0, 39.38, 37.83, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 68.55], ["drum machine", 6.12], ["boing", 5.58]], [["music", 68.49], ["synthesizer", 10.25], ["drum machine", 7.67]], [["music", 57.75], ["synthesizer", 10.45], ["speech", 5.28]], null, null, [["music", 33.58], ["speech", 16.07], ["mosquito", 5.22]], [["moo", 41.11], ["cattle, bovinae", 39.75], ["livestock, farm animals, working animals", 16.02]], null, null, null, null], "duration": [26.1, 2.38, 14.8, 1.3, 1.39, 4.74, 2.12, 1.62, 0.56, 0.78, 1.93]} \ No newline at end of file diff --git a/annotations_filtered/k-oVuQpjG3s_filtered.json b/annotations_filtered/k-oVuQpjG3s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..510e3fc233b846b5e243805d981a9bc2681ade26 --- /dev/null +++ b/annotations_filtered/k-oVuQpjG3s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[74.0, 79.08], [81.0, 81.19]], "keep_status": [false, false], "silence_prob": [96.54, 0.0], "audiomae_on_audioset": [null, null], "duration": [5.08, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/k01VcZkKDME_filtered.json b/annotations_filtered/k01VcZkKDME_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de91ae67ce46e87a181ff7d3bde49dfec26b11c0 --- /dev/null +++ b/annotations_filtered/k01VcZkKDME_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.14], [10.0, 10.4], [12.0, 12.63], [16.0, 17.36], [20.0, 20.34], [23.0, 23.87], [24.0, 26.22], [28.0, 28.14], [33.0, 37.86], [40.0, 42.84], [45.0, 45.55], [46.0, 46.85], [48.0, 48.41], [49.0, 49.89], [53.0, 53.42], [56.0, 55.9], [56.0, 56.54], [61.0, 61.69], [63.0, 63.81], [65.0, 66.36], [69.0, 69.5], [71.0, 71.71], [74.0, 74.85], [78.0, 78.8], [91.0, 91.18], [93.0, 93.39], [98.0, 99.81], [106.0, 106.44]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.39, 0.0, 99.99, 61.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 47.18], ["animal", 4.89], ["livestock, farm animals, working animals", 4.07]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.14, 0.4, 0.63, 1.36, 0.34, 0.87, 2.22, 0.14, 4.86, 2.84, 0.55, 0.85, 0.41, 0.89, 0.42, -0.1, 0.54, 0.69, 0.81, 1.36, 0.5, 0.71, 0.85, 0.8, 0.18, 0.39, 1.81, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/k0LLcRLSSlE_filtered.json b/annotations_filtered/k0LLcRLSSlE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8044e47670aefdb9bbd54328c490444264d3047e --- /dev/null +++ b/annotations_filtered/k0LLcRLSSlE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.92], [4.0, 5.31], [6.0, 6.91], [20.0, 20.39], [24.0, 25.88], [29.0, 30.32], [32.0, 32.85], [44.0, 45.91], [49.0, 51.88], [65.0, 66.18], [69.0, 70.41], [71.0, 81.67], [92.0, 92.69], [97.0, 97.93], [100.0, 102.57], [108.0, 117.22], [120.0, 121.34], [124.0, 126.2], [126.0, 129.34], [130.0, 133.66], [135.0, 154.63], [160.0, 161.89], [167.0, 181.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 100.0, 100.0, 100.0, 30.38, 0.0, 31.2], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["insect", 27.52], ["speech", 14.97], ["cricket", 11.27]], null, [["music", 69.83], ["speech", 11.43], ["didgeridoo", 7.3]]], "duration": [0.92, 1.31, 0.91, 0.39, 1.88, 1.32, 0.85, 1.91, 2.88, 1.18, 1.41, 10.67, 0.69, 0.93, 2.57, 9.22, 1.34, 2.2, 3.34, 3.66, 19.63, 1.89, 14.14]} \ No newline at end of file diff --git a/annotations_filtered/k0XGlpR6iLc_filtered.json b/annotations_filtered/k0XGlpR6iLc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ef3ef9dee001122e7ba2a2010f9ded76bf3841d --- /dev/null +++ b/annotations_filtered/k0XGlpR6iLc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.01], [6.0, 6.76], [11.0, 38.72], [43.0, 43.38], [44.0, 45.74], [48.0, 48.24], [49.0, 49.55], [51.0, 52.07], [54.0, 84.01], [85.0, 85.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.01, 0.76, 27.72, 0.38, 1.74, 0.24, 0.55, 1.07, 30.01, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/k0aqHfvHcsc_filtered.json b/annotations_filtered/k0aqHfvHcsc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..663c92bbef7359fe58cb48c8755ddce0c0fee19d --- /dev/null +++ b/annotations_filtered/k0aqHfvHcsc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.36], [10.0, 10.32], [11.0, 23.82], [25.0, 25.39], [26.0, 40.58], [48.0, 49.94], [53.0, 60.02], [61.0, 61.53], [62.0, 63.0], [67.0, 67.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 75.39, 0.0, 59.68, 0.0, 50.02, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.36, 0.32, 12.82, 0.39, 14.58, 1.94, 7.02, 0.53, 1.0, 0.9]} \ No newline at end of file diff --git a/annotations_filtered/k10DDJ4L2lc_filtered.json b/annotations_filtered/k10DDJ4L2lc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c789e39e0fb9411ada46dc82a2907c4206bc555b --- /dev/null +++ b/annotations_filtered/k10DDJ4L2lc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.35], [10.0, 10.86], [11.0, 13.31], [14.0, 15.7], [17.0, 30.87], [31.0, 32.71], [36.0, 42.67], [43.0, 45.72], [46.0, 47.78], [49.0, 51.07], [53.0, 57.55], [61.0, 65.06], [65.0, 67.0], [68.0, 70.43], [71.0, 73.13], [76.0, 77.21], [78.0, 79.2], [80.0, 148.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 98.01, 0.0, 99.9, 0.0, 100.0, 100.0, 0.0, 99.65, 100.0, 89.54, 90.6, 97.83, 99.65, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.35, 0.86, 2.31, 1.7, 13.87, 1.71, 6.67, 2.72, 1.78, 2.07, 4.55, 4.06, 2.0, 2.43, 2.13, 1.21, 1.2, 68.51]} \ No newline at end of file diff --git a/annotations_filtered/k1MdKI8kiXU_filtered.json b/annotations_filtered/k1MdKI8kiXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e8431200400f95fe9e05316b7ef8e51672420a9 --- /dev/null +++ b/annotations_filtered/k1MdKI8kiXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.11], [8.0, 10.69], [13.0, 19.41], [22.0, 30.82], [32.0, 101.22], [110.0, 110.08], [122.0, 123.08], [124.0, 125.05], [127.0, 128.26], [131.0, 131.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 87.19, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [1.11, 2.69, 6.41, 8.82, 69.22, 0.08, 1.08, 1.05, 1.26, 0.35]} \ No newline at end of file diff --git a/annotations_filtered/k1WKpdhcJSo_filtered.json b/annotations_filtered/k1WKpdhcJSo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e027c487d167d95bb60d8f50249ac9c46dad35b1 --- /dev/null +++ b/annotations_filtered/k1WKpdhcJSo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.69], [15.0, 17.63], [19.0, 19.35], [22.0, 26.69], [29.0, 31.08], [32.0, 36.32], [37.0, 38.52], [52.0, 68.55], [72.0, 74.68], [75.0, 77.97], [79.0, 80.76], [88.0, 87.83], [89.0, 91.37], [92.0, 97.04], [98.0, 99.66], [101.0, 102.05], [108.0, 111.05], [112.0, 115.37]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [93.13, 84.8, 0.0, 66.88, 75.23, 41.85, 0.0, 43.25, 97.92, 91.64, 0.0, 0.0, 68.02, 42.37, 0.0, 0.0, 98.8, 99.31], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 31.71], ["snicker", 13.95], ["giggle", 9.5]], null, [["speech", 55.77], ["frog", 5.23], ["buzz", 4.16]], null, null, null, null, null, [["speech", 61.6], ["busy signal", 5.83], ["chirp tone", 3.43]], null, null, null, null], "duration": [3.69, 2.63, 0.35, 4.69, 2.08, 4.32, 1.52, 16.55, 2.68, 2.97, 1.76, -0.17, 2.37, 5.04, 1.66, 1.05, 3.05, 3.37]} \ No newline at end of file diff --git a/annotations_filtered/k1Xv18Vy-q0_filtered.json b/annotations_filtered/k1Xv18Vy-q0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d94d49fb3b9e38105ccd70ff361f36736312ba5 --- /dev/null +++ b/annotations_filtered/k1Xv18Vy-q0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.57], [8.0, 8.82], [10.0, 11.13], [14.0, 14.84], [16.0, 16.63], [17.0, 21.49], [23.0, 24.75], [28.0, 28.81], [30.0, 31.75], [33.0, 35.01], [36.0, 37.69], [41.0, 48.83], [50.0, 54.5], [57.0, 57.96], [59.0, 58.73], [59.0, 59.54], [60.0, 61.33], [62.0, 63.81], [66.0, 69.84], [71.0, 72.33], [73.0, 74.16], [76.0, 78.22], [79.0, 80.22], [82.0, 86.44], [87.0, 93.75], [97.0, 99.3], [100.0, 103.77], [105.0, 105.95], [107.0, 107.99], [111.0, 111.28], [114.0, 114.49], [119.0, 124.24], [125.0, 128.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 39.4, 0.0, 0.0, 0.0, 64.97, 0.0, 59.51, 67.51, 0.0, 0.0, 0.0, 0.0, 0.0, 78.89, 0.0, 0.0, 84.8, 0.0, 94.66, 91.98, 96.54, 44.46, 0.0, 0.0, 0.0, 0.0, 71.72, 49.09], "audiomae_on_audioset": [null, null, null, null, null, [["sidetone", 77.68], ["speech", 6.42], ["radio", 6.27]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 31.84], ["music", 20.42], ["hum", 13.98]], null, null, null, null, null, [["music", 35.68], ["hum", 14.61], ["mains hum", 9.91]]], "duration": [1.57, 0.82, 1.13, 0.84, 0.63, 4.49, 1.75, 0.81, 1.75, 2.01, 1.69, 7.83, 4.5, 0.96, -0.27, 0.54, 1.33, 1.81, 3.84, 1.33, 1.16, 2.22, 1.22, 4.44, 6.75, 2.3, 3.77, 0.95, 0.99, 0.28, 0.49, 5.24, 3.43]} \ No newline at end of file diff --git a/annotations_filtered/k1_OK7cug8I_filtered.json b/annotations_filtered/k1_OK7cug8I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..acd04b84af02b0cff7cd34dd99731b3d9428454a --- /dev/null +++ b/annotations_filtered/k1_OK7cug8I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.77], [5.0, 5.93], [9.0, 10.25], [17.0, 16.82], [19.0, 19.63], [20.0, 20.43], [21.0, 22.0], [28.0, 28.41], [30.0, 31.68], [41.0, 42.52], [47.0, 48.57], [58.0, 60.76], [62.0, 62.29], [64.0, 63.73], [67.0, 67.07], [68.0, 69.04], [70.0, 71.74], [73.0, 74.02], [75.0, 75.83], [80.0, 80.1], [81.0, 81.55], [92.0, 92.65], [94.0, 94.69], [98.0, 98.14], [104.0, 104.92], [107.0, 109.27], [112.0, 116.33], [117.0, 118.15], [128.0, 129.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.9, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.77, 0.93, 1.25, -0.18, 0.63, 0.43, 1.0, 0.41, 1.68, 1.52, 1.57, 2.76, 0.29, -0.27, 0.07, 1.04, 1.74, 1.02, 0.83, 0.1, 0.55, 0.65, 0.69, 0.14, 0.92, 2.27, 4.33, 1.15, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/k1fiQFCN2Zs_filtered.json b/annotations_filtered/k1fiQFCN2Zs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9e7fa7af6c6d5f0ba38c791e461b75046ac8aaf --- /dev/null +++ b/annotations_filtered/k1fiQFCN2Zs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.45], [13.0, 20.17], [26.0, 33.02], [38.0, 45.6], [46.0, 80.25], [81.0, 82.44], [84.0, 85.26], [88.0, 95.77], [98.0, 103.67], [111.0, 117.19], [119.0, 138.25], [138.0, 142.26], [143.0, 143.95], [145.0, 151.01], [152.0, 175.34], [178.0, 178.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.05, 29.72, 29.93, 0.0, 0.0, 0.0, 29.9, 29.89, 29.52, 29.45, 29.58, 0.0, 29.47, 29.57, 0.0], "audiomae_on_audioset": [null, [["music", 76.77], ["didgeridoo", 3.38], ["boing", 2.29]], [["music", 81.46], ["drum machine", 3.02], ["synthesizer", 1.37]], [["music", 72.65], ["musical instrument", 4.76], ["drum", 3.0]], null, null, null, [["music", 80.12], ["musical instrument", 4.01], ["quack", 2.82]], [["music", 73.62], ["musical instrument", 2.53], ["traditional music", 1.27]], [["music", 82.69], ["musical instrument", 2.91], ["guitar", 1.69]], [["music", 80.62], ["musical instrument", 3.84], ["music of latin america", 2.33]], [["music", 66.28], ["salsa music", 2.93], ["reggae", 2.6]], null, [["music", 78.99], ["didgeridoo", 6.15], ["musical instrument", 5.83]], [["music", 77.82], ["quack", 4.98], ["musical instrument", 3.47]], null], "duration": [0.45, 7.17, 7.02, 7.6, 34.25, 1.44, 1.26, 7.77, 5.67, 6.19, 19.25, 4.26, 0.95, 6.01, 23.34, 0.9]} \ No newline at end of file diff --git a/annotations_filtered/k1pv94Y0fbw_filtered.json b/annotations_filtered/k1pv94Y0fbw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36131fe680879c0721d0cee72967aece5fcf38ad --- /dev/null +++ b/annotations_filtered/k1pv94Y0fbw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.29], [13.0, 14.45], [17.0, 17.71], [19.0, 20.9], [24.0, 24.22], [24.0, 24.27], [27.0, 27.55], [31.0, 32.66], [35.0, 43.28]], "keep_status": [true, false, false, false, false, false, false, false, true], "silence_prob": [41.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.14], "audiomae_on_audioset": [[["speech", 26.07], ["whale vocalization", 9.37], ["music", 9.17]], null, null, null, null, null, null, null, [["speech", 35.24], ["breaking", 16.56], ["music", 9.92]]], "duration": [2.29, 1.45, 0.71, 1.9, 0.22, 0.27, 0.55, 1.66, 8.28]} \ No newline at end of file diff --git a/annotations_filtered/k1z5PejkIyY_filtered.json b/annotations_filtered/k1z5PejkIyY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9bc327161d13bf4d2d270f9a7381d38687e79c5 --- /dev/null +++ b/annotations_filtered/k1z5PejkIyY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.21], [2.0, 5.41], [6.0, 6.47], [7.0, 9.95], [10.0, 10.96], [20.0, 20.9], [24.0, 24.97], [28.0, 28.12], [39.0, 39.29], [40.0, 40.68], [42.0, 42.36], [43.0, 43.97], [47.0, 47.53], [49.0, 48.98], [58.0, 65.77], [66.0, 66.93], [69.0, 69.2], [74.0, 76.28], [92.0, 93.8], [94.0, 95.72], [97.0, 97.48], [105.0, 106.95], [116.0, 115.62], [117.0, 118.69], [123.0, 123.72], [124.0, 124.85], [125.0, 125.74], [129.0, 135.16], [137.0, 137.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.57, 0.0, 33.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.16, 0.0, 0.0, 36.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.06, 0.0], "audiomae_on_audioset": [null, [["speech", 62.27], ["sidetone", 8.45], ["radio", 5.22]], null, [["moo", 36.75], ["cattle, bovinae", 33.34], ["livestock, farm animals, working animals", 14.56]], null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 19.46], ["insect", 15.94], ["hum", 9.08]], null, null, [["fly, housefly", 25.76], ["insect", 16.18], ["frog", 6.03]], null, null, null, null, null, null, null, null, null, [["music", 59.54], ["speech", 7.14], ["didgeridoo", 5.82]], null], "duration": [0.21, 3.41, 0.47, 2.95, 0.96, 0.9, 0.97, 0.12, 0.29, 0.68, 0.36, 0.97, 0.53, -0.02, 7.77, 0.93, 0.2, 2.28, 1.8, 1.72, 0.48, 1.95, -0.38, 1.69, 0.72, 0.85, 0.74, 6.16, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/k2-SBnbz7pE_filtered.json b/annotations_filtered/k2-SBnbz7pE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8bbf237f65e698f2e66944de2ccba85d6b2f198 --- /dev/null +++ b/annotations_filtered/k2-SBnbz7pE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[66.0, 67.07], [68.0, 75.88], [79.0, 80.25], [83.0, 84.11], [87.0, 89.4], [90.0, 90.56], [91.0, 94.39], [95.0, 95.3], [96.0, 96.5], [97.0, 96.99], [99.0, 100.09], [102.0, 103.49], [108.0, 117.44], [120.0, 145.98], [151.0, 155.63], [156.0, 161.08], [162.0, 162.95], [164.0, 164.3], [165.0, 166.16]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false], "silence_prob": [0.0, 33.59, 0.0, 0.0, 50.71, 0.0, 33.04, 0.0, 0.0, 0.0, 0.0, 0.0, 44.34, 31.89, 37.09, 38.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["buzz", 20.19], ["insect", 12.99], ["hum", 11.88]], null, null, null, null, [["whale vocalization", 53.52], ["fly, housefly", 13.02], ["mosquito", 12.94]], null, null, null, null, null, [["whale vocalization", 53.7], ["rumble", 11.36], ["fart", 4.93]], [["music", 36.14], ["speech", 33.88], ["throbbing", 3.18]], [["speech", 25.45], ["music", 21.06], ["whale vocalization", 14.33]], [["hum", 24.02], ["music", 16.4], ["mains hum", 12.89]], null, null, null], "duration": [1.07, 7.88, 1.25, 1.11, 2.4, 0.56, 3.39, 0.3, 0.5, -0.01, 1.09, 1.49, 9.44, 25.98, 4.63, 5.08, 0.95, 0.3, 1.16]} \ No newline at end of file diff --git a/annotations_filtered/k2C9QOtoreY_filtered.json b/annotations_filtered/k2C9QOtoreY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..233e251bdc44f5340696ef6baad62b423620ef39 --- /dev/null +++ b/annotations_filtered/k2C9QOtoreY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.9], [8.0, 11.18], [13.0, 13.24], [15.0, 15.5], [16.0, 17.22], [23.0, 23.65], [26.0, 26.43], [26.0, 29.2], [31.0, 51.92], [59.0, 86.76], [92.0, 107.6]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 37.69, 0.0, 0.0, 0.0, 0.0, 0.0, 34.85, 31.54, 30.18, 30.92], "audiomae_on_audioset": [null, [["speech", 39.74], ["music", 13.92], ["whistling", 9.77]], null, null, null, null, null, [["music", 48.23], ["speech", 8.28], ["hum", 6.43]], [["speech", 55.8], ["music", 16.89], ["effects unit", 2.02]], [["music", 45.13], ["speech", 39.47], ["outside, urban or manmade", 1.31]], [["livestock, farm animals, working animals", 45.85], ["moo", 21.05], ["cattle, bovinae", 19.59]]], "duration": [-0.1, 3.18, 0.24, 0.5, 1.22, 0.65, 0.43, 3.2, 20.92, 27.76, 15.6]} \ No newline at end of file diff --git a/annotations_filtered/k2NaHBVVYzY_filtered.json b/annotations_filtered/k2NaHBVVYzY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..325c0ea63bd5bea560db4eb8c35eca208b3d03d7 --- /dev/null +++ b/annotations_filtered/k2NaHBVVYzY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.54], [10.0, 11.5], [15.0, 22.08], [27.0, 27.55], [29.0, 29.15], [31.0, 31.62], [37.0, 37.69], [40.0, 41.57], [43.0, 45.32], [48.0, 49.4], [50.0, 51.73], [58.0, 58.29], [59.0, 59.56], [60.0, 61.25], [63.0, 63.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.91, 0.0, 0.0, 0.0, 0.0, 0.0, 32.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 39.29], ["mains hum", 21.71], ["throbbing", 9.68]], null, null, null, null, null, [["speech", 71.43], ["field recording", 4.48], ["didgeridoo", 2.59]], null, null, null, null, null, null], "duration": [1.54, 1.5, 7.08, 0.55, 0.15, 0.62, 0.69, 1.57, 2.32, 1.4, 1.73, 0.29, 0.56, 1.25, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/k2PsfXZ3wyY_filtered.json b/annotations_filtered/k2PsfXZ3wyY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f5e2d38ade0a43100271ace86c10d4d9c342c9f --- /dev/null +++ b/annotations_filtered/k2PsfXZ3wyY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.4], [9.0, 9.78], [13.0, 13.19]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [1.4, 0.78, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/k2QekuUhgIM_filtered.json b/annotations_filtered/k2QekuUhgIM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92a2bb51941aa5a9d896203e1660c5caa73801aa --- /dev/null +++ b/annotations_filtered/k2QekuUhgIM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 37.0], [37.0, 39.39], [40.0, 44.74], [45.0, 47.06], [48.0, 49.33], [52.0, 102.2], [103.0, 122.96]], "keep_status": [false, false, false, true, false, false, false], "silence_prob": [0.0, 67.76, 47.5, 34.2, 0.0, 0.0, 34.94], "audiomae_on_audioset": [null, null, [["music", 77.97], ["synthesizer", 5.07], ["electronic music", 3.94]], [["speech", 37.34], ["hum", 7.2], ["synthesizer", 5.47]], null, null, [["throbbing", 39.58], ["hum", 39.52], ["mains hum", 7.54]]], "duration": [35.0, 2.39, 4.74, 2.06, 1.33, 50.2, 19.96]} \ No newline at end of file diff --git a/annotations_filtered/k2s7U_7gHtE_filtered.json b/annotations_filtered/k2s7U_7gHtE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb4fc3339b6a8dd415ce92e4ed058c51173e61d1 --- /dev/null +++ b/annotations_filtered/k2s7U_7gHtE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.03], [3.0, 4.26], [16.0, 17.36], [19.0, 20.29], [22.0, 23.7], [26.0, 28.32], [31.0, 33.84], [35.0, 36.27], [38.0, 38.43], [42.0, 45.72], [47.0, 51.95], [53.0, 60.78], [62.0, 66.02], [69.0, 71.47], [76.0, 76.5], [78.0, 80.18], [82.0, 91.66], [93.0, 95.98], [99.0, 101.21], [105.0, 109.09], [109.0, 110.24], [114.0, 116.75], [117.0, 118.67], [123.0, 123.74], [125.0, 126.08], [140.0, 140.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 83.7, 0.0, 0.0, 97.92, 91.3, 100.0, 63.64, 92.8, 0.0, 99.52, 89.9, 39.09, 88.28, 87.55, 0.0, 86.09, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 33.9], ["music", 20.99], ["hum", 8.65]], null, null, null, null, null, null, null, null], "duration": [0.03, 1.26, 1.36, 1.29, 1.7, 2.32, 2.84, 1.27, 0.43, 3.72, 4.95, 7.78, 4.02, 2.47, 0.5, 2.18, 9.66, 2.98, 2.21, 4.09, 1.24, 2.75, 1.67, 0.74, 1.08, 0.98]} \ No newline at end of file diff --git a/annotations_filtered/k3KR3Wz29FY_filtered.json b/annotations_filtered/k3KR3Wz29FY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4cdb63c563651a9f82a7bd8bdbafaf0d9893181 --- /dev/null +++ b/annotations_filtered/k3KR3Wz29FY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.87], [13.0, 17.71], [18.0, 20.24], [31.0, 31.7], [37.0, 39.02], [42.0, 42.72], [45.0, 56.94], [60.0, 63.24], [82.0, 82.39], [83.0, 89.26], [91.0, 94.54], [99.0, 106.49], [107.0, 107.81], [111.0, 112.14], [116.0, 126.25], [136.0, 136.78], [160.0, 160.61]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 29.81, 43.79, 0.0, 32.76, 0.0, 29.09, 32.23, 0.0, 29.61, 35.77, 33.55, 0.0, 0.0, 31.54, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 36.5], ["speech", 14.71], ["mains hum", 12.98]], [["music", 55.59], ["throbbing", 9.09], ["speech", 4.47]], null, [["music", 52.25], ["throbbing", 15.33], ["hum", 3.77]], null, [["music", 66.17], ["hum", 6.33], ["throbbing", 5.33]], [["music", 38.87], ["throbbing", 28.43], ["hum", 16.44]], null, [["music", 47.81], ["speech", 37.15], ["musical instrument", 4.34]], [["music", 36.32], ["throbbing", 27.86], ["hum", 11.27]], [["music", 50.35], ["throbbing", 17.23], ["hum", 5.48]], null, null, [["music", 45.81], ["throbbing", 27.47], ["hum", 13.13]], null, null], "duration": [0.87, 4.71, 2.24, 0.7, 2.02, 0.72, 11.94, 3.24, 0.39, 6.26, 3.54, 7.49, 0.81, 1.14, 10.25, 0.78, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/k3TpBfnaEmI_filtered.json b/annotations_filtered/k3TpBfnaEmI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73c356494ef58cb33412fe54a1e40f5a271766e3 --- /dev/null +++ b/annotations_filtered/k3TpBfnaEmI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.8], [11.0, 12.06], [13.0, 18.74], [19.0, 29.03], [30.0, 49.28], [50.0, 54.11], [55.0, 59.7], [61.0, 61.62], [63.0, 69.06], [70.0, 70.78], [72.0, 74.73], [77.0, 77.68], [80.0, 81.24], [83.0, 83.17], [85.0, 86.85], [89.0, 89.68], [91.0, 93.97], [100.0, 101.82], [106.0, 109.54], [111.0, 111.32], [112.0, 115.77], [117.0, 125.95], [129.0, 129.76], [132.0, 135.58], [140.0, 142.92], [144.0, 146.37], [147.0, 148.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 84.25, 56.7, 100.0, 99.98, 65.55, 0.0, 99.99, 0.0, 82.07, 0.0, 0.0, 0.0, 0.0, 0.0, 48.27, 0.0, 100.0, 0.0, 100.0, 100.0, 0.0, 100.0, 92.31, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 56.89], ["chirp tone", 19.06], ["sidetone", 6.72]], null, null, null, null, null, null, null, null, null, null], "duration": [1.8, 1.06, 5.74, 10.03, 19.28, 4.11, 4.7, 0.62, 6.06, 0.78, 2.73, 0.68, 1.24, 0.17, 1.85, 0.68, 2.97, 1.82, 3.54, 0.32, 3.77, 8.95, 0.76, 3.58, 2.92, 2.37, 1.93]} \ No newline at end of file diff --git a/annotations_filtered/k3oMPqUTxCE_filtered.json b/annotations_filtered/k3oMPqUTxCE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..987bd871d70a827e4f0f5b76c14061c5abd00baa --- /dev/null +++ b/annotations_filtered/k3oMPqUTxCE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.29], [10.0, 14.22], [16.0, 17.93], [28.0, 28.68], [35.0, 35.23], [44.0, 45.72], [46.0, 47.28], [48.0, 48.49], [59.0, 59.22], [67.0, 67.19], [68.0, 69.8], [81.0, 81.99], [83.0, 86.29], [98.0, 98.79], [102.0, 102.36], [104.0, 105.75], [107.0, 109.38], [112.0, 112.35], [121.0, 132.81], [141.0, 150.53], [152.0, 152.25], [153.0, 154.23], [154.0, 154.97], [156.0, 155.98], [156.0, 156.91], [159.0, 159.46]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 44.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.84, 0.0, 0.0, 0.0, 37.3, 0.0, 31.52, 32.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 45.11], ["musical instrument", 10.42], ["guitar", 9.65]], null, null, null, null, null, null, null, null, null, null, [["music", 47.74], ["didgeridoo", 24.14], ["speech", 11.07]], null, null, null, [["music", 45.14], ["speech", 20.32], ["guitar", 6.82]], null, [["moo", 41.81], ["cattle, bovinae", 37.03], ["livestock, farm animals, working animals", 14.26]], [["speech", 14.1], ["moo", 12.65], ["cattle, bovinae", 11.16]], null, null, null, null, null, null], "duration": [1.29, 4.22, 1.93, 0.68, 0.23, 1.72, 1.28, 0.49, 0.22, 0.19, 1.8, 0.99, 3.29, 0.79, 0.36, 1.75, 2.38, 0.35, 11.81, 9.53, 0.25, 1.23, 0.97, -0.02, 0.91, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/k3yUlJtCkJg_filtered.json b/annotations_filtered/k3yUlJtCkJg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7de6e36e294ecda9a7cf1e7466204ff51f51d730 --- /dev/null +++ b/annotations_filtered/k3yUlJtCkJg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 107.6]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [60.6]} \ No newline at end of file diff --git a/annotations_filtered/k4-CQXg0Z88_filtered.json b/annotations_filtered/k4-CQXg0Z88_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e3c9e9c2ce2bc59c3fe24aee0e74d51b66f3032 --- /dev/null +++ b/annotations_filtered/k4-CQXg0Z88_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.55], [1.0, 13.66], [14.0, 14.3], [15.0, 22.98], [25.0, 26.47], [31.0, 34.2], [36.0, 37.4], [40.0, 47.97], [54.0, 54.19], [59.0, 61.26], [65.0, 65.26], [67.0, 68.1], [70.0, 73.36], [74.0, 75.41], [78.0, 78.04], [78.0, 89.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 61.47, 0.0, 79.94, 0.0, 67.89, 0.0, 70.3, 0.0, 98.86, 0.0, 0.0, 96.04, 0.0, 0.0, 75.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.55, 12.66, 0.3, 7.98, 1.47, 3.2, 1.4, 7.97, 0.19, 2.26, 0.26, 1.1, 3.36, 1.41, 0.04, 11.87]} \ No newline at end of file diff --git a/annotations_filtered/k4X42D5Gg7o_filtered.json b/annotations_filtered/k4X42D5Gg7o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5166e50795adfdf881aa8ae37b05587ca94a4f92 --- /dev/null +++ b/annotations_filtered/k4X42D5Gg7o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.37], [7.0, 7.38], [12.0, 12.38], [12.0, 12.61], [13.0, 13.02], [13.0, 15.28], [22.0, 22.91], [25.0, 25.56], [29.0, 29.17], [38.0, 38.7], [41.0, 41.1], [46.0, 46.55], [47.0, 48.25], [50.0, 51.44], [55.0, 55.26], [61.0, 61.65], [63.0, 63.49], [66.0, 67.49], [69.0, 70.02], [76.0, 76.01], [88.0, 89.77], [101.0, 101.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 58.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.37, 0.38, 0.38, 0.61, 0.02, 2.28, 0.91, 0.56, 0.17, 0.7, 0.1, 0.55, 1.25, 1.44, 0.26, 0.65, 0.49, 1.49, 1.02, 0.01, 1.77, 0.29]} \ No newline at end of file diff --git a/annotations_filtered/k4YuBxpQwqA_filtered.json b/annotations_filtered/k4YuBxpQwqA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af7beeb4c80a2a88bcbbdbd54fef6d03ff64ea35 --- /dev/null +++ b/annotations_filtered/k4YuBxpQwqA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.02], [6.0, 6.74], [8.0, 12.73], [15.0, 18.93], [20.0, 23.04], [24.0, 28.0], [30.0, 31.23], [35.0, 35.8], [38.0, 39.68], [42.0, 43.95], [48.0, 52.35], [54.0, 57.28], [59.0, 61.38], [63.0, 65.91], [67.0, 69.85], [71.0, 73.36], [75.0, 76.77], [78.0, 79.84], [83.0, 83.81], [84.0, 83.86], [84.0, 83.93], [84.0, 84.0], [84.0, 85.89], [87.0, 87.39], [88.0, 91.93], [95.0, 96.75], [98.0, 100.57], [102.0, 112.16], [113.0, 116.14], [117.0, 120.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.96, 100.0, 99.99, 85.35, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 100.0, 100.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 100.0, 93.13, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.02, 0.74, 4.73, 3.93, 3.04, 4.0, 1.23, 0.8, 1.68, 1.95, 4.35, 3.28, 2.38, 2.91, 2.85, 2.36, 1.77, 1.84, 0.81, -0.14, -0.07, 0.0, 1.89, 0.39, 3.93, 1.75, 2.57, 10.16, 3.14, 3.14]} \ No newline at end of file diff --git a/annotations_filtered/k5bN73OnGmo_filtered.json b/annotations_filtered/k5bN73OnGmo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0de2bc67e9122145eb02605e209d41e4950de5be --- /dev/null +++ b/annotations_filtered/k5bN73OnGmo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.02], [14.0, 17.41], [18.0, 25.19], [27.0, 30.43], [31.0, 58.95], [60.0, 63.53]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 97.64, 100.0, 100.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.02, 3.41, 7.19, 3.43, 27.95, 3.53]} \ No newline at end of file diff --git a/annotations_filtered/k5fJmkv02is_filtered.json b/annotations_filtered/k5fJmkv02is_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef194f6d2dd80ef9c373063d01ed6c6c31f803ec --- /dev/null +++ b/annotations_filtered/k5fJmkv02is_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.63], [36.0, 36.27], [48.0, 48.66], [51.0, 53.59], [72.0, 71.66], [98.0, 100.16], [120.0, 123.74], [125.0, 128.9], [130.0, 130.49], [134.0, 134.64], [161.0, 160.73], [164.0, 165.05], [167.0, 167.98], [175.0, 177.77]], "keep_status": [false, false, false, true, false, true, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 43.74, 0.0, 45.36, 39.72, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.81], "audiomae_on_audioset": [null, null, null, [["music", 41.01], ["throbbing", 13.01], ["hum", 11.07]], null, [["music", 40.95], ["throbbing", 18.64], ["hum", 10.01]], [["music", 35.12], ["throbbing", 17.14], ["hum", 14.33]], null, null, null, null, null, null, [["music", 30.08], ["throbbing", 27.05], ["hum", 7.1]]], "duration": [0.63, 0.27, 0.66, 2.59, -0.34, 2.16, 3.74, 3.9, 0.49, 0.64, -0.27, 1.05, 0.98, 2.77]} \ No newline at end of file diff --git a/annotations_filtered/k67i1cISzsI_filtered.json b/annotations_filtered/k67i1cISzsI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba1569d9fa65ead4f6f9ca597e3f79c9badc9f94 --- /dev/null +++ b/annotations_filtered/k67i1cISzsI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.82], [6.0, 7.74], [8.0, 13.85], [15.0, 17.41], [19.0, 19.77], [21.0, 23.09], [23.0, 24.46], [27.0, 28.92], [32.0, 35.65], [38.0, 40.05], [41.0, 41.88], [43.0, 46.21], [47.0, 48.98], [52.0, 65.3], [67.0, 74.38], [77.0, 86.46], [88.0, 89.46], [90.0, 121.53], [124.0, 129.22], [130.0, 135.73], [137.0, 138.1], [139.0, 141.17], [142.0, 165.79], [167.0, 169.37], [170.0, 171.1], [172.0, 172.34], [173.0, 174.58], [175.0, 183.69], [184.0, 184.76], [185.0, 184.99], [185.0, 185.09]], "keep_status": [false, false, false, true, false, false, false, false, true, true, false, true, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [43.18, 0.0, 43.08, 43.56, 0.0, 38.36, 0.0, 0.0, 44.55, 45.62, 0.0, 43.82, 0.0, 38.9, 39.82, 38.71, 0.0, 0.0, 32.19, 35.29, 0.0, 54.83, 49.64, 34.46, 0.0, 0.0, 0.0, 50.97, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 54.85], ["throbbing", 11.82], ["bow-wow", 3.65]], null, [["hum", 35.8], ["music", 23.29], ["throbbing", 12.67]], [["music", 41.01], ["throbbing", 13.33], ["didgeridoo", 9.99]], null, [["music", 64.27], ["hum", 6.69], ["throbbing", 6.12]], null, null, [["music", 40.3], ["throbbing", 19.24], ["hum", 9.93]], [["music", 46.33], ["throbbing", 14.04], ["hum", 6.45]], null, [["music", 42.35], ["throbbing", 11.16], ["synthesizer", 10.68]], null, [["music", 44.4], ["throbbing", 14.44], ["hum", 11.94]], [["music", 45.76], ["didgeridoo", 13.93], ["throbbing", 13.54]], [["music", 68.88], ["didgeridoo", 14.59], ["throbbing", 2.93]], null, null, [["music", 33.76], ["didgeridoo", 23.33], ["hum", 11.7]], [["music", 34.2], ["didgeridoo", 11.76], ["hum", 10.98]], null, null, [["hum", 49.4], ["mains hum", 23.74], ["throbbing", 13.95]], [["speech", 54.17], ["fart", 22.87], ["inside, small room", 3.09]], null, null, null, null, null, null, null], "duration": [2.82, 1.74, 5.85, 2.41, 0.77, 2.09, 1.46, 1.92, 3.65, 2.05, 0.88, 3.21, 1.98, 13.3, 7.38, 9.46, 1.46, 31.53, 5.22, 5.73, 1.1, 2.17, 23.79, 2.37, 1.1, 0.34, 1.58, 8.69, 0.76, -0.01, 0.09]} \ No newline at end of file diff --git a/annotations_filtered/k6TPsaQRQus_filtered.json b/annotations_filtered/k6TPsaQRQus_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d5278a2e42f5d7d15958176ad9ea8fe728053c1 --- /dev/null +++ b/annotations_filtered/k6TPsaQRQus_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.13], [10.0, 10.05], [15.0, 16.55], [18.0, 20.41], [22.0, 23.25], [24.0, 26.37], [28.0, 31.75], [32.0, 32.76], [35.0, 36.76], [40.0, 41.69], [43.0, 43.71], [46.0, 46.95], [51.0, 51.76], [55.0, 55.59]], "keep_status": [false, false, false, true, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.04, 0.0, 35.94, 34.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 33.98], ["throbbing", 16.84], ["hum", 12.42]], null, [["music", 37.02], ["hum", 16.22], ["mains hum", 9.78]], [["mains hum", 15.86], ["didgeridoo", 13.59], ["music", 12.85]], null, null, null, null, null, null, null], "duration": [0.13, 0.05, 1.55, 2.41, 1.25, 2.37, 3.75, 0.76, 1.76, 1.69, 0.71, 0.95, 0.76, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/k6TUgccyzNs_filtered.json b/annotations_filtered/k6TUgccyzNs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08f911ccf38b5297e69790f18a0a9a1b09a2b5d5 --- /dev/null +++ b/annotations_filtered/k6TUgccyzNs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 54.53], [59.0, 77.16], [82.0, 98.91], [102.0, 105.85], [108.0, 120.11], [123.0, 140.76], [141.0, 163.24], [167.0, 167.71]], "keep_status": [true, false, false, false, true, false, false, false], "silence_prob": [32.89, 37.36, 39.08, 35.18, 36.77, 40.01, 42.62, 0.0], "audiomae_on_audioset": [[["music", 49.96], ["foghorn", 7.71], ["synthesizer", 5.31]], [["music", 64.34], ["trombone", 10.53], ["brass instrument", 6.69]], [["music", 68.32], ["trombone", 7.25], ["musical instrument", 5.7]], [["music", 47.08], ["trombone", 14.84], ["brass instrument", 13.39]], [["music", 45.39], ["trombone", 12.82], ["brass instrument", 11.5]], [["music", 72.89], ["theremin", 5.23], ["musical instrument", 3.23]], [["music", 55.67], ["trombone", 16.65], ["brass instrument", 12.18]], null], "duration": [14.53, 18.16, 16.91, 3.85, 12.11, 17.76, 22.24, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/k6YFnGzHfKk_filtered.json b/annotations_filtered/k6YFnGzHfKk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c274d1d0324c31eca48f7a595da064ac7aa1905 --- /dev/null +++ b/annotations_filtered/k6YFnGzHfKk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.23], [12.0, 15.72], [18.0, 18.33], [19.0, 19.25], [22.0, 22.67], [24.0, 24.31], [25.0, 26.55], [27.0, 27.23], [28.0, 27.95], [29.0, 30.37], [31.0, 31.5], [33.0, 33.17], [35.0, 35.56], [37.0, 37.84], [43.0, 43.98], [55.0, 55.17], [56.0, 59.9], [63.0, 67.44], [68.0, 70.92], [73.0, 74.04], [74.0, 75.14], [76.0, 76.57], [79.0, 79.71], [81.0, 80.82], [81.0, 82.75], [85.0, 85.75], [86.0, 88.79], [95.0, 95.39], [99.0, 99.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.29, 75.23, 99.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.23, 3.72, 0.33, 0.25, 0.67, 0.31, 1.55, 0.23, -0.05, 1.37, 0.5, 0.17, 0.56, 0.84, 0.98, 0.17, 3.9, 4.44, 2.92, 1.04, 1.14, 0.57, 0.71, -0.18, 1.75, 0.75, 2.79, 0.39, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/k6_TBuGcwzA_filtered.json b/annotations_filtered/k6_TBuGcwzA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99df04d59303809c33b2b57d806748de3b76771c --- /dev/null +++ b/annotations_filtered/k6_TBuGcwzA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 24.6], [28.0, 43.87], [44.0, 46.23], [49.0, 50.65], [52.0, 56.91], [57.0, 58.14], [59.0, 60.2], [61.0, 62.51], [64.0, 66.14], [69.0, 86.1], [88.0, 89.46], [91.0, 95.66], [96.0, 103.38], [104.0, 106.96], [109.0, 108.94], [112.0, 118.71], [119.0, 124.01], [126.0, 126.2], [127.0, 128.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [57.97, 99.73, 96.29, 0.0, 98.73, 0.0, 0.0, 0.0, 100.0, 98.8, 0.0, 55.74, 64.75, 84.43, 0.0, 99.68, 99.44, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [12.6, 15.87, 2.23, 1.65, 4.91, 1.14, 1.2, 1.51, 2.14, 17.1, 1.46, 4.66, 7.38, 2.96, -0.06, 6.71, 5.01, 0.2, 1.95]} \ No newline at end of file diff --git a/annotations_filtered/k6_nTAS1M4M_filtered.json b/annotations_filtered/k6_nTAS1M4M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae1be273659894eeae66c4ba84081d1ddc74bb04 --- /dev/null +++ b/annotations_filtered/k6_nTAS1M4M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.05], [12.0, 13.46], [15.0, 16.58], [18.0, 20.07], [22.0, 22.71], [24.0, 25.03], [27.0, 27.78], [30.0, 31.94], [34.0, 35.09], [39.0, 56.49], [58.0, 59.21], [60.0, 61.57], [64.0, 65.89], [68.0, 68.64], [70.0, 71.46], [75.0, 77.41], [78.0, 81.7], [84.0, 85.29], [86.0, 88.62], [89.0, 91.4], [92.0, 93.6], [96.0, 100.45], [102.0, 105.75], [107.0, 109.04], [110.0, 115.08], [116.0, 118.86], [120.0, 125.66], [127.0, 128.01], [129.0, 131.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [100.0, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 92.31, 0.0, 90.43, 91.81, 0.0, 91.47, 46.43, 99.48, 99.84, 99.68, 97.73, 0.0, 45.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 25.71], ["moo", 21.82], ["livestock, farm animals, working animals", 20.61]], null, null, null, null, null, [["frog", 35.57], ["speech", 18.35], ["croak", 14.36]]], "duration": [5.05, 1.46, 1.58, 2.07, 0.71, 1.03, 0.78, 1.94, 1.09, 17.49, 1.21, 1.57, 1.89, 0.64, 1.46, 2.41, 3.7, 1.29, 2.62, 2.4, 1.6, 4.45, 3.75, 2.04, 5.08, 2.86, 5.66, 1.01, 2.3]} \ No newline at end of file diff --git a/annotations_filtered/k6dRH6fO3Xw_filtered.json b/annotations_filtered/k6dRH6fO3Xw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a24d7c6573d0f7829f34fbddcbccb4b90179685 --- /dev/null +++ b/annotations_filtered/k6dRH6fO3Xw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 33.56], [34.0, 34.57], [35.0, 35.7], [37.0, 96.47], [98.0, 122.37], [125.0, 139.28]], "keep_status": [false, false, false, false, true, false], "silence_prob": [31.72, 0.0, 0.0, 0.0, 31.75, 31.72], "audiomae_on_audioset": [[["hum", 35.97], ["throbbing", 22.6], ["music", 16.54]], null, null, null, [["music", 16.5], ["vehicle", 14.14], ["race car, auto racing", 13.77]], [["speech", 50.34], ["buzz", 12.47], ["vehicle", 8.93]]], "duration": [24.56, 0.57, 0.7, 59.47, 24.37, 14.28]} \ No newline at end of file diff --git a/annotations_filtered/k6eXuHmQoiM_filtered.json b/annotations_filtered/k6eXuHmQoiM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/k6eXuHmQoiM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/k6u3YvvvgjQ_filtered.json b/annotations_filtered/k6u3YvvvgjQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dff6ad67a8f91fe81867e6673b7a342350f5ce7b --- /dev/null +++ b/annotations_filtered/k6u3YvvvgjQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.31], [7.0, 8.19], [12.0, 12.18], [13.0, 13.42], [19.0, 19.87], [28.0, 31.48], [33.0, 34.13], [35.0, 36.69], [37.0, 38.92], [42.0, 47.12], [49.0, 61.35], [62.0, 64.57], [65.0, 66.97], [68.0, 68.62], [70.0, 70.48], [71.0, 73.21], [75.0, 75.73], [77.0, 77.84], [79.0, 80.42], [81.0, 81.6], [83.0, 86.09], [88.0, 90.51], [91.0, 91.81], [93.0, 94.44], [95.0, 96.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 99.48, 84.62, 53.22, 0.0, 0.0, 0.0, 70.3, 0.0, 0.0, 0.0, 0.0, 46.43, 38.09, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 18.21], ["thunk", 12.7], ["hum", 8.89]], [["music", 50.57], ["theremin", 15.41], ["walk, footsteps", 2.07]], null, null, null], "duration": [1.31, 1.19, 0.18, 0.42, 0.87, 3.48, 1.13, 1.69, 1.92, 5.12, 12.35, 2.57, 1.97, 0.62, 0.48, 2.21, 0.73, 0.84, 1.42, 0.6, 3.09, 2.51, 0.81, 1.44, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/k79KJYXrBkc_filtered.json b/annotations_filtered/k79KJYXrBkc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..98fcd1f9639fe492d66ab03dd4c82a881d85a014 --- /dev/null +++ b/annotations_filtered/k79KJYXrBkc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.44], [10.0, 10.47], [11.0, 12.01], [17.0, 17.68], [22.0, 22.18], [33.0, 33.24], [42.0, 42.4], [44.0, 44.71], [46.0, 46.06], [49.0, 49.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.44, 0.47, 1.01, 0.68, 0.18, 0.24, 0.4, 0.71, 0.06, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/k7WkN_gPNaM_filtered.json b/annotations_filtered/k7WkN_gPNaM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd11e5ee7bde182910dabc210ea63f5a21c7dd59 --- /dev/null +++ b/annotations_filtered/k7WkN_gPNaM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.05], [11.0, 10.99], [12.0, 13.34], [16.0, 16.6], [17.0, 17.58], [23.0, 23.68], [28.0, 29.15], [32.0, 32.98], [34.0, 36.36], [38.0, 39.51], [43.0, 44.37], [47.0, 48.17], [53.0, 59.31], [62.0, 62.58], [63.0, 64.1], [65.0, 65.16], [66.0, 66.56], [71.0, 72.62], [76.0, 77.68], [89.0, 88.96], [97.0, 97.83], [99.0, 100.6], [104.0, 105.38], [107.0, 107.76], [108.0, 110.12], [114.0, 114.91], [117.0, 118.07], [120.0, 120.85], [127.0, 128.21], [129.0, 130.71], [131.0, 132.51], [133.0, 133.49], [141.0, 141.93], [143.0, 144.56], [145.0, 146.23], [147.0, 148.96], [151.0, 151.71], [158.0, 157.81], [166.0, 170.31], [179.0, 179.56], [188.0, 190.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [73.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.04, 0.0, 0.0, 0.0, 75.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.1, 0.0, 41.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["sidetone", 69.9], ["speech", 11.07], ["busy signal", 7.08]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 24.36], ["speech", 20.12], ["music", 7.57]]], "duration": [2.05, -0.01, 1.34, 0.6, 0.58, 0.68, 1.15, 0.98, 2.36, 1.51, 1.37, 1.17, 6.31, 0.58, 1.1, 0.16, 0.56, 1.62, 1.68, -0.04, 0.83, 1.6, 1.38, 0.76, 2.12, 0.91, 1.07, 0.85, 1.21, 1.71, 1.51, 0.49, 0.93, 1.56, 1.23, 1.96, 0.71, -0.19, 4.31, 0.56, 2.32]} \ No newline at end of file diff --git a/annotations_filtered/k7_V-3ApEiM_filtered.json b/annotations_filtered/k7_V-3ApEiM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aad4df210fd012a9831cf5b7b9b3db9efa588149 --- /dev/null +++ b/annotations_filtered/k7_V-3ApEiM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.85], [7.0, 8.36], [9.0, 17.69], [19.0, 19.92], [21.0, 21.73], [23.0, 23.84], [26.0, 26.69], [30.0, 31.68], [32.0, 82.98], [85.0, 96.45], [98.0, 101.12], [102.0, 103.98], [105.0, 111.2], [112.0, 158.08]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 59.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.64, 51.99, 0.0, 30.71, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 35.65], ["music", 18.38], ["mains hum", 13.64]], null, null, [["hum", 26.91], ["music", 24.8], ["throbbing", 9.52]], null], "duration": [1.85, 1.36, 8.69, 0.92, 0.73, 0.84, 0.69, 1.68, 50.98, 11.45, 3.12, 1.98, 6.2, 46.08]} \ No newline at end of file diff --git a/annotations_filtered/k7ej9E5b8js_filtered.json b/annotations_filtered/k7ej9E5b8js_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..323fdcaabd94651403f5d222eca6689a303a29a7 --- /dev/null +++ b/annotations_filtered/k7ej9E5b8js_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.45], [20.0, 21.44], [22.0, 24.24], [25.0, 26.3], [27.0, 28.02], [30.0, 30.23], [31.0, 33.29], [34.0, 38.8], [41.0, 41.96], [43.0, 44.39], [46.0, 63.49], [64.0, 64.66], [69.0, 71.19], [73.0, 82.61], [83.0, 102.42], [103.0, 104.31], [105.0, 116.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 53.34, 0.0, 0.0, 0.0, 49.78, 41.76, 0.0, 0.0, 38.19, 0.0, 76.37, 36.9, 34.25, 0.0, 36.45], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 51.92], ["whale vocalization", 11.05], ["mains hum", 7.98]], [["hum", 55.87], ["mains hum", 24.74], ["throbbing", 11.41]], null, null, [["hum", 29.3], ["mains hum", 23.31], ["speech", 7.82]], null, null, [["hum", 34.12], ["mains hum", 18.14], ["throbbing", 7.54]], [["hum", 39.81], ["throbbing", 21.93], ["mains hum", 13.27]], null, [["throbbing", 47.18], ["hum", 27.8], ["heart sounds, heartbeat", 5.08]]], "duration": [1.45, 1.44, 2.24, 1.3, 1.02, 0.23, 2.29, 4.8, 0.96, 1.39, 17.49, 0.66, 2.19, 9.61, 19.42, 1.31, 11.58]} \ No newline at end of file diff --git a/annotations_filtered/k7o8U7h_YHM_filtered.json b/annotations_filtered/k7o8U7h_YHM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b0ae2a0a0f41f514008a4deb9ddc1cb5de105fa --- /dev/null +++ b/annotations_filtered/k7o8U7h_YHM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.61], [29.0, 29.51], [42.0, 42.62], [50.0, 51.43], [59.0, 60.07]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.61, 0.51, 0.62, 1.43, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/k87Hk4JNqGY_filtered.json b/annotations_filtered/k87Hk4JNqGY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfddf2918c8cad6c4bfe2b30a95090ed8d9e5a76 --- /dev/null +++ b/annotations_filtered/k87Hk4JNqGY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.67], [9.0, 10.69], [11.0, 16.12], [17.0, 17.56], [22.0, 23.09], [24.0, 33.54], [34.0, 38.33], [45.0, 45.08], [47.0, 48.57], [56.0, 57.7], [64.0, 64.99], [67.0, 67.66], [71.0, 72.5], [75.0, 75.61], [82.0, 82.27], [84.0, 85.62], [87.0, 88.33], [89.0, 90.8], [93.0, 94.95], [105.0, 107.37], [114.0, 115.38], [117.0, 117.85], [124.0, 125.73], [128.0, 129.42], [130.0, 130.98], [131.0, 133.62], [134.0, 134.59], [146.0, 148.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.98, 0.0, 100.0, 0.0, 0.0, 99.9, 61.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.76, 0.0, 83.52], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.67, 1.69, 5.12, 0.56, 1.09, 9.54, 4.33, 0.08, 1.57, 1.7, 0.99, 0.66, 1.5, 0.61, 0.27, 1.62, 1.33, 1.8, 1.95, 2.37, 1.38, 0.85, 1.73, 1.42, 0.98, 2.62, 0.59, 2.73]} \ No newline at end of file diff --git a/annotations_filtered/k8Do9tamQSM_filtered.json b/annotations_filtered/k8Do9tamQSM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e6cbbc9ecfb2faa8551fa82db35b5d442a17f0e --- /dev/null +++ b/annotations_filtered/k8Do9tamQSM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.32], [13.0, 13.37], [17.0, 19.41], [24.0, 24.97], [29.0, 38.16], [43.0, 45.71], [49.0, 57.87], [75.0, 80.62], [82.0, 83.0], [85.0, 85.06], [95.0, 98.9], [102.0, 102.59], [144.0, 146.03], [149.0, 149.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [99.98, 0.0, 99.26, 0.0, 64.29, 40.9, 87.0, 52.98, 0.0, 0.0, 41.81, 0.0, 99.85, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 62.56], ["singing bowl", 4.84], ["ambient music", 4.09]], null, null, null, null, [["speech", 27.88], ["baby laughter", 14.46], ["laughter", 8.55]], null, null, null], "duration": [3.32, 0.37, 2.41, 0.97, 9.16, 2.71, 8.87, 5.62, 1.0, 0.06, 3.9, 0.59, 2.03, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/k8Vn9zLollY_filtered.json b/annotations_filtered/k8Vn9zLollY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/k8Vn9zLollY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/k8VqG4ftlK0_filtered.json b/annotations_filtered/k8VqG4ftlK0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..099adda07563f8cbacf5c42ad94e94975daa2fd0 --- /dev/null +++ b/annotations_filtered/k8VqG4ftlK0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 34.42], [36.0, 39.82], [46.0, 47.19], [54.0, 56.13], [56.0, 59.26], [59.0, 62.7], [63.0, 63.36], [65.0, 67.51], [69.0, 76.28], [77.0, 80.96], [82.0, 95.52], [103.0, 104.16], [106.0, 107.79], [109.0, 110.32], [112.0, 112.29], [114.0, 114.15], [115.0, 116.24], [122.0, 122.59], [127.0, 128.34], [130.0, 131.6], [134.0, 135.65], [137.0, 138.1]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.91, 0.0, 98.01, 83.52, 59.68, 0.0, 54.3, 36.53, 99.56, 54.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 37.34], ["singing bowl", 17.57], ["hum", 10.94]], null, null, null, null, null, null, [["speech", 23.92], ["mains hum", 18.76], ["music", 14.22]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 3.82, 1.19, 2.13, 3.26, 3.7, 0.36, 2.51, 7.28, 3.96, 13.52, 1.16, 1.79, 1.32, 0.29, 0.15, 1.24, 0.59, 1.34, 1.6, 1.65, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/k8bJrJ7_LKI_filtered.json b/annotations_filtered/k8bJrJ7_LKI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5176d384b94693a21bc49b43ed934099979397f8 --- /dev/null +++ b/annotations_filtered/k8bJrJ7_LKI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.15], [13.0, 24.33], [36.0, 36.66], [39.0, 39.31], [58.0, 58.73], [59.0, 60.12], [62.0, 65.18], [66.0, 66.92], [71.0, 73.58], [75.0, 75.2], [77.0, 77.45], [79.0, 78.7], [79.0, 79.98], [83.0, 83.1], [91.0, 91.25], [94.0, 94.58], [98.0, 98.58], [99.0, 99.98], [100.0, 101.49], [106.0, 105.71], [106.0, 107.64], [109.0, 109.14], [111.0, 110.89], [111.0, 111.4], [113.0, 113.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [56.55, 53.78, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 87.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.15, 11.33, 0.66, 0.31, 0.73, 1.12, 3.18, 0.92, 2.58, 0.2, 0.45, -0.3, 0.98, 0.1, 0.25, 0.58, 0.58, 0.98, 1.49, -0.29, 1.64, 0.14, -0.11, 0.4, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/k8oFMkg7icg_filtered.json b/annotations_filtered/k8oFMkg7icg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df3757c43e57e4ab40d46593f5546e44e279e5ac --- /dev/null +++ b/annotations_filtered/k8oFMkg7icg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.86], [6.0, 21.83], [23.0, 46.43], [51.0, 54.94], [59.0, 59.49], [63.0, 71.63], [78.0, 78.78], [81.0, 82.0], [83.0, 86.02], [87.0, 87.72], [91.0, 101.39], [105.0, 115.94]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 31.4, 30.52, 31.29, 0.0, 31.44, 0.0, 0.0, 33.8, 0.0, 29.77, 31.85], "audiomae_on_audioset": [null, [["music", 69.92], ["effects unit", 6.37], ["musical instrument", 6.3]], [["music", 57.0], ["didgeridoo", 20.16], ["musical instrument", 8.98]], [["music", 39.65], ["trombone", 17.97], ["brass instrument", 15.19]], null, [["music", 73.42], ["theremin", 10.9], ["musical instrument", 5.86]], null, null, [["music", 27.61], ["theremin", 16.8], ["whale vocalization", 12.03]], null, [["music", 31.87], ["brass instrument", 25.54], ["trombone", 15.94]], [["music", 43.22], ["theremin", 20.37], ["musical instrument", 7.76]]], "duration": [0.86, 15.83, 23.43, 3.94, 0.49, 8.63, 0.78, 1.0, 3.02, 0.72, 10.39, 10.94]} \ No newline at end of file diff --git a/annotations_filtered/k8zDVhc4XPs_filtered.json b/annotations_filtered/k8zDVhc4XPs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54999e2aa72d20cf8e0cfa87dac3192dc0b19bec --- /dev/null +++ b/annotations_filtered/k8zDVhc4XPs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.55], [19.0, 24.87], [29.0, 47.12], [48.0, 49.44], [51.0, 84.03], [85.0, 88.92], [89.0, 111.45], [115.0, 115.79], [118.0, 117.85], [118.0, 123.99]], "keep_status": [false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 50.46, 67.63, 0.0, 0.0, 66.27, 42.62, 0.0, 0.0, 75.07], "audiomae_on_audioset": [null, null, null, null, null, null, [["whack, thwack", 33.34], ["music", 11.25], ["speech", 6.74]], null, null, null], "duration": [1.55, 5.87, 18.12, 1.44, 33.03, 3.92, 22.45, 0.79, -0.15, 5.99]} \ No newline at end of file diff --git a/annotations_filtered/k96h1dYQrj0_filtered.json b/annotations_filtered/k96h1dYQrj0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97a04bcef27d1c4be57b9f7171d3ffe556dc0032 --- /dev/null +++ b/annotations_filtered/k96h1dYQrj0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 12.66], [13.0, 18.64], [21.0, 22.13], [24.0, 25.32], [31.0, 31.4], [33.0, 32.95], [34.0, 34.35], [38.0, 37.94], [39.0, 39.29], [41.0, 41.42], [53.0, 54.09], [58.0, 66.97], [72.0, 71.88], [75.0, 76.62], [77.0, 78.58], [80.0, 81.11], [82.0, 88.84], [89.0, 91.98], [93.0, 96.01], [97.0, 99.0], [100.0, 100.57], [102.0, 106.1], [107.0, 107.57], [108.0, 111.2], [113.0, 114.29], [116.0, 117.91], [120.0, 123.11], [125.0, 128.43], [129.0, 129.93], [130.0, 131.55], [137.0, 145.72], [146.0, 146.92], [149.0, 150.45], [152.0, 153.69], [158.0, 160.78]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [33.95, 46.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 0.0, 0.0, 0.0, 91.81, 77.03, 100.0, 43.69, 0.0, 35.59, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 42.35], "audiomae_on_audioset": [[["speech", 19.0], ["music", 14.63], ["cattle, bovinae", 8.48]], [["mosquito", 23.23], ["fly, housefly", 13.09], ["speech", 11.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 78.43], ["music", 3.06], ["inside, small room", 2.62]], null, [["speech", 27.96], ["baby laughter", 10.0], ["belly laugh", 8.24]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 27.29], ["hum", 7.12], ["whale vocalization", 5.08]]], "duration": [9.66, 5.64, 1.13, 1.32, 0.4, -0.05, 0.35, -0.06, 0.29, 0.42, 1.09, 8.97, -0.12, 1.62, 1.58, 1.11, 6.84, 2.98, 3.01, 2.0, 0.57, 4.1, 0.57, 3.2, 1.29, 1.91, 3.11, 3.43, 0.93, 1.55, 8.72, 0.92, 1.45, 1.69, 2.78]} \ No newline at end of file diff --git a/annotations_filtered/k9DO26O6dIg_filtered.json b/annotations_filtered/k9DO26O6dIg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1191b4ee6f7935e1bff6782e3424be884dd90615 --- /dev/null +++ b/annotations_filtered/k9DO26O6dIg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.7], [3.0, 4.14], [5.0, 5.66], [11.0, 12.33], [15.0, 15.74], [19.0, 18.94], [24.0, 24.41], [26.0, 25.61], [30.0, 29.79], [32.0, 33.07], [39.0, 41.84], [49.0, 53.86], [55.0, 57.32], [62.0, 62.65], [81.0, 81.55], [83.0, 84.18], [90.0, 90.88], [93.0, 98.68], [102.0, 103.59], [106.0, 107.06], [110.0, 110.98], [120.0, 123.77], [127.0, 127.48], [135.0, 136.71], [137.0, 139.04], [140.0, 141.39], [143.0, 144.34], [146.0, 149.55], [151.0, 151.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82, 100.0, 98.99, 0.0, 0.0, 0.0, 0.0, 75.55, 0.0, 0.0, 0.0, 32.21, 0.0, 0.0, 79.76, 0.0, 0.0, 97.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["radio", 43.91], ["speech", 38.11], ["inside, small room", 2.11]], null, null, null, null, null, null, null], "duration": [0.7, 1.14, 0.66, 1.33, 0.74, -0.06, 0.41, -0.39, -0.21, 1.07, 2.84, 4.86, 2.32, 0.65, 0.55, 1.18, 0.88, 5.68, 1.59, 1.06, 0.98, 3.77, 0.48, 1.71, 2.04, 1.39, 1.34, 3.55, 0.21]} \ No newline at end of file diff --git a/annotations_filtered/k9WhxTOA19s_filtered.json b/annotations_filtered/k9WhxTOA19s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5429068e572bd7d682f69f8c5e6f29fbe4c8d37 --- /dev/null +++ b/annotations_filtered/k9WhxTOA19s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.94], [13.0, 13.27], [14.0, 14.82], [17.0, 16.58], [17.0, 18.25], [19.0, 19.52], [20.0, 22.05], [25.0, 25.96], [35.0, 34.89], [36.0, 41.84], [44.0, 46.21], [48.0, 49.32], [51.0, 54.46], [56.0, 58.46], [59.0, 66.9], [68.0, 70.16], [72.0, 73.65], [75.0, 84.86], [87.0, 88.35], [90.0, 90.29], [91.0, 92.62], [96.0, 96.82], [98.0, 98.1], [99.0, 100.84], [106.0, 115.38], [117.0, 125.78], [127.0, 127.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.46, 0.0, 0.0, 93.13, 92.15, 0.0, 87.74, 59.07, 84.25, 76.86, 0.0, 80.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.33, 32.26, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.75], ["helicopter", 38.81], ["effects unit", 2.06]], null], "duration": [1.94, 0.27, 0.82, -0.42, 1.25, 0.52, 2.05, 0.96, -0.11, 5.84, 2.21, 1.32, 3.46, 2.46, 7.9, 2.16, 1.65, 9.86, 1.35, 0.29, 1.62, 0.82, 0.1, 1.84, 9.38, 8.78, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/k9gcqiIfw8E_filtered.json b/annotations_filtered/k9gcqiIfw8E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4882a85eaef8369adab21e8a9ab5c4999705ef6f --- /dev/null +++ b/annotations_filtered/k9gcqiIfw8E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 28.05], [36.0, 42.72], [44.0, 47.48], [49.0, 50.6], [52.0, 54.28], [60.0, 62.31], [63.0, 64.4], [66.0, 72.47]], "keep_status": [true, true, false, false, true, false, false, true], "silence_prob": [34.95, 35.94, 97.73, 0.0, 39.15, 35.94, 0.0, 35.4], "audiomae_on_audioset": [[["music", 46.1], ["race car, auto racing", 5.98], ["car", 4.69]], [["crowd", 19.49], ["vehicle", 11.32], ["cheering", 10.29]], null, null, [["music", 11.12], ["sound effect", 5.69], ["effects unit", 4.56]], [["speech", 80.94], ["crowd", 3.8], ["echo", 1.37]], null, [["speech", 23.65], ["music", 12.09], ["trombone", 11.33]]], "duration": [27.05, 6.72, 3.48, 1.6, 2.28, 2.31, 1.4, 6.47]} \ No newline at end of file diff --git a/annotations_filtered/k9utcDoerr0_filtered.json b/annotations_filtered/k9utcDoerr0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c51ed02f65ad8b3a56832c8b60ac5bd2935392c --- /dev/null +++ b/annotations_filtered/k9utcDoerr0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.75], [12.0, 24.0], [28.0, 27.77], [28.0, 31.53], [34.0, 40.07], [46.0, 48.81], [49.0, 50.65], [54.0, 53.99], [58.0, 59.56], [61.0, 63.37], [67.0, 70.31], [71.0, 72.2], [75.0, 76.59], [77.0, 78.51], [81.0, 81.72], [84.0, 84.37], [88.0, 88.47], [90.0, 91.18], [92.0, 95.45], [97.0, 97.19], [99.0, 99.66], [101.0, 101.49], [102.0, 101.53], [103.0, 104.31], [107.0, 108.41], [111.0, 112.41], [113.0, 114.4], [120.0, 121.07], [126.0, 127.04], [129.0, 130.22], [135.0, 136.85], [141.0, 141.29], [143.0, 143.34], [147.0, 147.31], [151.0, 151.75], [153.0, 153.47], [155.0, 162.95], [164.0, 166.7], [169.0, 169.5], [172.0, 172.54], [179.0, 181.65]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 37.15, 0.0, 39.21, 99.62, 97.11, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.72, 33.03, 0.0, 0.0, 97.43], "audiomae_on_audioset": [null, [["frog", 23.67], ["animal", 9.65], ["livestock, farm animals, working animals", 6.99]], null, [["speech", 22.43], ["frog", 18.76], ["noise", 11.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 36.74], ["music", 5.52], ["hum", 5.26]], [["dog", 21.43], ["domestic animals, pets", 14.08], ["animal", 10.55]], null, null, null], "duration": [1.75, 12.0, -0.23, 3.53, 6.07, 2.81, 1.65, -0.01, 1.56, 2.37, 3.31, 1.2, 1.59, 1.51, 0.72, 0.37, 0.47, 1.18, 3.45, 0.19, 0.66, 0.49, -0.47, 1.31, 1.41, 1.41, 1.4, 1.07, 1.04, 1.22, 1.85, 0.29, 0.34, 0.31, 0.75, 0.47, 7.95, 2.7, 0.5, 0.54, 2.65]} \ No newline at end of file diff --git a/annotations_filtered/k9vHopyEtzs_filtered.json b/annotations_filtered/k9vHopyEtzs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1355e050b30fafb4fe76eb23b8ca7ca43c19fba --- /dev/null +++ b/annotations_filtered/k9vHopyEtzs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.76], [14.0, 14.67], [15.0, 16.07], [19.0, 19.85], [33.0, 33.47], [52.0, 52.56], [54.0, 78.46], [79.0, 91.23], [93.0, 117.49]], "keep_status": [false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.79, 33.03, 82.79], "audiomae_on_audioset": [null, null, null, null, null, null, [["whack, thwack", 31.37], ["breaking", 15.19], ["smash, crash", 10.49]], [["music", 22.5], ["speech", 18.53], ["throbbing", 11.77]], null], "duration": [1.76, 0.67, 1.07, 0.85, 0.47, 0.56, 24.46, 12.23, 24.49]} \ No newline at end of file diff --git a/annotations_filtered/kA10xksmpCI_filtered.json b/annotations_filtered/kA10xksmpCI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01eb153c0ab1124febace60d8648359deb845430 --- /dev/null +++ b/annotations_filtered/kA10xksmpCI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.81], [6.0, 6.57], [18.0, 20.48], [22.0, 23.92], [25.0, 25.07], [29.0, 30.48], [32.0, 33.13], [33.0, 35.16], [35.0, 37.91], [39.0, 41.37], [44.0, 46.84], [49.0, 50.21], [51.0, 51.8], [52.0, 55.02], [56.0, 58.14], [60.0, 61.86], [72.0, 72.91], [73.0, 74.24]], "keep_status": [false, false, false, false, false, false, false, true, true, true, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 41.2, 0.0, 0.0, 0.0, 0.0, 35.88, 38.66, 39.93, 43.74, 0.0, 0.0, 38.09, 37.63, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 77.67], ["synthesizer", 5.91], ["musical instrument", 3.8]], null, null, null, null, [["music", 45.39], ["mains hum", 10.68], ["hum", 8.14]], [["music", 45.83], ["synthesizer", 5.76], ["didgeridoo", 4.66]], [["music", 41.94], ["speech", 10.83], ["synthesizer", 8.57]], [["music", 41.24], ["musical instrument", 8.64], ["carnatic music", 7.2]], null, null, [["music", 53.48], ["musical instrument", 13.01], ["speech", 10.97]], [["music", 50.92], ["guitar", 7.83], ["musical instrument", 7.56]], null, null, null], "duration": [0.81, 0.57, 2.48, 1.92, 0.07, 1.48, 1.13, 2.16, 2.91, 2.37, 2.84, 1.21, 0.8, 3.02, 2.14, 1.86, 0.91, 1.24]} \ No newline at end of file diff --git a/annotations_filtered/kARcfM_M6VE_filtered.json b/annotations_filtered/kARcfM_M6VE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3102e6abb616fe264bd9a515e7163af9993ea2ed --- /dev/null +++ b/annotations_filtered/kARcfM_M6VE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 16.77], [28.0, 28.36], [43.0, 43.01], [53.0, 55.29], [57.0, 58.73], [59.0, 60.78], [68.0, 68.62], [81.0, 85.75], [90.0, 90.88], [101.0, 101.75], [104.0, 105.36], [110.0, 110.17], [114.0, 113.95], [117.0, 117.1], [125.0, 129.64]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [29.6, 0.0, 0.0, 28.65, 0.0, 0.0, 0.0, 29.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.64], "audiomae_on_audioset": [[["music", 58.75], ["didgeridoo", 17.94], ["musical instrument", 5.87]], null, null, [["throbbing", 31.13], ["hum", 29.33], ["music", 14.24]], null, null, null, [["music", 49.07], ["musical instrument", 8.4], ["synthesizer", 7.86]], null, null, null, null, null, null, [["sidetone", 29.94], ["hum", 21.43], ["mains hum", 18.46]]], "duration": [2.77, 0.36, 0.01, 2.29, 1.73, 1.78, 0.62, 4.75, 0.88, 0.75, 1.36, 0.17, -0.05, 0.1, 4.64]} \ No newline at end of file diff --git a/annotations_filtered/kATiU-cZCPc_filtered.json b/annotations_filtered/kATiU-cZCPc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8763ca9c1290579e5d9d89f20381a641c79309ff --- /dev/null +++ b/annotations_filtered/kATiU-cZCPc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 4.78], [8.0, 11.04], [12.0, 12.85], [15.0, 16.63], [19.0, 19.16], [21.0, 23.77], [25.0, 25.52], [26.0, 25.73], [26.0, 25.76], [26.0, 26.55], [32.0, 33.39], [38.0, 38.69], [52.0, 53.52], [57.0, 58.6], [64.0, 65.33], [66.0, 66.24], [68.0, 68.81], [70.0, 71.19], [72.0, 72.45], [74.0, 75.0], [77.0, 78.0], [80.0, 80.79], [82.0, 82.26], [84.0, 83.86], [87.0, 87.78], [89.0, 90.05], [92.0, 92.67], [95.0, 97.12], [99.0, 100.58], [102.0, 102.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [56.1, 53.84, 0.0, 0.0, 0.0, 71.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.6, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.78, 3.04, 0.85, 1.63, 0.16, 2.77, 0.52, -0.27, -0.24, 0.55, 1.39, 0.69, 1.52, 1.6, 1.33, 0.24, 0.81, 1.19, 0.45, 1.0, 1.0, 0.79, 0.26, -0.14, 0.78, 1.05, 0.67, 2.12, 1.58, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/kA_BtqogJNk_filtered.json b/annotations_filtered/kA_BtqogJNk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cdf1717a02024ec40fbfae21c4db042979c1240c --- /dev/null +++ b/annotations_filtered/kA_BtqogJNk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.4], [8.0, 8.67], [10.0, 31.13], [32.0, 32.85], [34.0, 34.21], [35.0, 37.0], [38.0, 38.3], [41.0, 44.59], [46.0, 46.99], [48.0, 48.51], [52.0, 52.07], [53.0, 55.8], [57.0, 61.1], [66.0, 66.34], [70.0, 72.93], [75.0, 75.15], [77.0, 77.52], [81.0, 83.59], [84.0, 85.18], [86.0, 88.2], [90.0, 92.75], [95.0, 97.48], [98.0, 99.93], [101.0, 102.03], [109.0, 110.34], [113.0, 114.08], [116.0, 117.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [62.17, 0.0, 54.5, 0.0, 0.0, 72.46, 0.0, 81.71, 0.0, 0.0, 0.0, 75.55, 56.63, 0.0, 71.57, 0.0, 0.0, 75.72, 0.0, 67.76, 74.29, 62.89, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.4, 0.67, 21.13, 0.85, 0.21, 2.0, 0.3, 3.59, 0.99, 0.51, 0.07, 2.8, 4.1, 0.34, 2.93, 0.15, 0.52, 2.59, 1.18, 2.2, 2.75, 2.48, 1.93, 1.03, 1.34, 1.08, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/kAd-K7nteyI_filtered.json b/annotations_filtered/kAd-K7nteyI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18a9b4128ade02e1b31c82c379cfbec12205e38d --- /dev/null +++ b/annotations_filtered/kAd-K7nteyI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.93], [26.0, 27.58], [31.0, 35.6], [45.0, 52.07], [53.0, 55.19], [59.0, 63.09], [65.0, 65.75], [67.0, 73.16], [77.0, 87.94], [89.0, 90.1], [93.0, 100.21], [104.0, 105.73], [106.0, 111.92], [113.0, 115.86], [117.0, 117.9], [118.0, 125.1], [125.0, 126.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 31.32, 30.06, 31.27, 29.71, 0.0, 30.59, 30.81, 0.0, 30.93, 0.0, 32.04, 30.78, 0.0, 30.05, 0.0], "audiomae_on_audioset": [null, null, [["music", 41.13], ["speech", 29.05], ["sidetone", 3.55]], [["hum", 43.67], ["mains hum", 27.42], ["throbbing", 19.16]], [["music", 40.85], ["throbbing", 22.42], ["hum", 7.58]], [["throbbing", 57.26], ["hum", 25.7], ["music", 7.96]], null, [["music", 45.48], ["speech", 21.75], ["throbbing", 14.8]], [["hum", 33.97], ["throbbing", 19.59], ["music", 19.45]], null, [["music", 44.27], ["throbbing", 15.59], ["hum", 13.22]], null, [["throbbing", 43.01], ["music", 20.65], ["hum", 14.66]], [["music", 47.32], ["speech", 9.04], ["throbbing", 6.18]], null, [["music", 65.07], ["throbbing", 7.62], ["hum", 4.24]], null], "duration": [0.93, 1.58, 4.6, 7.07, 2.19, 4.09, 0.75, 6.16, 10.94, 1.1, 7.21, 1.73, 5.92, 2.86, 0.9, 7.1, 1.59]} \ No newline at end of file diff --git a/annotations_filtered/kAi0cSCUWfg_filtered.json b/annotations_filtered/kAi0cSCUWfg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a3e6d524bdb4247424e8c22937861d2205072b0 --- /dev/null +++ b/annotations_filtered/kAi0cSCUWfg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.22], [41.0, 41.1], [48.0, 47.55], [48.0, 48.15], [52.0, 52.24], [58.0, 62.18], [65.0, 68.62], [88.0, 89.24], [92.0, 92.72], [105.0, 106.44], [107.0, 117.1], [118.0, 118.02], [120.0, 120.01], [126.0, 126.42], [132.0, 132.9], [137.0, 137.98], [139.0, 140.73], [142.0, 142.18], [145.0, 148.49], [149.0, 149.42], [158.0, 158.73], [161.0, 162.13], [166.0, 166.92], [169.0, 169.4], [171.0, 175.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.5, 32.07, 0.0, 0.0, 0.0, 36.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.57, 0.0, 0.0, 0.0, 0.0, 0.0, 31.55], "audiomae_on_audioset": [null, null, null, null, null, [["radio", 52.44], ["speech", 21.07], ["sidetone", 6.26]], [["radio", 49.62], ["speech", 28.72], ["sidetone", 15.99]], null, null, null, [["didgeridoo", 52.77], ["music", 14.9], ["speech", 5.43]], null, null, null, null, null, null, null, [["sidetone", 60.45], ["radio", 27.47], ["speech", 7.13]], null, null, null, null, null, [["speech", 21.31], ["radio", 14.28], ["sidetone", 12.15]]], "duration": [0.22, 0.1, -0.45, 0.15, 0.24, 4.18, 3.62, 1.24, 0.72, 1.44, 10.1, 0.02, 0.01, 0.42, 0.9, 0.98, 1.73, 0.18, 3.49, 0.42, 0.73, 1.13, 0.92, 0.4, 4.44]} \ No newline at end of file diff --git a/annotations_filtered/kAyPdsYr2K0_filtered.json b/annotations_filtered/kAyPdsYr2K0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..884269c06ddb206ffa12e7378384494b4a7f07a4 --- /dev/null +++ b/annotations_filtered/kAyPdsYr2K0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 13.63], [17.0, 29.89], [42.0, 45.33], [46.0, 60.35], [65.0, 84.37]], "keep_status": [false, true, false, false, false], "silence_prob": [42.48, 30.59, 40.04, 31.15, 29.14], "audiomae_on_audioset": [[["music", 63.88], ["didgeridoo", 8.46], ["hum", 5.48]], [["music", 15.17], ["fly, housefly", 11.97], ["buzz", 10.86]], [["music", 54.68], ["synthesizer", 8.52], ["throbbing", 8.28]], [["speech", 64.99], ["music", 16.87], ["animal", 9.6]], [["buzz", 36.64], ["music", 30.57], ["hum", 3.68]]], "duration": [10.63, 12.89, 3.33, 14.35, 19.37]} \ No newline at end of file diff --git a/annotations_filtered/kBEhz8vw2AM_filtered.json b/annotations_filtered/kBEhz8vw2AM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a087d1d6e9107bba2c5cc96e6d06c7d282bc3449 --- /dev/null +++ b/annotations_filtered/kBEhz8vw2AM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.28], [5.0, 5.46], [6.0, 6.62], [9.0, 9.39], [10.0, 10.45], [11.0, 11.37], [13.0, 13.34], [15.0, 15.21], [16.0, 17.49], [18.0, 18.89], [20.0, 20.22], [21.0, 27.26], [41.0, 41.61], [88.0, 88.62], [91.0, 91.32], [93.0, 93.56], [95.0, 95.22], [97.0, 97.33], [98.0, 98.68], [101.0, 101.06], [104.0, 104.58], [109.0, 109.81], [113.0, 115.59], [116.0, 118.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.36, 87.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["stomach rumble", 9.39], ["hum", 7.35], ["insect", 7.05]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.28, 0.46, 0.62, 0.39, 0.45, 0.37, 0.34, 0.21, 1.49, 0.89, 0.22, 6.26, 0.61, 0.62, 0.32, 0.56, 0.22, 0.33, 0.68, 0.06, 0.58, 0.81, 2.59, 2.1]} \ No newline at end of file diff --git a/annotations_filtered/kBErrmmqnkI_filtered.json b/annotations_filtered/kBErrmmqnkI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc7b8e9f07b7ca43e5dac68639387495b53d1198 --- /dev/null +++ b/annotations_filtered/kBErrmmqnkI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 51.26], [52.0, 78.81], [83.0, 97.88], [105.0, 106.2], [114.0, 114.22], [118.0, 127.94], [131.0, 162.28], [165.0, 180.94], [182.0, 185.36], [189.0, 190.49], [193.0, 193.5], [194.0, 199.94], [200.0, 200.26], [201.0, 201.24], [203.0, 204.25]], "keep_status": [true, false, true, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [30.12, 30.1, 29.29, 0.0, 0.0, 29.25, 0.0, 29.19, 33.17, 0.0, 0.0, 32.75, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 52.21], ["theremin", 7.94], ["musical instrument", 6.19]], [["music", 43.91], ["clarinet", 17.14], ["trombone", 14.0]], [["music", 19.99], ["boing", 10.47], ["cattle, bovinae", 9.42]], null, null, [["livestock, farm animals, working animals", 31.73], ["cattle, bovinae", 24.42], ["moo", 18.21]], null, [["music", 27.27], ["trombone", 15.39], ["brass instrument", 9.26]], [["speech", 66.24], ["whimper", 10.46], ["crying, sobbing", 6.09]], null, null, [["speech", 38.06], ["clip-clop", 10.01], ["horse", 8.01]], null, null, null], "duration": [22.26, 26.81, 14.88, 1.2, 0.22, 9.94, 31.28, 15.94, 3.36, 1.49, 0.5, 5.94, 0.26, 0.24, 1.25]} \ No newline at end of file diff --git a/annotations_filtered/kBJDz4ylQO0_filtered.json b/annotations_filtered/kBJDz4ylQO0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8313ce35260caaa0dc9975f1422ce1c329a7f8f0 --- /dev/null +++ b/annotations_filtered/kBJDz4ylQO0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.91], [6.0, 6.72], [27.0, 27.53], [33.0, 34.47], [43.0, 44.47], [47.0, 47.29], [49.0, 50.14], [51.0, 51.26], [53.0, 54.04], [55.0, 56.07], [58.0, 60.44], [63.0, 80.47], [83.0, 105.85], [111.0, 111.99], [112.0, 113.21], [114.0, 115.69], [128.0, 129.25], [130.0, 131.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.03, 30.32, 30.41, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 55.5], ["didgeridoo", 18.35], ["speech", 9.09]], [["music", 72.87], ["didgeridoo", 9.53], ["boing", 3.95]], [["music", 31.51], ["speech", 9.39], ["tubular bells", 5.3]], null, null, null, null, null], "duration": [0.91, 0.72, 0.53, 1.47, 1.47, 0.29, 1.14, 0.26, 1.04, 1.07, 2.44, 17.47, 22.85, 0.99, 1.21, 1.69, 1.25, 1.13]} \ No newline at end of file diff --git a/annotations_filtered/kBTPEpA8BzU_filtered.json b/annotations_filtered/kBTPEpA8BzU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ab374097817636fc4e83f6fffb653179b6c4ebc --- /dev/null +++ b/annotations_filtered/kBTPEpA8BzU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[54.0, 78.39], [79.0, 79.12], [86.0, 93.16], [94.0, 103.72], [106.0, 162.35], [167.0, 168.24]], "keep_status": [false, false, false, false, false, false], "silence_prob": [30.83, 0.0, 29.84, 31.88, 0.0, 0.0], "audiomae_on_audioset": [[["mains hum", 29.48], ["hum", 27.65], ["speech", 17.34]], null, [["speech", 62.22], ["explosion", 7.94], ["music", 4.17]], [["speech", 59.69], ["electric shaver, electric razor", 10.1], ["noise", 5.27]], null, null], "duration": [24.39, 0.12, 7.16, 9.72, 56.35, 1.24]} \ No newline at end of file diff --git a/annotations_filtered/kBwVWrBk_uo_filtered.json b/annotations_filtered/kBwVWrBk_uo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9efc0491713b8049a5b295426953256d967bcb98 --- /dev/null +++ b/annotations_filtered/kBwVWrBk_uo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 13.93], [16.0, 19.33], [20.0, 20.83], [22.0, 25.78], [27.0, 28.83], [30.0, 32.43], [35.0, 36.61], [39.0, 39.56], [40.0, 41.99], [43.0, 44.98], [46.0, 54.51], [55.0, 57.37], [58.0, 59.43], [62.0, 64.3], [65.0, 66.19], [68.0, 69.67], [72.0, 73.63], [74.0, 85.55], [87.0, 92.26], [93.0, 100.74], [102.0, 103.2], [104.0, 104.65], [105.0, 104.85], [105.0, 104.89], [105.0, 104.92], [108.0, 113.19], [114.0, 116.01], [119.0, 175.31], [175.0, 194.22]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [65.55, 40.41, 0.0, 75.72, 0.0, 75.39, 0.0, 0.0, 0.0, 0.0, 54.43, 78.55, 0.0, 48.91, 0.0, 0.0, 0.0, 43.96, 54.43, 45.46, 0.0, 0.0, 0.0, 0.0, 0.0, 58.72, 67.76, 0.0, 36.85], "audiomae_on_audioset": [null, [["music", 18.8], ["whale vocalization", 9.78], ["chime", 8.31]], null, null, null, null, null, null, null, null, null, null, null, [["chime", 21.17], ["wind chime", 16.96], ["glass", 8.32]], null, null, null, [["hum", 16.8], ["music", 16.11], ["speech", 15.41]], null, [["hum", 28.69], ["music", 25.35], ["mains hum", 10.66]], null, null, null, null, null, null, null, null, [["music", 43.71], ["singing bowl", 13.6], ["chirp tone", 5.68]]], "duration": [11.93, 3.33, 0.83, 3.78, 1.83, 2.43, 1.61, 0.56, 1.99, 1.98, 8.51, 2.37, 1.43, 2.3, 1.19, 1.67, 1.63, 11.55, 5.26, 7.74, 1.2, 0.65, -0.15, -0.11, -0.08, 5.19, 2.01, 56.31, 19.22]} \ No newline at end of file diff --git a/annotations_filtered/kC44tlr_KsU_filtered.json b/annotations_filtered/kC44tlr_KsU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e1cb350ec633ba242215f6b00d05c0d587484b4 --- /dev/null +++ b/annotations_filtered/kC44tlr_KsU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 26.6], [28.0, 34.42], [36.0, 38.03], [40.0, 40.9], [41.0, 46.21], [47.0, 51.24], [53.0, 53.57], [55.0, 55.16], [57.0, 57.97], [61.0, 71.1], [71.0, 93.68], [94.0, 96.03], [96.0, 97.11], [98.0, 143.14], [146.0, 151.51]], "keep_status": [true, false, false, false, true, true, false, false, false, false, true, true, false, false, false], "silence_prob": [34.27, 60.23, 72.9, 0.0, 49.68, 42.44, 0.0, 0.0, 0.0, 48.78, 30.79, 29.66, 0.0, 0.0, 95.78], "audiomae_on_audioset": [[["speech", 33.81], ["echo", 12.71], ["sound effect", 3.97]], null, null, null, [["effects unit", 23.37], ["music", 22.34], ["speech", 12.62]], [["music", 35.7], ["hum", 16.62], ["throbbing", 10.49]], null, null, null, [["music", 74.7], ["effects unit", 9.12], ["guitar", 3.86]], [["music", 59.65], ["fly, housefly", 5.25], ["throbbing", 4.11]], [["electric shaver, electric razor", 15.02], ["mains hum", 14.34], ["speech", 12.64]], null, null, null], "duration": [6.6, 6.42, 2.03, 0.9, 5.21, 4.24, 0.57, 0.16, 0.97, 10.1, 22.68, 2.03, 1.11, 45.14, 5.51]} \ No newline at end of file diff --git a/annotations_filtered/kCb1R69h92Q_filtered.json b/annotations_filtered/kCb1R69h92Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18cb8a685266613fd447b78f09465a72d875d71d --- /dev/null +++ b/annotations_filtered/kCb1R69h92Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 43.83], [45.0, 45.62], [47.0, 57.37], [58.0, 73.41], [74.0, 86.64], [89.0, 90.42], [94.0, 95.1], [100.0, 102.37], [104.0, 106.3], [110.0, 110.81], [111.0, 113.66], [117.0, 119.28], [121.0, 124.56], [126.0, 128.06], [131.0, 139.89], [141.0, 142.03], [143.0, 145.29], [146.0, 147.53], [149.0, 149.91], [151.0, 151.61], [155.0, 162.16], [163.0, 166.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 84.07, 89.36, 78.89, 0.0, 0.0, 98.93, 100.0, 0.0, 99.99, 99.52, 99.82, 36.9, 98.01, 0.0, 100.0, 0.0, 0.0, 0.0, 99.8, 99.26], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 33.42], ["music", 24.13], ["synthesizer", 4.41]], null, null, null, null, null, null, null, null], "duration": [42.83, 0.62, 10.37, 15.41, 12.64, 1.42, 1.1, 2.37, 2.3, 0.81, 2.66, 2.28, 3.56, 2.06, 8.89, 1.03, 2.29, 1.53, 0.91, 0.61, 7.16, 3.35]} \ No newline at end of file diff --git a/annotations_filtered/kCqEADYRg8g_filtered.json b/annotations_filtered/kCqEADYRg8g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7a57c3cb07c577eb4953a0d5034cc59d2bd4451 --- /dev/null +++ b/annotations_filtered/kCqEADYRg8g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.0], [24.0, 24.75], [27.0, 29.0], [30.0, 30.38], [33.0, 33.54], [36.0, 37.13], [41.0, 41.23], [49.0, 49.65], [55.0, 55.81], [57.0, 57.28], [69.0, 74.95], [77.0, 78.7], [80.0, 86.26], [88.0, 87.61], [92.0, 93.61], [95.0, 95.12], [98.0, 98.05], [106.0, 124.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 77.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.31, 0.0, 39.63, 0.0, 0.0, 0.0, 0.0, 40.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 43.64], ["speech", 38.24], ["inside, small room", 2.02]], null, [["music", 41.52], ["cattle, bovinae", 9.01], ["moo", 5.65]], null, null, null, null, [["speech", 55.89], ["music", 22.02], ["inside, small room", 2.41]]], "duration": [1.0, 0.75, 2.0, 0.38, 0.54, 1.13, 0.23, 0.65, 0.81, 0.28, 5.95, 1.7, 6.26, -0.39, 1.61, 0.12, 0.05, 18.51]} \ No newline at end of file diff --git a/annotations_filtered/kCrtP_gPMwk_filtered.json b/annotations_filtered/kCrtP_gPMwk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..501020f55a9e2dd35422d46643baff12848e363a --- /dev/null +++ b/annotations_filtered/kCrtP_gPMwk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.16], [3.0, 3.65], [4.0, 4.29], [5.0, 6.76], [7.0, 12.41], [15.0, 15.6], [17.0, 19.4], [21.0, 21.39], [22.0, 22.33], [23.0, 23.43], [24.0, 25.62], [29.0, 32.61], [33.0, 33.91], [38.0, 41.79], [42.0, 44.39], [45.0, 45.45], [48.0, 48.09], [50.0, 54.5], [65.0, 68.0], [69.0, 71.25], [74.0, 78.24], [79.0, 81.03], [85.0, 85.33], [89.0, 91.62], [94.0, 95.42], [97.0, 97.38], [98.0, 101.6], [107.0, 110.49], [114.0, 116.7], [118.0, 118.79], [121.0, 121.44], [123.0, 124.28], [126.0, 125.76], [130.0, 131.55], [138.0, 138.11], [140.0, 140.19], [147.0, 151.12], [151.0, 154.48], [158.0, 162.13], [162.0, 162.82], [164.0, 164.78], [169.0, 169.97], [181.0, 180.74], [191.0, 192.23], [194.0, 194.56], [195.0, 195.91], [196.0, 196.6], [202.0, 202.2], [203.0, 204.08], [212.0, 212.26], [214.0, 216.01], [216.0, 217.88], [222.0, 222.84], [229.0, 229.51], [230.0, 231.09], [231.0, 234.52], [235.0, 234.82], [237.0, 237.69], [240.0, 240.61], [244.0, 245.27], [245.0, 245.44], [250.0, 252.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 88.83, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 50.26, 0.0, 60.89, 52.51, 0.0, 0.0, 34.37, 99.92, 95.91, 40.66, 73.82, 0.0, 60.6, 0.0, 0.0, 36.11, 33.95, 39.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.74, 44.46, 79.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.05, 0.0, 0.0, 0.0, 0.0, 42.51, 0.0, 0.0, 0.0, 0.0, 0.0, 76.2], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 74.52], ["beatboxing", 6.13], ["laughter", 2.26]], null, null, [["howl", 29.99], ["animal", 12.13], ["domestic animals, pets", 10.04]], null, null, null, null, null, [["music", 33.58], ["clarinet", 13.47], ["wind instrument, woodwind instrument", 12.75]], [["music", 43.42], ["musical instrument", 11.0], ["wind instrument, woodwind instrument", 9.77]], [["music", 61.45], ["musical instrument", 7.12], ["whimper", 3.45]], null, null, null, null, null, null, null, [["thunk", 14.41], ["music", 10.26], ["speech", 7.91]], [["tuning fork", 34.44], ["speech", 32.29], ["sine wave", 10.76]], null, null, null, null, null, null, null, null, null, null, null, null, [["thunk", 40.09], ["bouncing", 8.89], ["music", 6.59]], null, null, null, null, [["speech", 36.75], ["whimper", 7.67], ["owl", 5.32]], null, null, null, null, null, null], "duration": [1.16, 0.65, 0.29, 1.76, 5.41, 0.6, 2.4, 0.39, 0.33, 0.43, 1.62, 3.61, 0.91, 3.79, 2.39, 0.45, 0.09, 4.5, 3.0, 2.25, 4.24, 2.03, 0.33, 2.62, 1.42, 0.38, 3.6, 3.49, 2.7, 0.79, 0.44, 1.28, -0.24, 1.55, 0.11, 0.19, 4.12, 3.48, 4.13, 0.82, 0.78, 0.97, -0.26, 1.23, 0.56, 0.91, 0.6, 0.2, 1.08, 0.26, 2.01, 1.88, 0.84, 0.51, 1.09, 3.52, -0.18, 0.69, 0.61, 1.27, 0.44, 2.73]} \ No newline at end of file diff --git a/annotations_filtered/kCsm28_ULw4_filtered.json b/annotations_filtered/kCsm28_ULw4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a96892735a8fc7afe178b6a00b90276d041e6c4b --- /dev/null +++ b/annotations_filtered/kCsm28_ULw4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 48.1], [51.0, 52.32], [55.0, 56.98], [59.0, 59.05], [59.0, 59.51], [61.0, 66.48], [69.0, 70.12]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [69.2, 0.0, 0.0, 0.0, 0.0, 79.41, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [17.1, 1.32, 1.98, 0.05, 0.51, 5.48, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/kCtsoBRr1Z0_filtered.json b/annotations_filtered/kCtsoBRr1Z0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..425fca83b6366f4d147f96d43c80f296bbedd7ae --- /dev/null +++ b/annotations_filtered/kCtsoBRr1Z0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.78], [12.0, 12.72], [14.0, 13.74], [18.0, 21.0], [21.0, 21.86], [25.0, 35.09], [36.0, 36.41], [38.0, 39.26], [40.0, 42.45], [46.0, 46.99], [48.0, 49.42], [52.0, 52.93], [61.0, 61.28], [62.0, 62.75], [72.0, 75.63], [81.0, 81.36], [82.0, 83.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 58.81, 0.0, 64.63, 0.0, 0.0, 89.54, 0.0, 0.0, 0.0, 0.0, 0.0, 58.13, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.78, 0.72, -0.26, 3.0, 0.86, 10.09, 0.41, 1.26, 2.45, 0.99, 1.42, 0.93, 0.28, 0.75, 3.63, 0.36, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/kCxqmweKXZ0_filtered.json b/annotations_filtered/kCxqmweKXZ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d49eb477d59f739c4d228e3562cbe3ec7baa5047 --- /dev/null +++ b/annotations_filtered/kCxqmweKXZ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 14.76], [16.0, 29.52], [30.0, 30.75], [32.0, 34.62], [39.0, 40.34], [42.0, 45.01], [47.0, 47.7], [49.0, 50.82], [54.0, 57.25], [59.0, 61.52], [63.0, 62.94], [73.0, 73.87], [76.0, 94.56], [96.0, 96.42], [98.0, 98.04], [100.0, 140.19]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [29.98, 32.38, 0.0, 29.43, 0.0, 38.4, 0.0, 0.0, 30.49, 30.43, 0.0, 0.0, 29.56, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 32.26], ["mains hum", 25.16], ["electric shaver, electric razor", 14.82]], [["music", 48.35], ["throbbing", 19.65], ["hum", 16.66]], null, [["livestock, farm animals, working animals", 36.89], ["moo", 35.81], ["cattle, bovinae", 25.54]], null, [["hum", 65.74], ["throbbing", 12.68], ["mains hum", 12.01]], null, null, [["music", 22.84], ["hum", 12.47], ["mains hum", 10.01]], [["hum", 32.17], ["music", 18.71], ["mains hum", 14.46]], null, null, [["hum", 38.74], ["throbbing", 24.84], ["music", 16.58]], null, null, null], "duration": [7.76, 13.52, 0.75, 2.62, 1.34, 3.01, 0.7, 1.82, 3.25, 2.52, -0.06, 0.87, 18.56, 0.42, 0.04, 40.19]} \ No newline at end of file diff --git a/annotations_filtered/kD0zHgK3BJ8_filtered.json b/annotations_filtered/kD0zHgK3BJ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8bc71b96463b3d93d48570c65b37b3c779e34cbf --- /dev/null +++ b/annotations_filtered/kD0zHgK3BJ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.89], [4.0, 4.75], [6.0, 10.77], [12.0, 12.9], [15.0, 18.76], [22.0, 22.33], [24.0, 24.36], [31.0, 31.06], [37.0, 38.35], [40.0, 41.25], [43.0, 43.53], [44.0, 49.35], [54.0, 57.06], [63.0, 64.07], [65.0, 66.31], [67.0, 67.64], [69.0, 69.52], [71.0, 71.46], [75.0, 75.25], [80.0, 80.43], [83.0, 83.37], [84.0, 84.94], [87.0, 87.86], [89.0, 89.4], [90.0, 92.8], [94.0, 94.88], [97.0, 98.17], [99.0, 99.72], [102.0, 105.43], [108.0, 108.97], [113.0, 115.43], [120.0, 122.1], [124.0, 129.27], [131.0, 131.89], [133.0, 135.82], [137.0, 144.61], [145.0, 145.88], [148.0, 149.61], [151.0, 151.48], [153.0, 154.33], [156.0, 157.3], [158.0, 160.41], [162.0, 163.34], [169.0, 175.32], [177.0, 179.07], [180.0, 182.21], [183.0, 183.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 95.09, 0.0, 89.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.54, 67.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.64, 0.0, 0.0, 0.0, 96.42, 0.0, 82.79, 99.05, 78.04, 0.0, 90.43, 83.7, 0.0, 0.0, 0.0, 0.0, 0.0, 90.95, 0.0, 76.86, 93.76, 87.74, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 36.48], ["mains hum", 13.63], ["throbbing", 10.52]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 0.75, 4.77, 0.9, 3.76, 0.33, 0.36, 0.06, 1.35, 1.25, 0.53, 5.35, 3.06, 1.07, 1.31, 0.64, 0.52, 0.46, 0.25, 0.43, 0.37, 0.94, 0.86, 0.4, 2.8, 0.88, 1.17, 0.72, 3.43, 0.97, 2.43, 2.1, 5.27, 0.89, 2.82, 7.61, 0.88, 1.61, 0.48, 1.33, 1.3, 2.41, 1.34, 6.32, 2.07, 2.21, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/kDDU-k-5v6s_filtered.json b/annotations_filtered/kDDU-k-5v6s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07cbc9d44932cf66fc68abef344b6cd6ed45dfb1 --- /dev/null +++ b/annotations_filtered/kDDU-k-5v6s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 26.0], [29.0, 29.29], [30.0, 32.09], [35.0, 36.64], [38.0, 50.41], [54.0, 77.94], [78.0, 103.03], [105.0, 105.21], [105.0, 108.46], [113.0, 115.18], [116.0, 118.5], [121.0, 121.09], [122.0, 122.27], [128.0, 128.65], [129.0, 135.31], [138.0, 148.83]], "keep_status": [false, false, true, false, true, true, true, false, false, true, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 33.14, 0.0, 28.88, 29.15, 29.35, 0.0, 29.32, 30.0, 32.76, 0.0, 0.0, 0.0, 29.86, 28.71], "audiomae_on_audioset": [null, null, [["music", 26.44], ["speech", 20.39], ["inside, small room", 4.16]], null, [["music", 43.15], ["speech", 3.45], ["animal", 3.1]], [["music", 44.82], ["buzz", 9.6], ["fly, housefly", 4.75]], [["music", 35.05], ["roaring cats (lions, tigers)", 8.34], ["animal", 7.4]], null, [["speech", 33.89], ["music", 25.6], ["electric shaver, electric razor", 15.66]], [["music", 40.41], ["fart", 5.86], ["fly, housefly", 4.06]], [["hum", 41.8], ["throbbing", 17.25], ["music", 14.55]], null, null, null, [["music", 23.81], ["speech", 20.92], ["mains hum", 14.55]], [["speech", 32.36], ["music", 13.49], ["vehicle", 8.68]]], "duration": [1.0, 0.29, 2.09, 1.64, 12.41, 23.94, 25.03, 0.21, 3.46, 2.18, 2.5, 0.09, 0.27, 0.65, 6.31, 10.83]} \ No newline at end of file diff --git a/annotations_filtered/kDFwUhn_1Ao_filtered.json b/annotations_filtered/kDFwUhn_1Ao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc18f5dc24b2882ee1f9854941c4cbfe94f53ae4 --- /dev/null +++ b/annotations_filtered/kDFwUhn_1Ao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.56]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.56]} \ No newline at end of file diff --git a/annotations_filtered/kDSiyU72RpA_filtered.json b/annotations_filtered/kDSiyU72RpA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f06761400f8a665b28a8be0f4069e0aeb63507d --- /dev/null +++ b/annotations_filtered/kDSiyU72RpA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.95], [11.0, 11.8], [13.0, 17.71], [18.0, 19.11], [20.0, 21.25], [24.0, 24.44], [27.0, 27.62], [28.0, 29.49], [41.0, 41.25], [51.0, 55.11], [59.0, 59.17], [60.0, 60.57], [63.0, 62.92], [66.0, 66.73], [68.0, 68.84], [73.0, 73.03], [77.0, 76.84], [78.0, 78.48], [79.0, 79.95], [81.0, 81.11], [85.0, 85.72], [90.0, 91.05], [92.0, 92.35], [93.0, 102.03], [104.0, 109.54], [111.0, 112.02], [113.0, 117.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [87.0, 0.0, 95.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 35.94, 0.0, 98.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["explosion", 14.38], ["wood", 13.74], ["splinter", 13.39]], null, null], "duration": [5.95, 0.8, 4.71, 1.11, 1.25, 0.44, 0.62, 1.49, 0.25, 4.11, 0.17, 0.57, -0.08, 0.73, 0.84, 0.03, -0.16, 0.48, 0.95, 0.11, 0.72, 1.05, 0.35, 9.03, 5.54, 1.02, 4.29]} \ No newline at end of file diff --git a/annotations_filtered/kDTjN5dVCzg_filtered.json b/annotations_filtered/kDTjN5dVCzg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26482692417579631dd86d735cc4326802471183 --- /dev/null +++ b/annotations_filtered/kDTjN5dVCzg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.38], [15.0, 15.08], [20.0, 23.26], [41.0, 41.62], [47.0, 58.28], [82.0, 83.4], [87.0, 101.09], [102.0, 102.54], [104.0, 109.17], [118.0, 120.51], [121.0, 122.2], [124.0, 124.77]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 49.36, 0.0, 29.81, 0.0, 70.86, 0.0, 34.03, 99.95, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 82.69], ["sidetone", 2.24], ["music", 2.23]], null, [["throbbing", 34.24], ["music", 27.85], ["didgeridoo", 13.15]], null, null, null, [["speech", 53.34], ["arrow", 5.4], ["door", 3.35]], null, null, null], "duration": [0.38, 0.08, 3.26, 0.62, 11.28, 1.4, 14.09, 0.54, 5.17, 2.51, 1.2, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/kDeUWLhm-0g_filtered.json b/annotations_filtered/kDeUWLhm-0g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39ccfb1f5884adbc750a694f90ff278c9fa406bd --- /dev/null +++ b/annotations_filtered/kDeUWLhm-0g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.57], [3.0, 3.11], [9.0, 9.71], [12.0, 12.56], [15.0, 19.25], [21.0, 22.91], [27.0, 29.83], [31.0, 32.17], [33.0, 33.64], [48.0, 51.22], [56.0, 56.81], [68.0, 68.1], [77.0, 78.98], [81.0, 82.59], [88.0, 93.61], [96.0, 96.2], [110.0, 109.7], [115.0, 114.67], [122.0, 122.62]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 39.63, 0.0, 37.77, 0.0, 0.0, 59.96, 0.0, 0.0, 0.0, 0.0, 60.79, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["hum", 16.97], ["fly, housefly", 15.5], ["bee, wasp, etc.", 13.04]], null, [["honk", 15.62], ["animal", 14.32], ["goose", 14.14]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.57, 0.11, 0.71, 0.56, 4.25, 1.91, 2.83, 1.17, 0.64, 3.22, 0.81, 0.1, 1.98, 1.59, 5.61, 0.2, -0.3, -0.33, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/kDfvxJUxL10_filtered.json b/annotations_filtered/kDfvxJUxL10_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d90f4677b2dd411e8dc16a58adce6d774163a895 --- /dev/null +++ b/annotations_filtered/kDfvxJUxL10_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.6], [5.0, 5.17], [6.0, 6.66], [12.0, 13.2], [24.0, 24.33], [26.0, 26.28], [32.0, 33.44], [40.0, 40.78], [55.0, 57.57], [58.0, 60.39], [65.0, 68.37], [72.0, 72.03], [73.0, 77.77], [99.0, 98.81], [105.0, 105.26], [111.0, 111.81], [119.0, 121.12], [125.0, 126.01], [127.0, 128.24], [133.0, 135.18], [139.0, 142.72], [143.0, 144.27], [144.0, 146.37], [149.0, 149.55], [150.0, 150.87], [153.0, 155.97], [160.0, 173.28], [174.0, 175.24], [178.0, 178.46], [181.0, 181.57], [184.0, 185.26], [186.0, 187.25], [188.0, 189.21], [190.0, 192.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.89, 50.21, 52.39, 0.0, 37.0, 0.0, 0.0, 0.0, 35.25, 0.0, 0.0, 54.63, 45.59, 0.0, 43.0, 0.0, 0.0, 56.25, 36.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 41.62], ["mains hum", 31.16], ["throbbing", 9.16]], null, null, null, [["speech", 27.34], ["whale vocalization", 11.99], ["dial tone", 8.45]], null, null, null, [["hum", 32.55], ["throbbing", 20.51], ["mains hum", 9.04]], null, [["fart", 27.56], ["speech", 15.84], ["frog", 7.94]], null, null, null, [["speech", 35.92], ["fart", 13.56], ["hum", 7.12]], null, null, null, null, null, null, null], "duration": [0.6, 0.17, 0.66, 1.2, 0.33, 0.28, 1.44, 0.78, 2.57, 2.39, 3.37, 0.03, 4.77, -0.19, 0.26, 0.81, 2.12, 1.01, 1.24, 2.18, 3.72, 1.27, 2.37, 0.55, 0.87, 2.97, 13.28, 1.24, 0.46, 0.57, 1.26, 1.25, 1.21, 2.16]} \ No newline at end of file diff --git a/annotations_filtered/kDnCoiYKmtw_filtered.json b/annotations_filtered/kDnCoiYKmtw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7783521981eee29b056d169af4a8bc6b3df03d5c --- /dev/null +++ b/annotations_filtered/kDnCoiYKmtw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.51], [6.0, 5.73], [16.0, 17.02], [19.0, 19.11], [20.0, 20.34], [25.0, 26.64], [38.0, 38.43], [39.0, 39.85], [72.0, 73.01], [76.0, 76.86], [82.0, 98.59], [101.0, 102.09], [103.0, 104.13], [108.0, 109.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.79, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["throbbing", 49.17], ["hum", 34.06], ["mains hum", 7.38]], null, null, null], "duration": [0.51, -0.27, 1.02, 0.11, 0.34, 1.64, 0.43, 0.85, 1.01, 0.86, 16.59, 1.09, 1.13, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/kDtabTufxao_filtered.json b/annotations_filtered/kDtabTufxao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56d2261c1ea1a23fb85899a5efc9df2dd119c8b2 --- /dev/null +++ b/annotations_filtered/kDtabTufxao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.47], [5.0, 9.48], [11.0, 10.69], [13.0, 13.73], [16.0, 16.09], [19.0, 20.63], [22.0, 22.06], [27.0, 27.33], [29.0, 31.36], [32.0, 33.08], [34.0, 34.69], [39.0, 40.42], [42.0, 43.01], [46.0, 48.17], [51.0, 51.51], [54.0, 55.21], [56.0, 61.92], [63.0, 64.84], [66.0, 66.11], [68.0, 68.54], [69.0, 86.49], [88.0, 89.56], [93.0, 99.39], [101.0, 101.26], [104.0, 105.14], [108.0, 115.08], [117.0, 119.43], [123.0, 124.11], [127.0, 128.28], [131.0, 133.34], [135.0, 135.3], [138.0, 139.11], [140.0, 144.0], [145.0, 146.84], [148.0, 150.79], [160.0, 162.99], [166.0, 179.85], [183.0, 190.43], [202.0, 208.45], [209.0, 210.81], [212.0, 217.09], [218.0, 223.1], [233.0, 233.49], [235.0, 235.08], [238.0, 238.2], [241.0, 241.15], [249.0, 252.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 42.86, 0.0, 0.0, 0.0, 43.0, 0.0, 99.97, 0.0, 0.0, 93.13, 100.0, 0.0, 0.0, 99.78, 0.0, 0.0, 99.1, 0.0, 97.33, 52.98, 43.03, 46.5, 44.34, 0.0, 44.78, 51.34, 0.0, 0.0, 0.0, 0.0, 46.47], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.88], ["didgeridoo", 8.22], ["boing", 7.37]], null, null, null, [["music", 58.32], ["brass instrument", 15.76], ["trombone", 6.84]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 50.23], ["boing", 17.11], ["effects unit", 8.67]], [["music", 70.69], ["didgeridoo", 13.11], ["boing", 2.86]], [["music", 70.3], ["didgeridoo", 4.2], ["brass instrument", 2.85]], null, [["music", 81.92], ["brass instrument", 6.02], ["musical instrument", 2.94]], null, null, null, null, null, [["music", 75.89], ["didgeridoo", 3.59], ["musical instrument", 2.81]]], "duration": [0.47, 4.48, -0.31, 0.73, 0.09, 1.63, 0.06, 0.33, 2.36, 1.08, 0.69, 1.42, 1.01, 2.17, 0.51, 1.21, 5.92, 1.84, 0.11, 0.54, 17.49, 1.56, 6.39, 0.26, 1.14, 7.08, 2.43, 1.11, 1.28, 2.34, 0.3, 1.11, 4.0, 1.84, 2.79, 2.99, 13.85, 7.43, 6.45, 1.81, 5.09, 5.1, 0.49, 0.08, 0.2, 0.15, 3.88]} \ No newline at end of file diff --git a/annotations_filtered/kEL5reRoNk8_filtered.json b/annotations_filtered/kEL5reRoNk8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4aa8eb6a137475bfacf4070887912b86a0d4ab12 --- /dev/null +++ b/annotations_filtered/kEL5reRoNk8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.88], [18.0, 20.38], [22.0, 24.78], [26.0, 28.97], [31.0, 39.72], [53.0, 54.23], [56.0, 72.71]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 78.72, 74.44, 77.36, 52.68, 0.0, 30.84], "audiomae_on_audioset": [null, null, null, null, null, null, [["cattle, bovinae", 28.81], ["livestock, farm animals, working animals", 24.34], ["moo", 23.84]]], "duration": [0.88, 2.38, 2.78, 2.97, 8.72, 1.23, 16.71]} \ No newline at end of file diff --git a/annotations_filtered/kELmSLtEiiI_filtered.json b/annotations_filtered/kELmSLtEiiI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b6bf5e873d2c074c8a90c079cb7bf8f9535d63e --- /dev/null +++ b/annotations_filtered/kELmSLtEiiI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 13.04], [14.0, 15.3], [16.0, 17.36], [19.0, 44.05], [44.0, 46.14], [51.0, 51.51], [53.0, 57.86], [58.0, 58.82], [59.0, 61.06], [64.0, 64.99], [66.0, 66.38], [67.0, 78.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [52.98, 0.0, 0.0, 47.39, 63.96, 0.0, 77.2, 0.0, 58.13, 0.0, 0.0, 42.67], "audiomae_on_audioset": [null, null, null, [["music", 54.59], ["theremin", 14.23], ["synthesizer", 3.84]], null, null, null, null, null, null, null, [["music", 62.42], ["synthesizer", 7.68], ["musical instrument", 4.9]]], "duration": [6.04, 1.3, 1.36, 25.05, 2.14, 0.51, 4.86, 0.82, 2.06, 0.99, 0.38, 11.95]} \ No newline at end of file diff --git a/annotations_filtered/kEnK0ZdMThc_filtered.json b/annotations_filtered/kEnK0ZdMThc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..682fb180f6a0aeff5687419940455ca345646680 --- /dev/null +++ b/annotations_filtered/kEnK0ZdMThc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[68.0, 74.24], [76.0, 82.51], [85.0, 84.99], [86.0, 87.42], [88.0, 88.37], [91.0, 92.37], [93.0, 97.11], [102.0, 103.18], [105.0, 113.66], [116.0, 115.94], [120.0, 131.19], [133.0, 168.44], [169.0, 168.81], [169.0, 169.6]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [30.14, 35.62, 0.0, 0.0, 0.0, 0.0, 35.7, 0.0, 34.85, 0.0, 27.81, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 44.49], ["hum", 13.41], ["ambient music", 8.34]], [["throbbing", 31.3], ["hum", 23.67], ["music", 20.64]], null, null, null, null, [["music", 29.09], ["throbbing", 23.55], ["hum", 18.54]], null, [["throbbing", 37.46], ["music", 35.27], ["hum", 8.76]], null, [["eruption", 14.76], ["breaking", 12.17], ["smash, crash", 7.08]], null, null, null], "duration": [6.24, 6.51, -0.01, 1.42, 0.37, 1.37, 4.11, 1.18, 8.66, -0.06, 11.19, 35.44, -0.19, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/kEsfYG_bF-E_filtered.json b/annotations_filtered/kEsfYG_bF-E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1095f10b78ed0386e456cb504582cf6cdd3aa3c3 --- /dev/null +++ b/annotations_filtered/kEsfYG_bF-E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.5], [12.0, 12.23], [13.0, 13.07], [19.0, 20.11], [21.0, 21.1], [22.0, 22.77], [24.0, 25.27], [27.0, 28.24], [31.0, 32.66], [34.0, 33.72], [37.0, 37.86], [42.0, 43.26], [48.0, 48.29], [51.0, 51.04], [53.0, 57.52], [59.0, 59.9], [64.0, 64.69], [66.0, 67.32], [68.0, 83.83], [97.0, 97.51], [103.0, 105.6], [107.0, 108.8], [109.0, 117.14], [120.0, 120.45], [122.0, 123.48], [125.0, 126.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.78, 0.0, 0.0, 0.0, 30.91, 0.0, 38.93, 0.0, 34.23, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.42], ["musical instrument", 8.5], ["synthesizer", 4.13]], null, null, null, [["music", 68.81], ["didgeridoo", 19.05], ["musical instrument", 6.16]], null, [["music", 54.16], ["theremin", 6.99], ["musical instrument", 4.3]], null, [["music", 64.35], ["synthesizer", 5.64], ["musical instrument", 4.81]], null, null, null], "duration": [0.5, 0.23, 0.07, 1.11, 0.1, 0.77, 1.27, 1.24, 1.66, -0.28, 0.86, 1.26, 0.29, 0.04, 4.52, 0.9, 0.69, 1.32, 15.83, 0.51, 2.6, 1.8, 8.14, 0.45, 1.48, 1.25]} \ No newline at end of file diff --git a/annotations_filtered/kF-KLIi97Uc_filtered.json b/annotations_filtered/kF-KLIi97Uc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90bff9ce570555b82d8d7d7a060573cb8ded4efb --- /dev/null +++ b/annotations_filtered/kF-KLIi97Uc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.0], [5.0, 5.1], [6.0, 7.92], [8.0, 8.45], [10.0, 10.66], [11.0, 11.75], [22.0, 22.15], [52.0, 57.92], [62.0, 61.64], [77.0, 78.19], [79.0, 80.43], [84.0, 85.58], [92.0, 92.72]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.07, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 43.54], ["speech", 11.46], ["effects unit", 6.39]], null, null, null, null, null], "duration": [0.0, 0.1, 1.92, 0.45, 0.66, 0.75, 0.15, 5.92, -0.36, 1.19, 1.43, 1.58, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/kFCUCnNKmmI_filtered.json b/annotations_filtered/kFCUCnNKmmI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d61abc4b4a83e20fb4cc9420ada98f2fa67fe4b --- /dev/null +++ b/annotations_filtered/kFCUCnNKmmI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.01], [4.0, 4.65], [10.0, 11.1], [13.0, 15.65], [23.0, 23.41], [31.0, 34.64], [36.0, 36.81], [46.0, 48.09], [49.0, 52.34], [53.0, 53.89], [65.0, 65.77], [72.0, 72.84], [74.0, 74.6], [76.0, 76.74], [79.0, 79.81], [87.0, 87.72], [91.0, 92.04], [93.0, 99.84], [105.0, 106.46], [107.0, 109.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 80.29, 0.0, 100.0, 99.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.52, 0.0, 74.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.01, 0.65, 1.1, 2.65, 0.41, 3.64, 0.81, 2.09, 3.34, 0.89, 0.77, 0.84, 0.6, 0.74, 0.81, 0.72, 1.04, 6.84, 1.46, 2.41]} \ No newline at end of file diff --git a/annotations_filtered/kFFuJQRlm38_filtered.json b/annotations_filtered/kFFuJQRlm38_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b666f01bbbf12e3054eef41ae2cf5bec913c778 --- /dev/null +++ b/annotations_filtered/kFFuJQRlm38_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.48], [3.0, 5.53], [10.0, 10.83], [11.0, 11.87], [13.0, 13.26], [14.0, 14.71], [16.0, 17.42], [21.0, 22.52], [23.0, 33.83], [36.0, 36.15], [38.0, 38.48], [39.0, 40.66], [42.0, 43.11], [45.0, 45.59], [48.0, 48.24], [50.0, 50.8], [53.0, 53.72], [54.0, 55.0], [56.0, 56.83], [57.0, 59.81], [61.0, 63.09], [65.0, 65.75], [66.0, 67.42], [68.0, 68.49], [69.0, 70.24], [72.0, 71.95], [75.0, 76.82], [80.0, 80.65], [81.0, 82.68], [84.0, 85.33], [88.0, 88.15], [90.0, 90.24], [98.0, 97.73], [99.0, 99.69], [107.0, 107.77], [108.0, 108.57], [113.0, 115.62], [119.0, 120.68], [121.0, 125.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.64, 91.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.65], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 2.53, 0.83, 0.87, 0.26, 0.71, 1.42, 1.52, 10.83, 0.15, 0.48, 1.66, 1.11, 0.59, 0.24, 0.8, 0.72, 1.0, 0.83, 2.81, 2.09, 0.75, 1.42, 0.49, 1.24, -0.05, 1.82, 0.65, 1.68, 1.33, 0.15, 0.24, -0.27, 0.69, 0.77, 0.57, 2.62, 1.68, 4.42]} \ No newline at end of file diff --git a/annotations_filtered/kFa1DI_4vEs_filtered.json b/annotations_filtered/kFa1DI_4vEs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d002f42625e660595eb016689fb0e014bdddc00 --- /dev/null +++ b/annotations_filtered/kFa1DI_4vEs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.59], [15.0, 26.11], [28.0, 27.99], [29.0, 51.95], [56.0, 57.45], [60.0, 61.01], [63.0, 64.07], [65.0, 68.77], [70.0, 86.97], [88.0, 92.5], [94.0, 95.66], [96.0, 102.22], [108.0, 119.69], [121.0, 124.39]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [77.2, 77.2, 0.0, 99.31, 0.0, 0.0, 0.0, 98.8, 43.25, 99.99, 0.0, 100.0, 94.52, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 52.63], ["sidetone", 5.82], ["music", 5.56]], null, null, null, null, null], "duration": [2.59, 11.11, -0.01, 22.95, 1.45, 1.01, 1.07, 3.77, 16.97, 4.5, 1.66, 6.22, 11.69, 3.39]} \ No newline at end of file diff --git a/annotations_filtered/kFbDy90VZQY_filtered.json b/annotations_filtered/kFbDy90VZQY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60c9af075d6c5fa557e0a465abfc7a24969a49f6 --- /dev/null +++ b/annotations_filtered/kFbDy90VZQY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.94], [8.0, 8.83], [10.0, 9.85], [19.0, 20.02], [21.0, 22.2], [23.0, 38.42], [39.0, 46.99], [51.0, 53.99], [60.0, 62.45], [71.0, 77.5], [79.0, 78.87], [84.0, 88.53], [89.0, 100.04], [104.0, 105.56], [108.0, 109.26], [117.0, 118.32], [120.0, 123.38], [130.0, 132.73], [133.0, 133.47]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 30.08, 31.52, 33.61, 34.75, 29.68, 0.0, 30.3, 39.35, 0.0, 0.0, 0.0, 44.04, 43.35, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 54.93], ["speech", 15.72], ["buzz", 3.78]], [["music", 31.28], ["hum", 25.75], ["throbbing", 13.6]], [["music", 34.22], ["noise", 8.94], ["hum", 6.5]], [["music", 42.82], ["brass instrument", 8.63], ["trombone", 6.24]], [["music", 79.62], ["musical instrument", 4.22], ["foghorn", 2.22]], null, [["music", 50.5], ["didgeridoo", 14.47], ["pulse", 6.28]], [["music", 50.43], ["speech", 24.03], ["hum", 6.72]], null, null, null, [["music", 42.25], ["whale vocalization", 11.23], ["theremin", 6.07]], [["music", 49.09], ["hum", 7.15], ["ambient music", 4.7]], null], "duration": [0.94, 0.83, -0.15, 1.02, 1.2, 15.42, 7.99, 2.99, 2.45, 6.5, -0.13, 4.53, 11.04, 1.56, 1.26, 1.32, 3.38, 2.73, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/kFeduM49hBY_filtered.json b/annotations_filtered/kFeduM49hBY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e585a0211eb4d31a7c41156e33e619d1a9233776 --- /dev/null +++ b/annotations_filtered/kFeduM49hBY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.12], [3.0, 6.3], [7.0, 7.52], [8.0, 8.45], [9.0, 24.53], [26.0, 26.49], [29.0, 95.72], [96.0, 95.77]], "keep_status": [false, true, false, false, true, false, false, false], "silence_prob": [0.0, 30.95, 0.0, 0.0, 29.82, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 44.76], ["buzz", 10.84], ["sound effect", 5.23]], null, null, [["speech", 47.21], ["buzz", 10.32], ["fly, housefly", 9.27]], null, null, null], "duration": [0.12, 3.3, 0.52, 0.45, 15.53, 0.49, 66.72, -0.23]} \ No newline at end of file diff --git a/annotations_filtered/kFhDGoJh4O4_filtered.json b/annotations_filtered/kFhDGoJh4O4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b81dfd50631831245d9f390e09b28a732396df9a --- /dev/null +++ b/annotations_filtered/kFhDGoJh4O4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.56], [7.0, 9.78], [11.0, 13.09], [15.0, 16.58], [19.0, 23.75], [25.0, 26.5], [28.0, 29.81], [32.0, 35.61], [37.0, 38.26], [39.0, 39.45], [41.0, 47.78], [51.0, 53.86], [54.0, 56.66], [59.0, 71.59], [72.0, 73.2], [74.0, 75.34], [77.0, 77.84], [78.0, 79.41], [81.0, 84.03], [85.0, 86.9], [88.0, 88.35], [90.0, 90.22], [91.0, 95.61], [97.0, 97.01], [98.0, 98.83], [99.0, 101.14], [102.0, 102.34], [103.0, 105.11], [108.0, 108.11], [111.0, 112.08], [113.0, 114.54], [115.0, 116.8], [120.0, 121.46], [125.0, 125.1], [125.0, 125.46], [127.0, 128.39], [131.0, 136.98], [139.0, 140.07], [141.0, 142.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.97, 80.82, 0.0, 98.1, 0.0, 0.0, 98.36, 0.0, 0.0, 95.91, 99.44, 57.64, 99.1, 0.0, 0.0, 0.0, 0.0, 89.19, 0.0, 0.0, 0.0, 38.33, 0.0, 0.0, 98.27, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.61, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 54.05], ["dial tone", 16.53], ["sine wave", 16.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.56, 2.78, 2.09, 1.58, 4.75, 1.5, 1.81, 3.61, 1.26, 0.45, 6.78, 2.86, 2.66, 12.59, 1.2, 1.34, 0.84, 1.41, 3.03, 1.9, 0.35, 0.22, 4.61, 0.01, 0.83, 2.14, 0.34, 2.11, 0.11, 1.08, 1.54, 1.8, 1.46, 0.1, 0.46, 1.39, 5.98, 1.07, 1.67]} \ No newline at end of file diff --git a/annotations_filtered/kFhIMrW1Yk4_filtered.json b/annotations_filtered/kFhIMrW1Yk4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54a5b3d47598c1b2a5c12bc6f2d7f49b67b4d258 --- /dev/null +++ b/annotations_filtered/kFhIMrW1Yk4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.97]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [1.97]} \ No newline at end of file diff --git a/annotations_filtered/kFuzbEylajA_filtered.json b/annotations_filtered/kFuzbEylajA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d736725f5741ba5396e622c66417748714734425 --- /dev/null +++ b/annotations_filtered/kFuzbEylajA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.15], [30.0, 33.18], [38.0, 38.38], [39.0, 39.11], [41.0, 41.64], [49.0, 49.37], [53.0, 57.08], [60.0, 60.98], [64.0, 64.3], [66.0, 69.13], [84.0, 84.75], [85.0, 86.68], [92.0, 94.2], [98.0, 97.85], [105.0, 105.33], [115.0, 115.35]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 84.62, 0.0, 0.0, 0.0, 0.0, 31.92, 0.0, 0.0, 34.63, 0.0, 0.0, 87.92, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 48.78], ["boing", 9.18], ["musical instrument", 7.31]], null, null, [["music", 42.91], ["speech", 12.99], ["musical instrument", 2.79]], null, null, null, null, null, null], "duration": [0.15, 3.18, 0.38, 0.11, 0.64, 0.37, 4.08, 0.98, 0.3, 3.13, 0.75, 1.68, 2.2, -0.15, 0.33, 0.35]} \ No newline at end of file diff --git a/annotations_filtered/kG8GuXOjIPA_filtered.json b/annotations_filtered/kG8GuXOjIPA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..593b76ae1b7e9d0c5238ba0d97b79bd7f1a53c9a --- /dev/null +++ b/annotations_filtered/kG8GuXOjIPA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 36.88], [38.0, 40.09], [46.0, 47.14], [49.0, 57.89], [60.0, 62.11], [63.0, 64.94], [68.0, 76.45], [82.0, 87.98]], "keep_status": [false, false, false, false, true, false, true, true], "silence_prob": [0.0, 85.35, 0.0, 29.92, 45.08, 0.0, 28.07, 30.25], "audiomae_on_audioset": [null, null, null, [["explosion", 68.14], ["burst, pop", 14.72], ["speech", 4.17]], [["grunt", 12.69], ["animal", 7.95], ["roaring cats (lions, tigers)", 5.29]], null, [["music", 15.73], ["buzz", 6.87], ["rumble", 6.55]], [["explosion", 26.77], ["music", 14.28], ["hum", 9.55]]], "duration": [0.88, 2.09, 1.14, 8.89, 2.11, 1.94, 8.45, 5.98]} \ No newline at end of file diff --git a/annotations_filtered/kGVQE0m_V3A_filtered.json b/annotations_filtered/kGVQE0m_V3A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e36c6b3e73069cc0309ce060a5dab98d4ec72224 --- /dev/null +++ b/annotations_filtered/kGVQE0m_V3A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 22.33], [24.0, 47.44], [48.0, 49.79], [51.0, 51.34], [52.0, 53.13], [55.0, 57.4], [59.0, 61.67], [63.0, 64.02], [67.0, 69.15], [72.0, 72.64], [73.0, 75.12], [77.0, 77.45], [80.0, 81.19], [82.0, 83.69], [85.0, 85.24], [87.0, 87.61], [90.0, 89.94], [91.0, 91.71], [93.0, 92.75], [93.0, 93.95], [95.0, 94.93], [95.0, 95.44], [97.0, 97.39], [98.0, 101.68], [103.0, 105.66], [107.0, 108.63], [109.0, 109.38], [111.0, 111.75], [113.0, 113.76]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.89, 29.03, 0.0, 0.0, 0.0, 80.82, 100.0, 0.0, 97.0, 0.0, 32.49, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.37, 99.99, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 47.25], ["hum", 11.82], ["throbbing", 8.0]], [["music", 46.45], ["speech", 38.78], ["firecracker", 1.61]], null, null, null, null, null, null, null, null, [["whale vocalization", 68.19], ["noise", 4.03], ["stomach rumble", 2.77]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [19.33, 23.44, 1.79, 0.34, 1.13, 2.4, 2.67, 1.02, 2.15, 0.64, 2.12, 0.45, 1.19, 1.69, 0.24, 0.61, -0.06, 0.71, -0.25, 0.95, -0.07, 0.44, 0.39, 3.68, 2.66, 1.63, 0.38, 0.75, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/kGViaTOfSow_filtered.json b/annotations_filtered/kGViaTOfSow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..052793545e1341cd0c299a577358bac7d6dee1c2 --- /dev/null +++ b/annotations_filtered/kGViaTOfSow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.42], [16.0, 22.62], [28.0, 28.76], [30.0, 34.4], [36.0, 37.59], [38.0, 42.11], [46.0, 46.31], [50.0, 50.55], [62.0, 62.09], [65.0, 66.07], [68.0, 68.88], [71.0, 71.47], [77.0, 77.5], [82.0, 82.34], [86.0, 86.86], [93.0, 94.73], [100.0, 100.18], [102.0, 103.65], [106.0, 106.56], [109.0, 110.29], [112.0, 111.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.68, 0.0, 30.76, 0.0, 31.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 69.08], ["throbbing", 5.99], ["didgeridoo", 5.72]], null, [["music", 64.53], ["singing", 3.17], ["musical instrument", 2.35]], null, [["music", 69.11], ["musical instrument", 2.72], ["psychedelic rock", 1.83]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.42, 6.62, 0.76, 4.4, 1.59, 4.11, 0.31, 0.55, 0.09, 1.07, 0.88, 0.47, 0.5, 0.34, 0.86, 1.73, 0.18, 1.65, 0.56, 1.29, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/kGot2YelCpE_filtered.json b/annotations_filtered/kGot2YelCpE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19c5b5c714f8a1b14650f5fb92042c5472469865 --- /dev/null +++ b/annotations_filtered/kGot2YelCpE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.43], [11.0, 11.37], [16.0, 17.81], [40.0, 50.01], [59.0, 61.42], [61.0, 61.47], [61.0, 61.5], [62.0, 64.25], [79.0, 87.29], [89.0, 89.45], [90.0, 89.55], [90.0, 89.58], [90.0, 89.61], [90.0, 92.87], [96.0, 111.15], [113.0, 113.0], [113.0, 123.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.4, 35.28, 0.0, 0.0, 37.08, 34.47, 0.0, 0.0, 0.0, 0.0, 33.46, 35.54, 0.0, 32.69], "audiomae_on_audioset": [null, null, null, [["music", 68.96], ["electronic music", 8.77], ["speech", 4.98]], [["music", 54.08], ["speech", 11.1], ["sidetone", 8.05]], null, null, [["music", 32.04], ["speech", 21.78], ["sidetone", 21.77]], [["music", 57.21], ["speech", 16.24], ["electronic music", 8.19]], null, null, null, null, [["music", 43.57], ["speech", 19.52], ["sidetone", 7.32]], [["music", 56.05], ["speech", 9.34], ["electronic music", 8.18]], null, [["cattle, bovinae", 34.11], ["moo", 30.28], ["livestock, farm animals, working animals", 15.25]]], "duration": [0.43, 0.37, 1.81, 10.01, 2.42, 0.47, 0.5, 2.25, 8.29, 0.45, -0.45, -0.42, -0.39, 2.87, 15.15, 0.0, 10.35]} \ No newline at end of file diff --git a/annotations_filtered/kGpNxt3bD6E_filtered.json b/annotations_filtered/kGpNxt3bD6E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3fa428c1e7a121cd456beb50983356fcd71309d3 --- /dev/null +++ b/annotations_filtered/kGpNxt3bD6E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.1], [11.0, 11.5], [17.0, 17.66], [32.0, 33.07], [34.0, 35.94], [40.0, 43.34], [49.0, 49.2], [50.0, 63.61], [64.0, 65.03]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.05, 0.0, 30.06, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 47.41], ["speech", 15.4], ["didgeridoo", 9.53]], null, [["music", 76.04], ["animal", 2.39], ["moo", 1.63]], null], "duration": [0.1, 0.5, 0.66, 1.07, 1.94, 3.34, 0.2, 13.61, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/kH6SUxCwXzs_filtered.json b/annotations_filtered/kH6SUxCwXzs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa98b65023680b8c2a9571414fef8aa713c04120 --- /dev/null +++ b/annotations_filtered/kH6SUxCwXzs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.88], [5.0, 6.93], [11.0, 10.98], [17.0, 20.71], [26.0, 26.92], [27.0, 28.34], [34.0, 34.47], [37.0, 37.5], [38.0, 39.18], [41.0, 44.54], [47.0, 48.15], [50.0, 51.09], [54.0, 58.82], [61.0, 65.72], [67.0, 67.15], [70.0, 70.23], [71.0, 72.4], [76.0, 76.74], [94.0, 96.47], [97.0, 98.79], [101.0, 101.04], [109.0, 109.66], [111.0, 111.42], [112.0, 114.4], [116.0, 117.04], [118.0, 118.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0, 0.0, 0.0, 98.27, 0.0, 0.0, 97.92, 99.4, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 99.31, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.12, 1.93, -0.02, 3.71, 0.92, 1.34, 0.47, 0.5, 1.18, 3.54, 1.15, 1.09, 4.82, 4.72, 0.15, 0.23, 1.4, 0.74, 2.47, 1.79, 0.04, 0.66, 0.42, 2.4, 1.04, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/kHQq6ri9MDI_filtered.json b/annotations_filtered/kHQq6ri9MDI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41e59d2df508d8e4dd0059a71e1d4499d78020ba --- /dev/null +++ b/annotations_filtered/kHQq6ri9MDI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 14.94], [15.0, 16.63], [18.0, 19.52], [20.0, 21.37], [23.0, 31.02], [32.0, 33.42], [34.0, 36.17], [37.0, 100.06], [102.0, 112.11], [113.0, 115.32], [117.0, 129.44], [132.0, 133.74], [135.0, 136.43], [138.0, 139.83], [141.0, 143.88], [146.0, 145.77]], "keep_status": [false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 47.12, 0.0, 55.89, 0.0, 28.74, 35.96, 31.14, 0.0, 0.0, 0.0, 69.07, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 69.9], ["hum", 5.24], ["ambient music", 2.88]], null, null, null, [["clang", 18.59], ["music", 17.56], ["ding", 13.24]], [["chirp tone", 20.62], ["speech", 14.16], ["music", 9.41]], [["music", 30.17], ["burst, pop", 21.98], ["explosion", 9.68]], null, null, null, null, null], "duration": [-0.06, 1.63, 1.52, 1.37, 8.02, 1.42, 2.17, 63.06, 10.11, 2.32, 12.44, 1.74, 1.43, 1.83, 2.88, -0.23]} \ No newline at end of file diff --git a/annotations_filtered/kHRSh7JOKxo_filtered.json b/annotations_filtered/kHRSh7JOKxo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1a89c8ad685d60981f6160fd5855baedad1346b --- /dev/null +++ b/annotations_filtered/kHRSh7JOKxo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.94], [6.0, 6.62], [8.0, 9.81], [10.0, 11.43], [13.0, 13.49], [14.0, 16.07], [27.0, 28.0], [36.0, 37.61], [38.0, 38.48], [41.0, 40.98], [43.0, 43.88], [45.0, 45.1], [47.0, 48.78], [52.0, 52.49], [55.0, 56.0], [56.0, 57.03], [59.0, 61.1], [62.0, 62.45], [64.0, 65.28], [69.0, 69.75], [71.0, 72.23], [73.0, 75.14], [76.0, 78.04], [79.0, 79.41], [79.0, 79.47], [80.0, 82.17], [83.0, 84.38], [85.0, 87.88], [89.0, 90.05], [91.0, 91.3], [92.0, 93.11], [94.0, 94.07], [95.0, 96.4], [99.0, 100.67], [101.0, 103.13], [104.0, 106.61], [110.0, 114.0], [114.0, 115.87], [119.0, 120.83], [122.0, 123.16], [126.0, 128.49], [131.0, 132.31], [133.0, 133.91], [135.0, 137.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 95.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 98.66, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.99, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.94, 0.62, 1.81, 1.43, 0.49, 2.07, 1.0, 1.61, 0.48, -0.02, 0.88, 0.1, 1.78, 0.49, 1.0, 1.03, 2.1, 0.45, 1.28, 0.75, 1.23, 2.14, 2.04, 0.41, 0.47, 2.17, 1.38, 2.88, 1.05, 0.3, 1.11, 0.07, 1.4, 1.67, 2.13, 2.61, 4.0, 1.87, 1.83, 1.16, 2.49, 1.31, 0.91, 2.15]} \ No newline at end of file diff --git a/annotations_filtered/kHRe9qdfLsw_filtered.json b/annotations_filtered/kHRe9qdfLsw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8a745f411b9fcc9046fcbb17c4e0c1d39408a38 --- /dev/null +++ b/annotations_filtered/kHRe9qdfLsw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[51.0, 51.51], [52.0, 74.46], [75.0, 75.88], [76.0, 83.15], [86.0, 145.2]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 57.89, 0.0, 46.83, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 69.08], ["theremin", 6.52], ["synthesizer", 6.41]], null], "duration": [0.51, 22.46, 0.88, 7.15, 59.2]} \ No newline at end of file diff --git a/annotations_filtered/kHTAJHod8-g_filtered.json b/annotations_filtered/kHTAJHod8-g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8fb6ac76c0169bb1e4704d8266e6317a864be87d --- /dev/null +++ b/annotations_filtered/kHTAJHod8-g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.07], [18.0, 21.03], [22.0, 22.52], [32.0, 35.31], [36.0, 40.1], [43.0, 44.52], [47.0, 49.87], [51.0, 51.97], [54.0, 55.16], [63.0, 64.05], [70.0, 70.7], [71.0, 72.66], [74.0, 75.25], [76.0, 76.32], [79.0, 79.73], [91.0, 91.35], [93.0, 93.8], [106.0, 106.39], [112.0, 114.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 99.98, 99.93, 0.0, 84.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.07, 3.03, 0.52, 3.31, 4.1, 1.52, 2.87, 0.97, 1.16, 1.05, 0.7, 1.66, 1.25, 0.32, 0.73, 0.35, 0.8, 0.39, 2.0]} \ No newline at end of file diff --git a/annotations_filtered/kHk2-mOOYQg_filtered.json b/annotations_filtered/kHk2-mOOYQg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0243251493b713207dd6ff77b4e331c380c541af --- /dev/null +++ b/annotations_filtered/kHk2-mOOYQg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.45], [7.0, 9.21], [10.0, 15.33], [31.0, 32.68], [33.0, 33.78], [43.0, 42.94], [46.0, 48.0], [52.0, 53.32], [54.0, 56.3], [57.0, 62.68], [63.0, 64.56], [66.0, 66.45], [71.0, 72.13], [74.0, 75.19], [82.0, 83.13], [85.0, 88.45], [90.0, 90.27], [92.0, 106.96], [111.0, 127.62], [129.0, 129.03]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.05, 44.93, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 37.47, 45.4, 0.0], "audiomae_on_audioset": [null, [["speech", 58.05], ["throbbing", 7.78], ["music", 5.13]], [["hum", 23.82], ["music", 15.04], ["throbbing", 14.99]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 81.26], ["reggae", 2.85], ["psychedelic rock", 1.34]], [["music", 60.96], ["fly, housefly", 8.85], ["insect", 5.3]], null], "duration": [0.45, 2.21, 5.33, 1.68, 0.78, -0.06, 2.0, 1.32, 2.3, 5.68, 1.56, 0.45, 1.13, 1.19, 1.13, 3.45, 0.27, 14.96, 16.62, 0.03]} \ No newline at end of file diff --git a/annotations_filtered/kHq3y20HhRk_filtered.json b/annotations_filtered/kHq3y20HhRk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0514f0423f45312bbcf70e508e1acc8c3cb62c0 --- /dev/null +++ b/annotations_filtered/kHq3y20HhRk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 18.18], [25.0, 55.81], [61.0, 72.54], [74.0, 100.95]], "keep_status": [false, false, false, false], "silence_prob": [30.68, 0.0, 29.98, 30.26], "audiomae_on_audioset": [[["speech", 69.5], ["music", 4.69], ["hum", 3.98]], null, [["speech", 35.63], ["vehicle", 24.89], ["car", 15.54]], [["music", 47.95], ["speech", 27.81], ["cacophony", 6.48]]], "duration": [9.18, 30.81, 11.54, 26.95]} \ No newline at end of file diff --git a/annotations_filtered/kI9rnng7ns0_filtered.json b/annotations_filtered/kI9rnng7ns0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..441615180f5d881faf95846e9fb3b557cbc973e0 --- /dev/null +++ b/annotations_filtered/kI9rnng7ns0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.59], [9.0, 12.14], [15.0, 16.09], [17.0, 19.74], [22.0, 55.51], [69.0, 71.47], [73.0, 75.76], [77.0, 77.92], [79.0, 81.31], [82.0, 83.83]], "keep_status": [false, false, false, true, false, true, true, false, false, false], "silence_prob": [0.0, 82.61, 0.0, 46.57, 0.0, 40.95, 40.22, 0.0, 70.16, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 22.57], ["speech", 20.34], ["music", 17.64]], null, [["music", 17.32], ["mains hum", 11.7], ["hum", 10.98]], [["whale vocalization", 16.12], ["hum", 11.13], ["chirp tone", 9.92]], null, null, null], "duration": [0.59, 3.14, 1.09, 2.74, 33.51, 2.47, 2.76, 0.92, 2.31, 1.83]} \ No newline at end of file diff --git a/annotations_filtered/kIIY1-f_rBg_filtered.json b/annotations_filtered/kIIY1-f_rBg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..185fc877e1d26f497a1b6101a038f4d774456c53 --- /dev/null +++ b/annotations_filtered/kIIY1-f_rBg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.27], [2.0, 2.79], [3.0, 5.43], [9.0, 12.33], [28.0, 28.75], [36.0, 40.95], [41.0, 42.74], [44.0, 44.93], [47.0, 49.18], [51.0, 52.1], [55.0, 56.64], [58.0, 58.7], [61.0, 62.11], [64.0, 64.93], [67.0, 68.64], [70.0, 94.14], [95.0, 100.84], [106.0, 107.16], [110.0, 124.23], [129.0, 147.51], [150.0, 154.58]], "keep_status": [false, false, true, true, false, true, false, false, true, false, false, false, false, false, false, true, true, false, true, false, false], "silence_prob": [0.0, 0.0, 31.08, 29.0, 0.0, 33.07, 0.0, 0.0, 37.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.5, 28.48, 0.0, 28.93, 28.96, 29.2], "audiomae_on_audioset": [null, null, [["music", 11.82], ["whale vocalization", 5.38], ["buzz", 5.22]], [["whack, thwack", 29.28], ["fly, housefly", 8.3], ["groan", 5.69]], null, [["livestock, farm animals, working animals", 32.27], ["whale vocalization", 12.34], ["cattle, bovinae", 8.08]], null, null, [["whale vocalization", 34.35], ["speech", 14.41], ["cattle, bovinae", 11.36]], null, null, null, null, null, null, [["music", 29.34], ["speech", 18.19], ["didgeridoo", 8.85]], [["music", 52.0], ["electronic music", 7.93], ["buzz", 4.38]], null, [["music", 40.76], ["cattle, bovinae", 11.36], ["speech", 11.29]], [["music", 72.39], ["electronic music", 4.21], ["throbbing", 3.83]], [["music", 63.66], ["speech", 5.25], ["electronic music", 4.44]]], "duration": [1.27, 0.79, 2.43, 3.33, 0.75, 4.95, 1.74, 0.93, 2.18, 1.1, 1.64, 0.7, 1.11, 0.93, 1.64, 24.14, 5.84, 1.16, 14.23, 18.51, 4.58]} \ No newline at end of file diff --git a/annotations_filtered/kIUgcwJeN5A_filtered.json b/annotations_filtered/kIUgcwJeN5A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3c4db1db66361d9ccceb915a113b920890e0093 --- /dev/null +++ b/annotations_filtered/kIUgcwJeN5A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 33.69], [36.0, 36.36], [46.0, 46.55], [49.0, 49.47], [50.0, 50.3], [53.0, 53.6], [56.0, 56.69], [58.0, 58.33], [60.0, 60.07], [63.0, 63.1], [63.0, 63.66], [78.0, 78.7], [84.0, 84.99], [87.0, 87.18], [91.0, 91.5], [95.0, 95.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.69, 0.36, 0.55, 0.47, 0.3, 0.6, 0.69, 0.33, 0.07, 0.1, 0.66, 0.7, 0.99, 0.18, 0.5, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/kItLDGtPMMI_filtered.json b/annotations_filtered/kItLDGtPMMI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37e7d7e9bae63bd73ae824c4304c7d26cc1aaece --- /dev/null +++ b/annotations_filtered/kItLDGtPMMI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.39], [17.0, 17.41], [19.0, 19.5], [20.0, 19.58], [20.0, 19.65], [20.0, 20.73], [22.0, 26.59], [29.0, 29.02], [32.0, 32.53], [33.0, 35.26], [35.0, 41.79], [43.0, 44.47], [46.0, 51.36], [53.0, 55.07], [57.0, 60.71], [62.0, 64.2], [67.0, 70.65], [74.0, 90.0], [91.0, 91.5]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.07, 0.0, 0.0, 47.01, 76.86, 0.0, 84.25, 87.19, 92.15, 96.77, 95.37, 32.5, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 21.98], ["thunk", 20.2], ["music", 14.16]], null, null, [["speech", 33.51], ["bee, wasp, etc.", 6.27], ["fly, housefly", 5.01]], null, null, null, null, null, null, null, [["hum", 40.58], ["music", 11.51], ["mains hum", 10.03]], null], "duration": [1.39, 0.41, 0.5, -0.42, -0.35, 0.73, 4.59, 0.02, 0.53, 2.26, 6.79, 1.47, 5.36, 2.07, 3.71, 2.2, 3.65, 16.0, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/kJ-UZ4DvYBg_filtered.json b/annotations_filtered/kJ-UZ4DvYBg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3b802ae738f97bbe235e1cebd8aaf552a9270e2 --- /dev/null +++ b/annotations_filtered/kJ-UZ4DvYBg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 36.07], [37.0, 37.4], [39.0, 38.92], [40.0, 41.55], [44.0, 44.56], [47.0, 49.74], [51.0, 58.24], [60.0, 63.36], [67.0, 67.19], [69.0, 69.04], [70.0, 71.63], [73.0, 73.7], [76.0, 78.61], [80.0, 81.01], [83.0, 86.14], [88.0, 89.21], [90.0, 91.88], [94.0, 95.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 58.47, 36.8, 100.0, 0.0, 0.0, 0.0, 0.0, 70.86, 0.0, 53.91, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["noise", 47.7], ["music", 23.31], ["hum", 8.85]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.07, 0.4, -0.08, 1.55, 0.56, 2.74, 7.24, 3.36, 0.19, 0.04, 1.63, 0.7, 2.61, 1.01, 3.14, 1.21, 1.88, 1.25]} \ No newline at end of file diff --git a/annotations_filtered/kJEvR6GEb7U_filtered.json b/annotations_filtered/kJEvR6GEb7U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00baf8a4753cd63967ecf9c7b5f173ca8c51c3b4 --- /dev/null +++ b/annotations_filtered/kJEvR6GEb7U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 67.58], [71.0, 74.02], [75.0, 82.58], [85.0, 86.34], [88.0, 90.56], [94.0, 95.57], [96.0, 101.34], [102.0, 105.76], [109.0, 114.83], [115.0, 116.23]], "keep_status": [false, true, false, false, true, false, true, true, false, false], "silence_prob": [0.0, 29.18, 33.33, 0.0, 33.49, 0.0, 33.04, 31.58, 31.01, 0.0], "audiomae_on_audioset": [null, [["music", 34.57], ["vehicle", 12.54], ["car", 9.97]], [["screaming", 40.48], ["groan", 21.79], ["music", 14.28]], null, [["music", 23.59], ["mains hum", 20.01], ["hum", 18.82]], null, [["music", 56.78], ["synthesizer", 5.68], ["cacophony", 4.79]], [["fly, housefly", 18.14], ["insect", 17.47], ["speech", 14.62]], [["music", 41.83], ["mains hum", 29.64], ["hum", 13.86]], null], "duration": [32.58, 3.02, 7.58, 1.34, 2.56, 1.57, 5.34, 3.76, 5.83, 1.23]} \ No newline at end of file diff --git a/annotations_filtered/kJKWjeMtEDM_filtered.json b/annotations_filtered/kJKWjeMtEDM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b10868da6f192622d00918b704559a021dcbd508 --- /dev/null +++ b/annotations_filtered/kJKWjeMtEDM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.12], [3.0, 3.37], [5.0, 6.0], [7.0, 7.79], [10.0, 12.7], [17.0, 27.33], [28.0, 28.9], [31.0, 40.17], [40.0, 41.62], [42.0, 42.82], [45.0, 45.5], [48.0, 48.22], [50.0, 51.58], [53.0, 55.43], [60.0, 84.4], [89.0, 144.75], [146.0, 165.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.31, 52.74, 0.0, 57.81, 0.0, 0.0, 0.0, 0.0, 0.0, 95.23, 33.73, 0.0, 35.87], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 77.53], ["electronic music", 4.77], ["throbbing", 4.7]], null, [["music", 48.85], ["speech", 14.54], ["cacophony", 7.66]]], "duration": [1.12, 0.37, 1.0, 0.79, 2.7, 10.33, 0.9, 9.17, 1.62, 0.82, 0.5, 0.22, 1.58, 2.43, 24.4, 55.75, 19.18]} \ No newline at end of file diff --git a/annotations_filtered/kJg3GP4tH94_filtered.json b/annotations_filtered/kJg3GP4tH94_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1b12717e96bf99fdb516234058f98f1b4ce1462 --- /dev/null +++ b/annotations_filtered/kJg3GP4tH94_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.04], [12.0, 13.39], [14.0, 17.59], [18.0, 48.47], [50.0, 55.0], [56.0, 65.62], [67.0, 69.47], [70.0, 71.68], [74.0, 89.65], [99.0, 99.86], [103.0, 103.5], [104.0, 104.77], [107.0, 108.75], [111.0, 119.4], [120.0, 125.51]], "keep_status": [true, false, false, false, false, false, true, false, true, false, false, false, false, true, true], "silence_prob": [33.38, 0.0, 33.09, 0.0, 30.32, 33.57, 35.06, 0.0, 33.12, 0.0, 0.0, 0.0, 0.0, 39.72, 46.19], "audiomae_on_audioset": [[["music", 40.91], ["speech", 12.82], ["inside, small room", 2.93]], null, [["theremin", 51.33], ["music", 26.15], ["speech", 7.95]], null, [["music", 61.09], ["theremin", 6.15], ["musical instrument", 3.74]], [["music", 42.45], ["theremin", 28.42], ["speech", 5.82]], [["music", 49.94], ["theremin", 8.86], ["musical instrument", 5.85]], null, [["music", 55.65], ["musical instrument", 5.43], ["wind instrument, woodwind instrument", 2.28]], null, null, null, null, [["music", 36.64], ["speech", 9.46], ["throbbing", 5.87]], [["music", 43.61], ["mains hum", 11.44], ["hum", 10.94]]], "duration": [5.04, 1.39, 3.59, 30.47, 5.0, 9.62, 2.47, 1.68, 15.65, 0.86, 0.5, 0.77, 1.75, 8.4, 5.51]} \ No newline at end of file diff --git a/annotations_filtered/kJlqNXhZE_I_filtered.json b/annotations_filtered/kJlqNXhZE_I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e874411dc5d432b8cc9cc4040dd0ae4ab5c4d39a --- /dev/null +++ b/annotations_filtered/kJlqNXhZE_I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.67], [8.0, 7.77], [10.0, 12.56], [13.0, 19.74], [23.0, 24.97], [28.0, 29.61], [32.0, 32.37], [41.0, 40.74], [41.0, 41.54], [42.0, 44.51], [45.0, 47.65], [49.0, 50.87], [53.0, 82.09], [88.0, 87.81], [93.0, 104.04], [105.0, 107.79], [122.0, 130.77], [169.0, 171.22]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false], "silence_prob": [55.39, 0.0, 62.47, 69.34, 0.0, 0.0, 0.0, 0.0, 0.0, 34.18, 48.52, 0.0, 42.58, 0.0, 33.97, 32.0, 34.06, 36.8], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 41.53], ["music", 10.84], ["speech synthesizer", 6.51]], [["mains hum", 32.02], ["hum", 18.71], ["busy signal", 12.53]], null, [["music", 77.22], ["boing", 2.34], ["thunk", 1.64]], null, [["sheep", 16.21], ["bleat", 10.11], ["screaming", 9.89]], [["livestock, farm animals, working animals", 78.88], ["moo", 9.71], ["cattle, bovinae", 5.87]], [["moo", 47.24], ["cattle, bovinae", 23.32], ["livestock, farm animals, working animals", 11.82]], [["music", 67.57], ["musical instrument", 3.62], ["cacophony", 2.4]]], "duration": [3.67, -0.23, 2.56, 6.74, 1.97, 1.61, 0.37, -0.26, 0.54, 2.51, 2.65, 1.87, 29.09, -0.19, 11.04, 2.79, 8.77, 2.22]} \ No newline at end of file diff --git a/annotations_filtered/kJnH45GslL0_filtered.json b/annotations_filtered/kJnH45GslL0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c488781e4d62feb2a4cc2f670e95e53e950fd573 --- /dev/null +++ b/annotations_filtered/kJnH45GslL0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.62], [8.0, 9.27], [14.0, 33.99], [35.0, 36.69], [41.0, 41.39], [45.0, 45.66], [49.0, 52.59], [57.0, 70.61], [72.0, 71.86], [74.0, 75.19], [76.0, 76.82], [79.0, 79.2], [79.0, 79.24], [82.0, 82.71], [86.0, 90.91], [92.0, 102.84], [105.0, 105.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 96.54, 0.0, 0.0, 0.0, 88.46, 71.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.81, 30.69, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 63.79], ["mains hum", 5.67], ["sonar", 3.45]], [["music", 76.82], ["speech", 6.74], ["throbbing", 2.09]], null], "duration": [1.62, 1.27, 19.99, 1.69, 0.39, 0.66, 3.59, 13.61, -0.14, 1.19, 0.82, 0.2, 0.24, 0.71, 4.91, 10.84, 0.27]} \ No newline at end of file diff --git a/annotations_filtered/kJzOYZNQv6M_filtered.json b/annotations_filtered/kJzOYZNQv6M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88c88520fc92e579220c598aa0aca8329516fe08 --- /dev/null +++ b/annotations_filtered/kJzOYZNQv6M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 35.75], [37.0, 37.34], [45.0, 60.05], [62.0, 71.14], [73.0, 85.87], [88.0, 89.87], [90.0, 115.77], [124.0, 127.41], [130.0, 136.95], [137.0, 143.23]], "keep_status": [true, false, true, true, false, false, false, true, true, true], "silence_prob": [32.12, 0.0, 32.15, 33.17, 32.67, 0.0, 32.08, 31.09, 30.43, 37.34], "audiomae_on_audioset": [[["speech", 38.04], ["mains hum", 14.85], ["hum", 6.39]], null, [["music", 35.32], ["speech", 21.45], ["electric shaver, electric razor", 3.56]], [["music", 34.07], ["whack, thwack", 25.58], ["speech", 8.17]], [["music", 53.07], ["breaking", 11.74], ["smash, crash", 9.32]], null, [["speech", 43.74], ["music", 23.85], ["whack, thwack", 2.71]], [["music", 32.41], ["whale vocalization", 6.76], ["vehicle", 3.88]], [["music", 16.08], ["hum", 15.09], ["buzz", 13.97]], [["speech", 30.61], ["music", 20.26], ["hum", 9.52]]], "duration": [25.75, 0.34, 15.05, 9.14, 12.87, 1.87, 25.77, 3.41, 6.95, 6.23]} \ No newline at end of file diff --git a/annotations_filtered/kK6QQIvO9gE_filtered.json b/annotations_filtered/kK6QQIvO9gE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49bfac0e5a77b215b98a64de143dbfd1c14abe1e --- /dev/null +++ b/annotations_filtered/kK6QQIvO9gE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 31.82], [43.0, 47.36], [52.0, 53.76], [55.0, 65.38], [66.0, 68.55]], "keep_status": [false, false, false, true, true], "silence_prob": [0.0, 55.89, 0.0, 47.62, 44.32], "audiomae_on_audioset": [null, null, null, [["noise", 18.27], ["hum", 13.67], ["sidetone", 13.13]], [["music", 22.25], ["didgeridoo", 13.73], ["hum", 13.55]]], "duration": [1.82, 4.36, 1.76, 10.38, 2.55]} \ No newline at end of file diff --git a/annotations_filtered/kKBsDfBDmG0_filtered.json b/annotations_filtered/kKBsDfBDmG0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8b8fed6a04d890887c399b3bc623e56a69d6f0c --- /dev/null +++ b/annotations_filtered/kKBsDfBDmG0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.07], [15.0, 14.93], [21.0, 23.84], [28.0, 28.56], [34.0, 36.27], [39.0, 39.92], [42.0, 44.0], [45.0, 45.77], [50.0, 52.3], [53.0, 53.32], [56.0, 65.35], [67.0, 67.46], [70.0, 69.74], [72.0, 74.07], [81.0, 81.77], [87.0, 89.75], [96.0, 95.84], [101.0, 101.73], [104.0, 103.84], [104.0, 105.14], [107.0, 107.45], [114.0, 114.54], [115.0, 116.73], [129.0, 130.77], [142.0, 143.56], [144.0, 145.2], [147.0, 149.71], [152.0, 152.58], [153.0, 154.92], [157.0, 157.64], [163.0, 165.86]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 39.52, 0.0, 99.98, 0.0, 100.0, 0.0, 45.78, 0.0, 43.43, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 0.0, 0.0, 0.0, 40.55], "audiomae_on_audioset": [null, null, [["whack, thwack", 41.61], ["smash, crash", 19.55], ["breaking", 14.18]], null, null, null, null, null, [["speech", 49.86], ["inside, small room", 3.42], ["animal", 3.35]], null, [["mains hum", 26.7], ["hum", 25.91], ["speech", 21.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 38.05], ["singing bowl", 14.06], ["hum", 7.69]]], "duration": [1.07, -0.07, 2.84, 0.56, 2.27, 0.92, 2.0, 0.77, 2.3, 0.32, 9.35, 0.46, -0.26, 2.07, 0.77, 2.75, -0.16, 0.73, -0.16, 1.14, 0.45, 0.54, 1.73, 1.77, 1.56, 1.2, 2.71, 0.58, 1.92, 0.64, 2.86]} \ No newline at end of file diff --git a/annotations_filtered/kKC8076NZOY_filtered.json b/annotations_filtered/kKC8076NZOY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96016b92ef39202de79bff5460a4d0aa3fbd2b93 --- /dev/null +++ b/annotations_filtered/kKC8076NZOY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.27], [7.0, 7.69], [8.0, 11.94], [12.0, 13.1], [14.0, 15.09], [17.0, 17.58], [29.0, 30.23], [32.0, 33.42], [34.0, 34.37], [37.0, 39.87], [41.0, 41.84], [43.0, 46.3], [48.0, 47.98], [56.0, 57.7], [59.0, 59.66], [61.0, 65.55], [68.0, 68.17], [71.0, 77.53], [81.0, 83.37], [85.0, 91.22], [94.0, 102.61], [103.0, 102.64], [103.0, 102.68], [103.0, 102.71], [106.0, 106.29], [107.0, 107.16]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, true, false, false, false, false, false], "silence_prob": [43.56, 0.0, 40.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.95, 0.0, 36.87, 0.0, 0.0, 0.0, 35.65, 0.0, 36.1, 37.14, 33.42, 38.23, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["moo", 29.13], ["cattle, bovinae", 24.42], ["livestock, farm animals, working animals", 9.02]], null, [["speech", 46.75], ["music", 20.43], ["boing", 11.12]], null, null, null, null, null, null, null, null, [["music", 72.38], ["musical instrument", 4.25], ["speech", 2.99]], null, null, null, [["hum", 24.28], ["mains hum", 22.45], ["music", 11.63]], null, [["throbbing", 33.22], ["music", 32.43], ["hum", 12.12]], [["music", 33.89], ["speech", 28.03], ["electronic music", 2.55]], [["cattle, bovinae", 33.01], ["livestock, farm animals, working animals", 31.93], ["moo", 19.64]], [["speech", 44.37], ["fly, housefly", 11.81], ["insect", 9.92]], null, null, null, null, null], "duration": [2.27, 0.69, 3.94, 1.1, 1.09, 0.58, 1.23, 1.42, 0.37, 2.87, 0.84, 3.3, -0.02, 1.7, 0.66, 4.55, 0.17, 6.53, 2.37, 6.22, 8.61, -0.36, -0.32, -0.29, 0.29, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/kKHr9gSW7HM_filtered.json b/annotations_filtered/kKHr9gSW7HM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28d498c3c24de3699a5557a35a56db948ae0c3fb --- /dev/null +++ b/annotations_filtered/kKHr9gSW7HM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.28], [4.0, 6.12], [10.0, 12.07], [14.0, 16.38], [19.0, 19.67], [26.0, 26.91], [28.0, 29.05], [31.0, 38.26], [39.0, 41.77], [42.0, 43.97], [48.0, 48.19], [49.0, 49.86], [57.0, 58.94], [61.0, 62.48], [64.0, 64.99], [65.0, 65.97], [67.0, 67.59], [71.0, 73.55], [75.0, 77.45], [81.0, 84.06], [88.0, 89.87], [91.0, 92.25], [95.0, 95.67], [100.0, 101.63], [104.0, 106.17], [107.0, 112.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 100.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.6, 86.64, 83.16, 0.0, 0.0, 0.0, 0.0, 92.8, 83.16], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.28, 2.12, 2.07, 2.38, 0.67, 0.91, 1.05, 7.26, 2.77, 1.97, 0.19, 0.86, 1.94, 1.48, 0.99, 0.97, 0.59, 2.55, 2.45, 3.06, 1.87, 1.25, 0.67, 1.63, 2.17, 5.97]} \ No newline at end of file diff --git a/annotations_filtered/kKUsYDTykUQ_filtered.json b/annotations_filtered/kKUsYDTykUQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86770e89d2c350824c66c64df2368029a361dd10 --- /dev/null +++ b/annotations_filtered/kKUsYDTykUQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 62.36], [64.0, 64.67], [66.0, 67.86], [68.0, 120.8]], "keep_status": [true, false, false, false], "silence_prob": [28.78, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 40.43], ["buzz", 12.07], ["music", 9.29]], null, null, null], "duration": [29.36, 0.67, 1.86, 52.8]} \ No newline at end of file diff --git a/annotations_filtered/kKlihXmSqPE_filtered.json b/annotations_filtered/kKlihXmSqPE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be135538895100774f07a65180a009784bf731e1 --- /dev/null +++ b/annotations_filtered/kKlihXmSqPE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.77], [7.0, 7.67], [9.0, 9.31], [11.0, 12.9], [14.0, 18.01], [19.0, 20.24], [21.0, 27.26], [28.0, 29.0], [30.0, 31.28], [32.0, 34.01], [35.0, 35.53], [37.0, 37.88], [39.0, 47.9], [48.0, 58.23], [59.0, 61.23], [62.0, 64.07], [69.0, 72.2], [74.0, 75.96], [79.0, 80.55], [82.0, 83.13], [84.0, 85.33], [87.0, 87.64], [88.0, 89.18], [91.0, 92.04], [93.0, 94.53], [95.0, 95.47], [96.0, 96.58], [97.0, 100.48], [104.0, 104.75], [106.0, 106.1], [110.0, 110.67], [114.0, 113.81], [115.0, 117.42], [119.0, 119.01], [122.0, 123.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 94.52, 0.0, 89.01, 0.0, 0.0, 98.01, 0.0, 0.0, 100.0, 80.82, 100.0, 99.97, 76.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.85, 0.0, 0.0, 0.0, 0.0, 73.06, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.77, 0.67, 0.31, 1.9, 4.01, 1.24, 6.26, 1.0, 1.28, 2.01, 0.53, 0.88, 8.9, 10.23, 2.23, 2.07, 3.2, 1.96, 1.55, 1.13, 1.33, 0.64, 1.18, 1.04, 1.53, 0.47, 0.58, 3.48, 0.75, 0.1, 0.67, -0.19, 2.42, 0.01, 1.16]} \ No newline at end of file diff --git a/annotations_filtered/kL8e9CEgm6A_filtered.json b/annotations_filtered/kL8e9CEgm6A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45d79d27da9accd9bba413ebd0868c55e152a272 --- /dev/null +++ b/annotations_filtered/kL8e9CEgm6A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.78], [6.0, 6.71], [9.0, 9.9], [11.0, 13.14], [19.0, 19.79], [22.0, 26.54], [27.0, 28.7], [29.0, 29.83], [32.0, 33.3], [35.0, 37.23], [40.0, 40.71], [44.0, 49.45], [50.0, 50.97], [53.0, 53.23], [54.0, 54.57], [56.0, 56.56], [58.0, 59.17], [65.0, 65.18], [72.0, 72.57], [89.0, 101.09], [103.0, 116.14], [117.0, 130.52], [133.0, 134.27], [135.0, 135.73], [138.0, 138.57], [140.0, 140.7], [141.0, 142.84], [144.0, 150.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 82.97, 0.0, 86.09, 0.0, 0.0, 0.0, 75.72, 0.0, 72.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.32, 29.41, 30.66, 0.0, 0.0, 0.0, 0.0, 0.0, 82.61], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.28], ["hum", 23.51], ["mains hum", 11.92]], [["music", 47.09], ["speech", 40.72], ["hum", 2.3]], [["music", 78.87], ["hum", 5.74], ["throbbing", 2.85]], null, null, null, null, null, null], "duration": [0.78, 0.71, 0.9, 2.14, 0.79, 4.54, 1.7, 0.83, 1.3, 2.23, 0.71, 5.45, 0.97, 0.23, 0.57, 0.56, 1.17, 0.18, 0.57, 12.09, 13.14, 13.52, 1.27, 0.73, 0.57, 0.7, 1.84, 6.97]} \ No newline at end of file diff --git a/annotations_filtered/kLJCWb1apYo_filtered.json b/annotations_filtered/kLJCWb1apYo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..14a611d200bce0cf261db431d5d3cbfe54d6a034 --- /dev/null +++ b/annotations_filtered/kLJCWb1apYo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.12], [7.0, 7.37], [9.0, 10.34], [12.0, 12.88], [27.0, 36.56], [38.0, 38.26], [43.0, 48.3], [53.0, 54.28], [56.0, 85.33], [87.0, 100.08], [100.0, 101.22], [104.0, 106.2], [108.0, 108.09]], "keep_status": [false, false, false, false, true, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 33.77, 0.0, 38.2, 0.0, 30.26, 32.04, 0.0, 74.13, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 50.84], ["vehicle", 9.63], ["rumble", 6.59]], null, [["music", 43.57], ["didgeridoo", 16.04], ["theremin", 9.06]], null, [["music", 77.14], ["electronic music", 5.95], ["throbbing", 5.71]], [["speech", 39.2], ["music", 16.46], ["theremin", 11.78]], null, null, null], "duration": [1.12, 0.37, 1.34, 0.88, 9.56, 0.26, 5.3, 1.28, 29.33, 13.08, 1.22, 2.2, 0.09]} \ No newline at end of file diff --git a/annotations_filtered/kLNdMY1JlR0_filtered.json b/annotations_filtered/kLNdMY1JlR0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e46587db3ce1ad6705911e390976b7e252eb5dbf --- /dev/null +++ b/annotations_filtered/kLNdMY1JlR0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.5], [6.0, 7.6], [10.0, 10.56], [17.0, 17.39], [20.0, 20.93], [23.0, 23.97], [31.0, 31.21], [38.0, 41.28], [43.0, 42.87]], "keep_status": [false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.26, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 49.28], ["applause", 13.16], ["fart", 3.69]], null], "duration": [1.5, 1.6, 0.56, 0.39, 0.93, 0.97, 0.21, 3.28, -0.13]} \ No newline at end of file diff --git a/annotations_filtered/kLjET9nE2dQ_filtered.json b/annotations_filtered/kLjET9nE2dQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ade54b575db6870eb12fd46770aeccadffd16051 --- /dev/null +++ b/annotations_filtered/kLjET9nE2dQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 13.34], [18.0, 31.43], [35.0, 47.71], [48.0, 51.51], [54.0, 54.51], [57.0, 60.44], [69.0, 78.14], [79.0, 80.38], [81.0, 83.81]], "keep_status": [false, false, true, true, false, true, false, false, true], "silence_prob": [31.31, 31.9, 32.47, 30.95, 0.0, 35.47, 36.89, 0.0, 30.67], "audiomae_on_audioset": [[["speech", 37.11], ["whack, thwack", 24.01], ["groan", 14.0]], [["speech", 59.68], ["whack, thwack", 16.75], ["thump, thud", 3.94]], [["speech", 32.68], ["whack, thwack", 23.74], ["breaking", 10.47]], [["whack, thwack", 29.01], ["music", 18.1], ["smash, crash", 11.14]], null, [["speech", 40.44], ["hum", 14.32], ["mains hum", 8.48]], [["throbbing", 43.52], ["music", 16.68], ["hum", 13.0]], null, [["music", 32.99], ["hum", 8.8], ["reverberation", 5.96]]], "duration": [7.34, 13.43, 12.71, 3.51, 0.51, 3.44, 9.14, 1.38, 2.81]} \ No newline at end of file diff --git a/annotations_filtered/kLovCSv9-Ks_filtered.json b/annotations_filtered/kLovCSv9-Ks_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0805670a4c2f0cdeeef00b06487eb75e2290066e --- /dev/null +++ b/annotations_filtered/kLovCSv9-Ks_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.39], [19.0, 21.07], [22.0, 23.21], [25.0, 27.38], [30.0, 31.04], [32.0, 37.07], [39.0, 40.96], [44.0, 70.44], [77.0, 96.2], [100.0, 100.09], [104.0, 105.02], [107.0, 107.77], [112.0, 112.24], [121.0, 122.61], [123.0, 127.55]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 90.95, 0.0, 85.35, 0.0, 53.47, 0.0, 36.19, 29.8, 0.0, 0.0, 0.0, 0.0, 0.0, 54.43], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["tuning fork", 93.05], ["sine wave", 1.51], ["chirp tone", 1.27]], [["music", 64.22], ["jingle, tinkle", 2.26], ["noise", 2.17]], null, null, null, null, null, null], "duration": [0.39, 2.07, 1.21, 2.38, 1.04, 5.07, 1.96, 26.44, 19.2, 0.09, 1.02, 0.77, 0.24, 1.61, 4.55]} \ No newline at end of file diff --git a/annotations_filtered/kMalrBgdRvI_filtered.json b/annotations_filtered/kMalrBgdRvI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29dfbc5efdb3ab53dbd001d54cefff9661ad8731 --- /dev/null +++ b/annotations_filtered/kMalrBgdRvI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.38], [13.0, 13.76], [14.0, 14.94], [18.0, 18.87], [23.0, 24.68], [29.0, 32.66], [36.0, 41.77], [43.0, 45.77], [47.0, 49.3], [51.0, 86.02]], "keep_status": [false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.18, 31.5, 29.36, 29.77, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 29.17], ["throbbing", 19.8], ["speech", 8.78]], [["speech", 35.2], ["vehicle", 20.92], ["music", 15.35]], [["music", 54.43], ["static", 3.36], ["electronic music", 3.16]], [["music", 64.42], ["theremin", 3.7], ["didgeridoo", 3.12]], null], "duration": [0.38, 0.76, 0.94, 0.87, 1.68, 3.66, 5.77, 2.77, 2.3, 35.02]} \ No newline at end of file diff --git a/annotations_filtered/kMcvRpOOIwY_filtered.json b/annotations_filtered/kMcvRpOOIwY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9c3a56b40987c7e9956d8ded776b529d6d0f972 --- /dev/null +++ b/annotations_filtered/kMcvRpOOIwY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.34], [13.0, 13.83], [17.0, 56.57], [60.0, 95.2], [96.0, 98.59], [102.0, 106.64], [108.0, 118.59], [122.0, 122.28], [123.0, 129.61], [131.0, 153.06], [155.0, 164.61]], "keep_status": [false, false, false, false, true, true, false, false, true, true, false], "silence_prob": [29.78, 0.0, 0.0, 0.0, 31.7, 28.87, 29.24, 0.0, 29.19, 29.38, 28.93], "audiomae_on_audioset": [[["music", 84.23], ["quack", 3.29], ["animal", 1.67]], null, null, null, [["music", 21.35], ["sine wave", 7.38], ["moo", 7.02]], [["cattle, bovinae", 20.72], ["moo", 20.5], ["speech", 14.16]], [["groan", 38.75], ["music", 27.34], ["whack, thwack", 4.76]], null, [["music", 25.44], ["cattle, bovinae", 10.1], ["sheep", 7.78]], [["music", 54.89], ["speech", 5.67], ["didgeridoo", 4.2]], [["music", 76.01], ["cacophony", 2.25], ["speech", 1.5]]], "duration": [5.34, 0.83, 39.57, 35.2, 2.59, 4.64, 10.59, 0.28, 6.61, 22.06, 9.61]} \ No newline at end of file diff --git a/annotations_filtered/kMkxtj-mu14_filtered.json b/annotations_filtered/kMkxtj-mu14_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..525d986931ff30501a9c997289030ff834fbeda4 --- /dev/null +++ b/annotations_filtered/kMkxtj-mu14_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.14], [25.0, 25.32], [30.0, 30.38], [37.0, 37.35], [38.0, 38.82], [65.0, 66.01], [68.0, 68.82], [71.0, 71.1], [89.0, 91.86], [96.0, 107.62], [108.0, 108.67], [110.0, 110.25], [121.0, 121.66], [122.0, 122.67], [124.0, 123.72], [125.0, 125.83]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.52, 42.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 32.88], ["speech", 4.98], ["musical instrument", 4.18]], [["music", 68.74], ["hum", 4.8], ["speech", 4.03]], null, null, null, null, null, null], "duration": [1.14, 0.32, 0.38, 0.35, 0.82, 1.01, 0.82, 0.1, 2.86, 11.62, 0.67, 0.25, 0.66, 0.67, -0.28, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/kNMc5CKw4G0_filtered.json b/annotations_filtered/kNMc5CKw4G0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c3ad088204c7ba09aabbabf2afa25017a9865de --- /dev/null +++ b/annotations_filtered/kNMc5CKw4G0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.01], [5.0, 6.0], [19.0, 19.62], [29.0, 29.91], [31.0, 31.21], [34.0, 34.84], [36.0, 36.71], [38.0, 37.72], [39.0, 39.21], [40.0, 40.63], [47.0, 47.41], [49.0, 49.32], [50.0, 50.67], [52.0, 51.7], [52.0, 53.47], [62.0, 62.73], [64.0, 64.42], [65.0, 66.09], [67.0, 67.44], [71.0, 71.68], [75.0, 80.16], [81.0, 81.3], [82.0, 82.48], [86.0, 86.81], [87.0, 87.37], [103.0, 103.27], [111.0, 111.86], [113.0, 114.37], [115.0, 116.38], [117.0, 117.42], [119.0, 119.43], [120.0, 120.77], [122.0, 124.04], [127.0, 128.17], [128.0, 128.24], [132.0, 132.95], [133.0, 134.01], [135.0, 135.38], [136.0, 136.48], [137.0, 137.05], [138.0, 138.5], [140.0, 140.17], [140.0, 140.43], [141.0, 142.18], [143.0, 144.44], [145.0, 146.06], [150.0, 150.45], [159.0, 159.97], [166.0, 167.48], [175.0, 176.07], [181.0, 180.76], [182.0, 182.44], [184.0, 184.65], [186.0, 188.23], [190.0, 190.17], [191.0, 191.83], [194.0, 194.75], [196.0, 199.74], [204.0, 205.87], [207.0, 208.35], [210.0, 210.71], [212.0, 211.74], [213.0, 213.16], [221.0, 222.13], [225.0, 226.08], [227.0, 228.7], [229.0, 228.73], [229.0, 228.77], [229.0, 230.96], [234.0, 238.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 0.0, 0.0, 98.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 24.63], ["speech", 22.59], ["musical instrument", 5.41]]], "duration": [1.01, 1.0, 0.62, 0.91, 0.21, 0.84, 0.71, -0.28, 0.21, 0.63, 0.41, 0.32, 0.67, -0.3, 1.47, 0.73, 0.42, 1.09, 0.44, 0.68, 5.16, 0.3, 0.48, 0.81, 0.37, 0.27, 0.86, 1.37, 1.38, 0.42, 0.43, 0.77, 2.04, 1.17, 0.24, 0.95, 1.01, 0.38, 0.48, 0.05, 0.5, 0.17, 0.43, 1.18, 1.44, 1.06, 0.45, 0.97, 1.48, 1.07, -0.24, 0.44, 0.65, 2.23, 0.17, 0.83, 0.75, 3.74, 1.87, 1.35, 0.71, -0.26, 0.16, 1.13, 1.08, 1.7, -0.27, -0.23, 1.96, 4.44]} \ No newline at end of file diff --git a/annotations_filtered/kNpbZ_oVHxE_filtered.json b/annotations_filtered/kNpbZ_oVHxE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e780c80c81db05ff4620e50fa44ff80f6cbc067 --- /dev/null +++ b/annotations_filtered/kNpbZ_oVHxE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.3], [5.0, 7.28], [10.0, 12.48], [15.0, 16.14], [21.0, 21.49], [24.0, 24.95], [27.0, 28.32], [32.0, 33.74], [35.0, 38.2], [42.0, 45.69], [47.0, 49.42], [52.0, 59.04]], "keep_status": [false, true, false, false, false, false, false, false, true, true, true, false], "silence_prob": [0.0, 36.37, 37.27, 0.0, 0.0, 0.0, 0.0, 0.0, 40.54, 33.18, 34.53, 35.39], "audiomae_on_audioset": [null, [["throbbing", 18.87], ["music", 10.47], ["hum", 7.2]], [["music", 48.59], ["theremin", 21.86], ["hammond organ", 3.78]], null, null, null, null, null, [["music", 54.29], ["musical instrument", 3.61], ["foghorn", 3.12]], [["music", 30.6], ["speech", 21.78], ["synthesizer", 11.76]], [["music", 27.62], ["foghorn", 5.08], ["speech", 3.45]], [["music", 60.23], ["speech", 9.64], ["theremin", 8.07]]], "duration": [1.3, 2.28, 2.48, 1.14, 0.49, 0.95, 1.32, 1.74, 3.2, 3.69, 2.42, 7.04]} \ No newline at end of file diff --git a/annotations_filtered/kNtopT3-5t0_filtered.json b/annotations_filtered/kNtopT3-5t0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..889c310a0ad0dfdcb959271ac078c46ae2abd017 --- /dev/null +++ b/annotations_filtered/kNtopT3-5t0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 45.3], [47.0, 47.51], [54.0, 56.61], [75.0, 75.56], [76.0, 76.76], [78.0, 82.59], [85.0, 86.7], [90.0, 91.13], [102.0, 103.45], [113.0, 113.88], [117.0, 117.69], [125.0, 126.17], [134.0, 134.28], [137.0, 138.18], [143.0, 143.02], [159.0, 160.44], [163.0, 165.42], [175.0, 175.59], [177.0, 182.73]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.17, 0.0, 0.0, 41.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.29, 0.0, 69.47], "audiomae_on_audioset": [null, null, [["speech", 44.92], ["music", 16.11], ["boing", 9.86]], null, null, [["music", 39.96], ["synthesizer", 19.04], ["musical instrument", 8.49]], null, null, null, null, null, null, null, null, null, null, [["music", 56.27], ["synthesizer", 9.44], ["speech", 5.64]], null, null], "duration": [0.3, 0.51, 2.61, 0.56, 0.76, 4.59, 1.7, 1.13, 1.45, 0.88, 0.69, 1.17, 0.28, 1.18, 0.02, 1.44, 2.42, 0.59, 5.73]} \ No newline at end of file diff --git a/annotations_filtered/kO0kWTR_7tQ_filtered.json b/annotations_filtered/kO0kWTR_7tQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5314e0f312f35d26ef49b59015779929f0949e9 --- /dev/null +++ b/annotations_filtered/kO0kWTR_7tQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.54], [4.0, 4.77], [6.0, 6.34], [28.0, 28.05], [30.0, 30.38], [31.0, 31.77], [35.0, 36.0], [43.0, 43.5], [48.0, 55.44], [56.0, 57.79], [59.0, 60.27], [65.0, 64.69], [72.0, 72.55], [82.0, 83.2], [91.0, 94.12], [98.0, 97.9], [99.0, 100.23], [106.0, 109.86], [117.0, 118.27], [122.0, 122.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.78, 0.0, 0.0, 0.0, 0.0, 0.0, 69.2, 0.0, 0.0, 40.48, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cowbell", 20.47], ["cattle, bovinae", 10.22], ["speech", 8.45]], null, null], "duration": [0.54, 0.77, 0.34, 0.05, 0.38, 0.77, 1.0, 0.5, 7.44, 1.79, 1.27, -0.31, 0.55, 1.2, 3.12, -0.1, 1.23, 3.86, 1.27, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/kOBAOfh46Nk_filtered.json b/annotations_filtered/kOBAOfh46Nk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f691554c9a371f51d91cf329182cdbcfcf3910fc --- /dev/null +++ b/annotations_filtered/kOBAOfh46Nk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.21], [7.0, 13.66], [16.0, 16.85], [17.0, 18.2], [22.0, 100.16], [102.0, 106.03]], "keep_status": [false, false, false, false, false, true], "silence_prob": [0.0, 51.44, 0.0, 0.0, 0.0, 33.52], "audiomae_on_audioset": [null, null, null, null, null, [["moo", 23.3], ["cattle, bovinae", 19.22], ["livestock, farm animals, working animals", 7.41]]], "duration": [0.21, 6.66, 0.85, 1.2, 78.16, 4.03]} \ No newline at end of file diff --git a/annotations_filtered/kOe-yLCbA4E_filtered.json b/annotations_filtered/kOe-yLCbA4E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4eeb0e18030af615f8f2835a4cd70af810196098 --- /dev/null +++ b/annotations_filtered/kOe-yLCbA4E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.96], [5.0, 6.3], [10.0, 16.31], [18.0, 36.88], [38.0, 38.3], [44.0, 44.68], [46.0, 46.06], [48.0, 48.56], [49.0, 55.32], [56.0, 55.93], [57.0, 58.18], [60.0, 69.7], [72.0, 73.28], [74.0, 76.49], [82.0, 81.58], [84.0, 84.35], [86.0, 88.13], [92.0, 95.71], [96.0, 96.38], [100.0, 100.52], [102.0, 102.79], [103.0, 103.57], [108.0, 110.07], [111.0, 111.94], [113.0, 112.9], [114.0, 116.94], [117.0, 117.61], [118.0, 128.58], [133.0, 142.5], [144.0, 144.37], [145.0, 145.77], [150.0, 153.96], [155.0, 155.92]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 78.04, 46.19, 0.0, 0.0, 0.0, 0.0, 53.97, 0.0, 0.0, 32.61, 0.0, 38.75, 0.0, 0.0, 66.51, 35.31, 0.0, 0.0, 0.0, 0.0, 58.05, 0.0, 0.0, 49.22, 0.0, 50.97, 38.88, 0.0, 0.0, 37.02, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 22.52], ["speech", 10.61], ["hum", 8.81]], null, null, null, null, null, null, null, [["music", 73.43], ["brass instrument", 2.92], ["musical instrument", 2.54]], null, [["didgeridoo", 43.9], ["music", 16.68], ["chop", 4.35]], null, null, null, [["music", 27.1], ["speech", 22.34], ["didgeridoo", 18.85]], null, null, null, null, null, null, null, [["noise", 14.61], ["music", 8.65], ["mains hum", 6.11]], null, null, [["music", 64.47], ["wind instrument, woodwind instrument", 4.45], ["brass instrument", 3.19]], null, null, [["noise", 18.82], ["mains hum", 16.67], ["hum", 16.48]], null], "duration": [1.96, 1.3, 6.31, 18.88, 0.3, 0.68, 0.06, 0.56, 6.32, -0.07, 1.18, 9.7, 1.28, 2.49, -0.42, 0.35, 2.13, 3.71, 0.38, 0.52, 0.79, 0.57, 2.07, 0.94, -0.1, 2.94, 0.61, 10.58, 9.5, 0.37, 0.77, 3.96, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/kOfY6wIKT40_filtered.json b/annotations_filtered/kOfY6wIKT40_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71b544fafc805a4dd67c9ccc853ebc6273da2b63 --- /dev/null +++ b/annotations_filtered/kOfY6wIKT40_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.49], [4.0, 4.09], [5.0, 9.42], [11.0, 11.25], [13.0, 15.38], [16.0, 17.64], [20.0, 20.14], [21.0, 21.68], [27.0, 26.62], [32.0, 32.41], [33.0, 43.44], [45.0, 45.89], [47.0, 47.48], [48.0, 48.49], [49.0, 49.84], [51.0, 51.17], [52.0, 52.84], [54.0, 54.97], [58.0, 59.19], [60.0, 61.3], [62.0, 62.51], [64.0, 64.93], [65.0, 67.46], [68.0, 75.56], [77.0, 77.8], [79.0, 79.66], [84.0, 84.2], [85.0, 85.33], [88.0, 88.82], [91.0, 91.69], [95.0, 94.91], [96.0, 96.2], [97.0, 98.29], [99.0, 100.04], [103.0, 104.6], [105.0, 105.43], [105.0, 106.39], [108.0, 109.17], [110.0, 110.05], [110.0, 110.59], [111.0, 112.11], [113.0, 113.24], [114.0, 114.89], [116.0, 116.95], [119.0, 118.93], [120.0, 120.7], [122.0, 123.84], [125.0, 129.78], [130.0, 130.81], [132.0, 133.08], [134.0, 134.96], [137.0, 144.46], [146.0, 146.57], [152.0, 156.02], [158.0, 158.62], [159.0, 161.64], [165.0, 166.01], [166.0, 167.29], [168.0, 177.09], [178.0, 179.41]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 44.2, 0.0, 41.4, 0.0, 0.0, 0.0, 0.0, 0.0, 94.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.25, 97.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.25, 0.0, 0.0, 0.0, 48.35, 0.0, 48.44, 0.0, 60.14, 0.0, 0.0, 49.45, 0.0], "audiomae_on_audioset": [null, null, [["music", 26.8], ["musical instrument", 11.14], ["guitar", 10.74]], null, [["theremin", 55.33], ["music", 19.16], ["speech", 14.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 55.38], ["music", 24.99], ["synthesizer", 3.99]], null, [["theremin", 47.35], ["music", 34.1], ["synthesizer", 5.32]], null, null, null, null, [["theremin", 56.85], ["music", 20.41], ["synthesizer", 6.3]], null], "duration": [0.49, 0.09, 4.42, 0.25, 2.38, 1.64, 0.14, 0.68, -0.38, 0.41, 10.44, 0.89, 0.48, 0.49, 0.84, 0.17, 0.84, 0.97, 1.19, 1.3, 0.51, 0.93, 2.46, 7.56, 0.8, 0.66, 0.2, 0.33, 0.82, 0.69, -0.09, 0.2, 1.29, 1.04, 1.6, 0.43, 1.39, 1.17, 0.05, 0.59, 1.11, 0.24, 0.89, 0.95, -0.07, 0.7, 1.84, 4.78, 0.81, 1.08, 0.96, 7.46, 0.57, 4.02, 0.62, 2.64, 1.01, 1.29, 9.09, 1.41]} \ No newline at end of file diff --git a/annotations_filtered/kP5GKIrGoeQ_filtered.json b/annotations_filtered/kP5GKIrGoeQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d28419f9ba27271ebc67af7d76dde4e782e44f22 --- /dev/null +++ b/annotations_filtered/kP5GKIrGoeQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.48], [11.0, 12.21], [13.0, 22.2], [24.0, 25.91], [27.0, 28.98], [30.0, 35.56], [36.0, 44.91], [46.0, 46.5], [47.0, 49.91], [52.0, 53.91], [55.0, 57.45], [58.0, 59.78], [60.0, 61.72], [62.0, 66.34], [68.0, 71.12], [73.0, 74.17], [74.0, 77.38], [79.0, 82.34], [84.0, 86.76], [88.0, 89.58], [90.0, 94.71], [96.0, 96.79], [97.0, 99.87], [104.0, 105.29], [107.0, 107.99], [112.0, 115.97], [117.0, 119.69], [122.0, 123.7], [124.0, 125.88], [127.0, 129.76], [131.0, 135.65], [138.0, 139.72], [141.0, 149.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.81, 0.0, 81.89, 0.0, 0.0, 99.16, 78.55, 0.0, 71.72, 0.0, 99.44, 0.0, 0.0, 57.89, 97.33, 0.0, 71.29, 98.73, 69.34, 0.0, 76.53, 0.0, 81.17, 0.0, 0.0, 70.86, 92.15, 0.0, 0.0, 98.01, 97.83, 0.0, 87.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.48, 1.21, 9.2, 1.91, 1.98, 5.56, 8.91, 0.5, 2.91, 1.91, 2.45, 1.78, 1.72, 4.34, 3.12, 1.17, 3.38, 3.34, 2.76, 1.58, 4.71, 0.79, 2.87, 1.29, 0.99, 3.97, 2.69, 1.7, 1.88, 2.76, 4.65, 1.72, 8.49]} \ No newline at end of file diff --git a/annotations_filtered/kP6EOOdTQP8_filtered.json b/annotations_filtered/kP6EOOdTQP8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1431039aeb32ca16e73d22217a1049eed9db24fb --- /dev/null +++ b/annotations_filtered/kP6EOOdTQP8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.93], [8.0, 9.68], [10.0, 10.52], [13.0, 22.52], [24.0, 26.89], [30.0, 32.75], [35.0, 63.68], [68.0, 69.18]], "keep_status": [false, false, false, false, true, false, false, false], "silence_prob": [50.06, 0.0, 0.0, 37.96, 44.99, 53.4, 30.5, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 54.94], ["music", 27.83], ["thunk", 9.44]], [["music", 42.01], ["speech", 7.33], ["guitar", 5.3]], null, [["music", 67.66], ["speech", 6.07], ["thunk", 3.46]], null], "duration": [4.93, 1.68, 0.52, 9.52, 2.89, 2.75, 28.68, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/kPE7ZCGjw4o_filtered.json b/annotations_filtered/kPE7ZCGjw4o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77b3e79024c3b049f99959d069627b091af09ad6 --- /dev/null +++ b/annotations_filtered/kPE7ZCGjw4o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.27], [7.0, 27.01], [30.0, 41.37], [47.0, 48.19], [54.0, 56.12], [60.0, 60.0], [61.0, 61.32], [62.0, 65.69], [67.0, 67.32], [83.0, 83.94], [99.0, 99.3], [99.0, 99.77], [100.0, 107.18], [109.0, 117.91], [120.0, 125.46], [126.0, 125.71], [126.0, 129.07], [131.0, 132.83], [136.0, 136.41], [141.0, 142.33], [159.0, 159.21], [165.0, 168.74], [170.0, 171.05], [172.0, 172.5], [173.0, 173.8], [179.0, 179.49], [180.0, 185.46], [187.0, 195.2], [196.0, 196.08], [197.0, 196.75], [199.0, 198.8], [200.0, 200.35], [204.0, 204.87], [207.0, 207.66], [212.0, 214.91], [216.0, 217.24]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.6, 34.14, 0.0, 31.48, 0.0, 0.0, 31.32, 0.0, 0.0, 0.0, 0.0, 34.03, 34.65, 39.47, 0.0, 72.46, 0.0, 0.0, 0.0, 0.0, 50.02, 0.0, 0.0, 0.0, 0.0, 33.38, 48.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.09, 0.0], "audiomae_on_audioset": [null, [["music", 69.13], ["speech", 18.15], ["throbbing", 3.53]], [["speech", 38.44], ["animal", 8.62], ["music", 5.31]], null, [["music", 62.96], ["speech", 15.16], ["skidding", 1.07]], null, null, [["speech", 58.35], ["music", 19.33], ["didgeridoo", 2.4]], null, null, null, null, [["music", 71.09], ["speech", 4.31], ["fart", 2.94]], [["music", 42.92], ["speech", 9.95], ["throbbing", 5.18]], [["speech", 53.49], ["crack", 13.34], ["sidetone", 12.66]], null, null, null, null, null, null, null, null, null, null, null, [["roar", 42.3], ["creak", 19.98], ["whale vocalization", 6.75]], [["music", 51.24], ["fly, housefly", 8.73], ["mosquito", 7.51]], null, null, null, null, null, null, [["music", 69.96], ["didgeridoo", 2.19], ["wind instrument, woodwind instrument", 1.98]], null], "duration": [0.27, 20.01, 11.37, 1.19, 2.12, 0.0, 0.32, 3.69, 0.32, 0.94, 0.3, 0.77, 7.18, 8.91, 5.46, -0.29, 3.07, 1.83, 0.41, 1.33, 0.21, 3.74, 1.05, 0.5, 0.8, 0.49, 5.46, 8.2, 0.08, -0.25, -0.2, 0.35, 0.87, 0.66, 2.91, 1.24]} \ No newline at end of file diff --git a/annotations_filtered/kPHbIyDTPHU_filtered.json b/annotations_filtered/kPHbIyDTPHU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef88c251e97ae43f779d2a38cfa9b1ffc78c1216 --- /dev/null +++ b/annotations_filtered/kPHbIyDTPHU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.9], [11.0, 11.82], [12.0, 13.07], [15.0, 14.67], [16.0, 16.58], [22.0, 22.6], [24.0, 24.27], [25.0, 25.81], [27.0, 29.37], [31.0, 41.12], [43.0, 43.63], [45.0, 45.57], [47.0, 48.63], [50.0, 50.33], [51.0, 52.79], [55.0, 57.18], [59.0, 59.29], [62.0, 63.41], [64.0, 65.31], [68.0, 68.03], [76.0, 76.18], [77.0, 78.78], [81.0, 81.78], [82.0, 84.55], [86.0, 86.34], [89.0, 93.02], [95.0, 95.66], [98.0, 98.81], [99.0, 100.18], [102.0, 102.32], [103.0, 106.37], [108.0, 110.83], [112.0, 112.51], [113.0, 113.41], [115.0, 115.99], [117.0, 118.15], [119.0, 120.01], [122.0, 123.28], [124.0, 125.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.59, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.9, 0.82, 1.07, -0.33, 0.58, 0.6, 0.27, 0.81, 2.37, 10.12, 0.63, 0.57, 1.63, 0.33, 1.79, 2.18, 0.29, 1.41, 1.31, 0.03, 0.18, 1.78, 0.78, 2.55, 0.34, 4.02, 0.66, 0.81, 1.18, 0.32, 3.37, 2.83, 0.51, 0.41, 0.99, 1.15, 1.01, 1.28, 1.69]} \ No newline at end of file diff --git a/annotations_filtered/kPNy_yGvpKI_filtered.json b/annotations_filtered/kPNy_yGvpKI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4126b8d4f157a070ba94a56a30b75a297cd02ee4 --- /dev/null +++ b/annotations_filtered/kPNy_yGvpKI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.81], [15.0, 14.89], [19.0, 19.65], [21.0, 21.3], [25.0, 56.96], [58.0, 58.41], [59.0, 60.15], [62.0, 72.64], [79.0, 100.36], [105.0, 105.71], [106.0, 107.11]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.72, 43.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 39.34], ["cattle, bovinae", 15.26], ["moo", 9.32]], [["speech", 31.95], ["fly, housefly", 8.49], ["hum", 7.32]], null, null], "duration": [1.81, -0.11, 0.65, 0.3, 31.96, 0.41, 1.15, 10.64, 21.36, 0.71, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/kPSk30qzgFs_filtered.json b/annotations_filtered/kPSk30qzgFs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50e52f4cce3ff8702e5953d237e4119bc302c2a2 --- /dev/null +++ b/annotations_filtered/kPSk30qzgFs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.96], [8.0, 9.98], [11.0, 34.72], [37.0, 71.19]], "keep_status": [false, false, true, false], "silence_prob": [100.0, 0.0, 38.83, 0.0], "audiomae_on_audioset": [null, null, [["music", 43.12], ["busy signal", 8.6], ["hum", 6.25]], null], "duration": [2.96, 1.98, 23.72, 34.19]} \ No newline at end of file diff --git a/annotations_filtered/kPXFWplmSyA_filtered.json b/annotations_filtered/kPXFWplmSyA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32f155d20a355d232fa0d2f2e764547f2657a9a5 --- /dev/null +++ b/annotations_filtered/kPXFWplmSyA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 24.48], [26.0, 27.89], [29.0, 30.21], [36.0, 39.72], [41.0, 41.86], [43.0, 43.93], [45.0, 46.16], [47.0, 50.18], [55.0, 55.32], [57.0, 57.59], [59.0, 62.5], [63.0, 63.54], [66.0, 66.56], [68.0, 68.88], [69.0, 72.12], [75.0, 79.08], [83.0, 83.29], [85.0, 88.05], [91.0, 92.72], [95.0, 96.01], [98.0, 100.09], [102.0, 103.52], [105.0, 112.19], [112.0, 112.23], [114.0, 113.68], [114.0, 113.85], [118.0, 129.02], [130.0, 130.92], [132.0, 133.22], [134.0, 134.84], [138.0, 140.17], [144.0, 163.53], [165.0, 165.55], [166.0, 166.8], [167.0, 170.23], [171.0, 176.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.11, 0.0, 0.0, 95.09, 0.0, 0.0, 0.0, 75.23, 0.0, 0.0, 97.54, 0.0, 0.0, 0.0, 44.07, 51.71, 0.0, 77.87, 0.0, 0.0, 67.38, 0.0, 32.39, 0.0, 0.0, 0.0, 31.31, 0.0, 0.0, 0.0, 57.48, 52.05, 0.0, 0.0, 61.67, 80.11], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.38], ["music", 13.76], ["hum", 5.14]], null, null, null, null, null, null, null, [["speech", 51.32], ["radio", 5.86], ["noise", 5.75]], null, null, null, [["music", 53.57], ["cacophony", 10.27], ["speech", 9.07]], null, null, null, null, null, null, null, null, null], "duration": [2.48, 1.89, 1.21, 3.72, 0.86, 0.93, 1.16, 3.18, 0.32, 0.59, 3.5, 0.54, 0.56, 0.88, 3.12, 4.08, 0.29, 3.05, 1.72, 1.01, 2.09, 1.52, 7.19, 0.23, -0.32, -0.15, 11.02, 0.92, 1.22, 0.84, 2.17, 19.53, 0.55, 0.8, 3.23, 5.89]} \ No newline at end of file diff --git a/annotations_filtered/kPiMgLB7S7c_filtered.json b/annotations_filtered/kPiMgLB7S7c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..372316319d0aa6ec4c700bfa606ba3236fcaf950 --- /dev/null +++ b/annotations_filtered/kPiMgLB7S7c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.06], [9.0, 24.58], [26.0, 28.41], [29.0, 31.53], [32.0, 32.71], [38.0, 40.29], [45.0, 46.31], [48.0, 48.66], [49.0, 49.1], [50.0, 50.33], [65.0, 82.54], [93.0, 94.32], [100.0, 99.94], [102.0, 106.37], [107.0, 118.72], [120.0, 120.87], [124.0, 125.64], [137.0, 139.53], [141.0, 142.45], [143.0, 145.37], [146.0, 168.69]], "keep_status": [false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.38, 30.74, 29.89, 0.0, 29.55, 0.0, 0.0, 0.0, 0.0, 29.89, 0.0, 0.0, 38.84, 55.18, 0.0, 0.0, 37.82, 0.0, 91.64, 67.13], "audiomae_on_audioset": [null, [["hum", 42.94], ["mains hum", 23.44], ["music", 16.86]], [["music", 47.47], ["theremin", 27.44], ["musical instrument", 3.43]], [["speech", 42.81], ["explosion", 12.44], ["whack, thwack", 10.85]], null, [["music", 18.22], ["speech", 14.48], ["whoosh, swoosh, swish", 12.7]], null, null, null, null, [["music", 30.84], ["hum", 14.51], ["electronic music", 7.64]], null, null, [["mains hum", 37.07], ["hum", 36.0], ["throbbing", 9.22]], null, null, null, [["hum", 29.83], ["music", 21.79], ["mains hum", 21.09]], null, null, null], "duration": [1.06, 15.58, 2.41, 2.53, 0.71, 2.29, 1.31, 0.66, 0.1, 0.33, 17.54, 1.32, -0.06, 4.37, 11.72, 0.87, 1.64, 2.53, 1.45, 2.37, 22.69]} \ No newline at end of file diff --git a/annotations_filtered/kPsFoudYVSg_filtered.json b/annotations_filtered/kPsFoudYVSg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c5278db454de169f40feadb889a79394734385a --- /dev/null +++ b/annotations_filtered/kPsFoudYVSg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.94], [5.0, 6.18], [13.0, 13.19], [16.0, 18.01], [20.0, 23.72], [24.0, 26.25], [28.0, 28.92], [32.0, 35.16], [36.0, 43.07], [49.0, 53.0], [56.0, 59.04], [61.0, 76.11], [78.0, 79.17], [81.0, 81.97], [83.0, 98.98], [99.0, 99.23], [99.0, 104.01], [105.0, 108.43], [110.0, 114.99], [118.0, 153.5], [156.0, 155.85], [156.0, 156.03], [156.0, 156.36], [157.0, 163.59], [165.0, 166.35], [168.0, 168.32], [171.0, 171.63]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 51.28, 33.0, 33.86, 0.0, 40.48, 35.5, 29.85, 30.89, 34.83, 0.0, 0.0, 91.98, 0.0, 57.48, 71.87, 42.72, 0.0, 0.0, 0.0, 0.0, 59.24, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["clang", 36.37], ["crushing", 28.41], ["breaking", 8.99]], [["sidetone", 49.62], ["speech", 15.11], ["hum", 12.11]], null, [["gong", 74.73], ["music", 6.39], ["hum", 5.39]], [["music", 36.0], ["throbbing", 20.22], ["hum", 8.77]], [["music", 84.72], ["throbbing", 1.47], ["boing", 1.43]], [["music", 36.28], ["throbbing", 32.71], ["cowbell", 5.28]], [["speech", 41.46], ["sidetone", 27.15], ["music", 7.99]], null, null, null, null, null, null, [["noise", 29.19], ["throbbing", 11.95], ["hum", 11.64]], null, null, null, null, null, null, null, null], "duration": [0.94, 1.18, 0.19, 2.01, 3.72, 2.25, 0.92, 3.16, 7.07, 4.0, 3.04, 15.11, 1.17, 0.97, 15.98, 0.23, 5.01, 3.43, 4.99, 35.5, -0.15, 0.03, 0.36, 6.59, 1.35, 0.32, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/kQ65F_pf868_filtered.json b/annotations_filtered/kQ65F_pf868_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4da0ead73c19b3abb0c36d05203844cce3eabd71 --- /dev/null +++ b/annotations_filtered/kQ65F_pf868_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.68], [19.0, 24.97], [29.0, 29.83], [36.0, 54.89], [78.0, 83.81], [85.0, 85.97]], "keep_status": [false, true, false, true, true, false], "silence_prob": [0.0, 34.93, 0.0, 34.22, 39.46, 0.0], "audiomae_on_audioset": [null, [["speech", 49.99], ["music", 9.56], ["boing", 6.7]], null, [["music", 11.74], ["fly, housefly", 9.13], ["hum", 9.0]], [["music", 42.01], ["electronic music", 8.38], ["ambient music", 6.78]], null], "duration": [1.68, 5.97, 0.83, 18.89, 5.81, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/kQ6BSOZ0VGQ_filtered.json b/annotations_filtered/kQ6BSOZ0VGQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b88b9b3f98e2dbbbf39cd938a7d5dde3276fc7f --- /dev/null +++ b/annotations_filtered/kQ6BSOZ0VGQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.01], [19.0, 27.7], [29.0, 29.44], [36.0, 43.97], [56.0, 56.27], [59.0, 59.83], [62.0, 75.34], [76.0, 92.01], [100.0, 101.36], [102.0, 103.54]], "keep_status": [false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 33.0, 0.0, 33.85, 0.0, 0.0, 38.74, 99.4, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 73.69], ["didgeridoo", 5.44], ["synthesizer", 4.57]], null, [["music", 66.39], ["didgeridoo", 8.56], ["synthesizer", 4.68]], null, null, [["music", 31.25], ["theremin", 21.77], ["whale vocalization", 12.68]], null, null, null], "duration": [0.01, 8.7, 0.44, 7.97, 0.27, 0.83, 13.34, 16.01, 1.36, 1.54]} \ No newline at end of file diff --git a/annotations_filtered/kQI3S3inEXg_filtered.json b/annotations_filtered/kQI3S3inEXg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a78d7a484ab4bb7e92b2d2238fb4e986cfd66b95 --- /dev/null +++ b/annotations_filtered/kQI3S3inEXg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 19.04], [20.0, 21.49], [25.0, 28.71], [30.0, 31.28], [33.0, 33.45], [35.0, 37.42], [38.0, 40.44], [41.0, 43.11], [44.0, 45.62], [47.0, 51.38], [52.0, 56.67], [57.0, 68.91], [70.0, 74.38], [75.0, 75.95], [77.0, 96.7], [97.0, 97.23], [97.0, 121.64], [124.0, 124.78], [125.0, 131.09], [133.0, 133.52], [134.0, 135.33], [137.0, 139.82], [141.0, 142.21], [143.0, 150.55], [152.0, 155.09], [156.0, 158.38], [161.0, 164.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.93, 0.0, 100.0, 0.0, 0.0, 99.44, 100.0, 100.0, 0.0, 99.78, 100.0, 97.43, 94.95, 0.0, 91.81, 0.0, 80.11, 0.0, 98.36, 0.0, 0.0, 99.9, 0.0, 95.23, 90.95, 95.91, 90.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.04, 1.49, 3.71, 1.28, 0.45, 2.42, 2.44, 2.11, 1.62, 4.38, 4.67, 11.91, 4.38, 0.95, 19.7, 0.23, 24.64, 0.78, 6.09, 0.52, 1.33, 2.82, 1.21, 7.55, 3.09, 2.38, 3.79]} \ No newline at end of file diff --git a/annotations_filtered/kQQfoIy7SNI_filtered.json b/annotations_filtered/kQQfoIy7SNI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd9f285b5a17d6b8790d880042ea75099cc1f983 --- /dev/null +++ b/annotations_filtered/kQQfoIy7SNI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 34.69], [35.0, 34.72], [35.0, 37.42], [39.0, 40.37]], "keep_status": [false, false, true, false], "silence_prob": [0.0, 0.0, 33.3, 0.0], "audiomae_on_audioset": [null, null, [["music", 29.8], ["animal", 11.98], ["throbbing", 7.06]], null], "duration": [32.69, -0.28, 2.42, 1.37]} \ No newline at end of file diff --git a/annotations_filtered/kQoFdaWI4h8_filtered.json b/annotations_filtered/kQoFdaWI4h8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cdc8ae2dd9dbc0a74cf1931b3ec93069c2b60a9e --- /dev/null +++ b/annotations_filtered/kQoFdaWI4h8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.86], [9.0, 10.07], [12.0, 13.53], [18.0, 21.2], [24.0, 24.93], [27.0, 58.92], [60.0, 72.1], [74.0, 74.56], [77.0, 78.68], [81.0, 110.1], [112.0, 119.18], [129.0, 129.32], [131.0, 130.74]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 58.05, 0.0, 0.0, 34.48, 0.0, 0.0, 32.58, 48.35, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 32.34], ["animal", 20.14], ["bow-wow", 4.8]], null, null, [["music", 56.79], ["fart", 6.76], ["speech", 6.63]], [["speech", 49.89], ["hum", 14.47], ["animal", 4.87]], null, null], "duration": [-0.14, 1.07, 1.53, 3.2, 0.93, 31.92, 12.1, 0.56, 1.68, 29.1, 7.18, 0.32, -0.26]} \ No newline at end of file diff --git a/annotations_filtered/kQrU0KRsCNo_filtered.json b/annotations_filtered/kQrU0KRsCNo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..053e620b2f88a657fe7177f2968108c9448071db --- /dev/null +++ b/annotations_filtered/kQrU0KRsCNo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.7], [14.0, 26.57], [28.0, 29.71], [30.0, 31.68], [33.0, 37.94], [40.0, 40.73], [41.0, 42.11], [44.0, 45.39], [47.0, 48.27], [51.0, 52.95], [55.0, 56.02], [58.0, 58.72], [61.0, 61.87], [63.0, 65.04], [66.0, 66.53], [68.0, 68.98], [71.0, 102.37], [103.0, 125.83], [130.0, 131.33], [133.0, 136.75], [139.0, 140.36], [145.0, 150.25], [151.0, 153.12], [155.0, 155.93], [160.0, 162.35], [163.0, 169.43]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 69.47, 0.0, 0.0, 49.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.44, 0.0, 0.0, 0.0, 52.86, 0.0, 59.51, 0.0, 39.24, 63.53, 0.0, 62.99, 54.23], "audiomae_on_audioset": [null, null, null, null, [["music", 48.49], ["frog", 9.66], ["speech", 5.61]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.61], ["quack", 13.14], ["duck", 3.16]], null, null, null, null], "duration": [0.7, 12.57, 1.71, 1.68, 4.94, 0.73, 1.11, 1.39, 1.27, 1.95, 1.02, 0.72, 0.87, 2.04, 0.53, 0.98, 31.37, 22.83, 1.33, 3.75, 1.36, 5.25, 2.12, 0.93, 2.35, 6.43]} \ No newline at end of file diff --git a/annotations_filtered/kR8Xje2x0sA_filtered.json b/annotations_filtered/kR8Xje2x0sA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42959b8d075401a7d7b723619553c86dd9846c61 --- /dev/null +++ b/annotations_filtered/kR8Xje2x0sA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.56], [7.0, 8.31], [13.0, 14.07], [16.0, 17.37], [20.0, 20.46], [40.0, 40.37], [45.0, 45.13], [52.0, 59.1], [59.0, 61.06], [62.0, 62.75], [63.0, 67.34], [71.0, 73.79], [77.0, 84.75], [86.0, 87.29], [88.0, 90.91], [96.0, 98.64], [101.0, 101.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.81, 89.36, 0.0, 76.53, 70.02, 70.44, 0.0, 80.11, 45.49, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 45.91], ["mains hum", 18.6], ["music", 16.41]], null], "duration": [1.56, 1.31, 1.07, 1.37, 0.46, 0.37, 0.13, 7.1, 2.06, 0.75, 4.34, 2.79, 7.75, 1.29, 2.91, 2.64, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/kRNhyHiBUXs_filtered.json b/annotations_filtered/kRNhyHiBUXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34e54b964e1f47cf9f3882dfba060b49f104d4c0 --- /dev/null +++ b/annotations_filtered/kRNhyHiBUXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.79], [20.0, 22.18], [23.0, 24.06], [25.0, 26.84], [35.0, 35.45], [43.0, 43.24], [49.0, 48.95], [50.0, 51.02], [59.0, 59.81], [61.0, 62.61], [82.0, 83.52], [86.0, 86.97], [102.0, 102.63], [104.0, 105.78], [109.0, 109.56], [110.0, 112.73], [114.0, 114.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 89.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.81, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.79, 2.18, 1.06, 1.84, 0.45, 0.24, -0.05, 1.02, 0.81, 1.61, 1.52, 0.97, 0.63, 1.78, 0.56, 2.73, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/kRWvfBinmWw_filtered.json b/annotations_filtered/kRWvfBinmWw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe2891c7264f3631a73ba97e0bb6b689064bc348 --- /dev/null +++ b/annotations_filtered/kRWvfBinmWw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.29], [22.0, 22.71], [23.0, 23.67], [24.0, 24.8], [25.0, 25.83], [26.0, 26.96], [27.0, 27.94], [28.0, 29.02], [29.0, 30.03], [30.0, 32.12], [32.0, 33.44], [36.0, 66.28], [69.0, 78.12], [84.0, 98.56], [101.0, 108.57], [111.0, 112.67], [115.0, 115.32], [123.0, 122.94], [125.0, 125.63], [129.0, 129.96], [132.0, 132.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 0.0, 0.0, 54.63, 36.98, 75.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 24.7], ["mains hum", 16.62], ["white noise", 6.78]], null, null, null, null, null, null, null], "duration": [0.29, 0.71, 0.67, 0.8, 0.83, 0.96, 0.94, 1.02, 1.03, 2.12, 1.44, 30.28, 9.12, 14.56, 7.57, 1.67, 0.32, -0.06, 0.63, 0.96, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/kReNcBdLDa8_filtered.json b/annotations_filtered/kReNcBdLDa8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..537bd156a16489c02e221a9fecbe3e897ee788a3 --- /dev/null +++ b/annotations_filtered/kReNcBdLDa8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.03], [17.0, 17.64], [20.0, 21.07], [35.0, 34.77], [36.0, 37.49], [38.0, 38.58]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [1.03, 0.64, 1.07, -0.23, 1.49, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/kRg5-TIF9LQ_filtered.json b/annotations_filtered/kRg5-TIF9LQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62773f8b73489197d1223ba6688b614c848c18ab --- /dev/null +++ b/annotations_filtered/kRg5-TIF9LQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.41], [8.0, 9.05], [10.0, 10.47], [12.0, 12.02], [14.0, 14.86], [16.0, 18.81], [21.0, 22.6], [26.0, 26.45], [29.0, 30.75], [33.0, 33.83], [35.0, 35.88], [36.0, 38.69], [40.0, 41.3], [43.0, 49.11], [50.0, 60.24], [62.0, 63.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 72.6, 0.0, 0.0, 0.0, 0.0, 0.0, 53.72, 0.0, 83.7, 50.46, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.41, 1.05, 0.47, 0.02, 0.86, 2.81, 1.6, 0.45, 1.75, 0.83, 0.88, 2.69, 1.3, 6.11, 10.24, 1.98]} \ No newline at end of file diff --git a/annotations_filtered/kRuKg_khl8Q_filtered.json b/annotations_filtered/kRuKg_khl8Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..435795a403c3dba48e06fe55754bb56363bacc1c --- /dev/null +++ b/annotations_filtered/kRuKg_khl8Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 17.68], [22.0, 25.08], [28.0, 28.27], [31.0, 39.16], [45.0, 48.17], [54.0, 55.14], [55.0, 55.17], [55.0, 55.21], [55.0, 55.34], [55.0, 55.49], [58.0, 61.45], [65.0, 66.8], [68.0, 68.66], [69.0, 69.57], [72.0, 71.73], [72.0, 83.44], [92.0, 100.65], [103.0, 108.6], [111.0, 110.86], [111.0, 114.3], [122.0, 121.9], [123.0, 124.77], [127.0, 129.81], [130.0, 131.11], [134.0, 139.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [59.33, 52.45, 0.0, 53.28, 43.45, 0.0, 0.0, 0.0, 0.0, 0.0, 43.66, 0.0, 0.0, 0.0, 0.0, 38.62, 36.52, 39.6, 0.0, 90.43, 0.0, 0.0, 71.43, 0.0, 87.19], "audiomae_on_audioset": [null, null, null, null, [["music", 59.95], ["bass guitar", 7.16], ["guitar", 5.7]], null, null, null, null, null, [["music", 84.01], ["musical instrument", 2.45], ["guitar", 1.47]], null, null, null, null, [["music", 83.26], ["bass guitar", 4.38], ["musical instrument", 1.57]], [["music", 87.96], ["musical instrument", 1.3], ["soundtrack music", 0.41]], [["music", 42.41], ["bass guitar", 8.44], ["guitar", 8.18]], null, null, null, null, null, null, null], "duration": [5.68, 3.08, 0.27, 8.16, 3.17, 1.14, 0.17, 0.21, 0.34, 0.49, 3.45, 1.8, 0.66, 0.57, -0.27, 11.44, 8.65, 5.6, -0.14, 3.3, -0.1, 1.77, 2.81, 1.11, 5.67]} \ No newline at end of file diff --git a/annotations_filtered/kRwFOUeh-Ro_filtered.json b/annotations_filtered/kRwFOUeh-Ro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb8a6fcfe667d80d33a087c0a6acac2482aae9e7 --- /dev/null +++ b/annotations_filtered/kRwFOUeh-Ro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.39], [14.0, 14.1], [19.0, 19.28], [25.0, 24.8], [26.0, 25.98], [28.0, 29.1], [30.0, 30.27]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.39, 0.1, 0.28, -0.2, -0.02, 1.1, 0.27]} \ No newline at end of file diff --git a/annotations_filtered/kSQaXjYkZpc_filtered.json b/annotations_filtered/kSQaXjYkZpc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcc142c942463220d1db8f25574c01043fe596d1 --- /dev/null +++ b/annotations_filtered/kSQaXjYkZpc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 21.47], [29.0, 48.96], [63.0, 63.68], [76.0, 87.22], [90.0, 94.34], [100.0, 100.57], [113.0, 122.81], [124.0, 124.38], [127.0, 133.17], [138.0, 143.04], [146.0, 148.86], [149.0, 159.26], [163.0, 163.58], [165.0, 166.6], [168.0, 172.64]], "keep_status": [true, true, false, true, false, false, false, false, true, false, true, false, false, false, true], "silence_prob": [29.67, 29.43, 0.0, 29.07, 31.15, 0.0, 29.8, 0.0, 31.24, 30.51, 28.81, 30.4, 0.0, 0.0, 30.69], "audiomae_on_audioset": [[["speech", 31.9], ["music", 18.68], ["boing", 16.88]], [["livestock, farm animals, working animals", 24.51], ["cattle, bovinae", 23.1], ["moo", 13.79]], null, [["music", 45.43], ["speech", 4.91], ["sound effect", 4.81]], [["music", 34.68], ["speech", 33.7], ["sidetone", 3.17]], null, [["speech", 59.46], ["music", 16.32], ["outside, rural or natural", 2.79]], null, [["music", 52.74], ["cattle, bovinae", 5.07], ["moo", 4.95]], [["cattle, bovinae", 44.85], ["moo", 21.23], ["livestock, farm animals, working animals", 7.82]], [["music", 36.57], ["mosquito", 15.94], ["fly, housefly", 12.35]], [["music", 39.51], ["speech", 35.93], ["vehicle", 1.96]], null, null, [["music", 18.81], ["hum", 12.46], ["noise", 11.6]]], "duration": [16.47, 19.96, 0.68, 11.22, 4.34, 0.57, 9.81, 0.38, 6.17, 5.04, 2.86, 10.26, 0.58, 1.6, 4.64]} \ No newline at end of file diff --git a/annotations_filtered/kS_QskTI8WI_filtered.json b/annotations_filtered/kS_QskTI8WI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40e9defc43bc143c78aa810cf451971b319a9e09 --- /dev/null +++ b/annotations_filtered/kS_QskTI8WI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 47.22], [50.0, 54.94], [62.0, 80.77], [81.0, 84.55], [86.0, 87.08], [88.0, 95.34], [99.0, 100.35], [101.0, 104.85], [106.0, 106.46], [109.0, 124.95], [127.0, 128.11], [133.0, 139.26], [141.0, 142.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [78.04, 65.67, 59.15, 83.16, 0.0, 72.46, 0.0, 63.42, 0.0, 51.18, 0.0, 65.2, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.22, 4.94, 18.77, 3.55, 1.08, 7.34, 1.35, 3.85, 0.46, 15.95, 1.11, 6.26, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/kSaOMRXiLVA_filtered.json b/annotations_filtered/kSaOMRXiLVA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..247eb6fb9fb8e59911cbe7f7a1241b08363f2bed --- /dev/null +++ b/annotations_filtered/kSaOMRXiLVA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.19], [16.0, 17.32], [18.0, 18.49], [27.0, 27.99], [29.0, 29.25], [31.0, 36.66], [41.0, 41.76], [43.0, 46.94], [48.0, 49.81], [51.0, 77.21], [79.0, 84.84], [89.0, 96.06], [97.0, 98.71], [103.0, 113.14], [116.0, 116.94], [120.0, 123.67]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 38.84, 0.0, 39.8, 0.0, 29.6, 31.05, 36.58, 0.0, 44.26, 0.0, 57.17], "audiomae_on_audioset": [null, null, null, null, null, [["music", 53.26], ["theremin", 11.21], ["effects unit", 7.9]], null, [["hum", 36.13], ["mains hum", 15.25], ["speech", 11.32]], null, [["music", 61.47], ["speech", 10.93], ["synthesizer", 4.6]], [["music", 47.31], ["sidetone", 11.93], ["speech", 10.59]], [["music", 39.43], ["fart", 4.57], ["synthesizer", 4.18]], null, [["insect", 39.31], ["music", 13.61], ["mosquito", 9.17]], null, null], "duration": [1.19, 1.32, 0.49, 0.99, 0.25, 5.66, 0.76, 3.94, 1.81, 26.21, 5.84, 7.06, 1.71, 10.14, 0.94, 3.67]} \ No newline at end of file diff --git a/annotations_filtered/kSk0pCs4pGQ_filtered.json b/annotations_filtered/kSk0pCs4pGQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99ea1b4c742c43f18e3653ee0d978163009e5e81 --- /dev/null +++ b/annotations_filtered/kSk0pCs4pGQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.7], [3.0, 6.15], [8.0, 9.37], [11.0, 11.03], [16.0, 16.11], [17.0, 17.61], [27.0, 28.71], [35.0, 35.51], [37.0, 38.69], [41.0, 42.03], [44.0, 49.98], [58.0, 62.23], [74.0, 78.95], [79.0, 80.27], [81.0, 80.67], [84.0, 88.91], [102.0, 106.27], [115.0, 117.51], [119.0, 119.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, true, false, true, false], "silence_prob": [0.0, 94.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.34, 32.01, 29.06, 0.0, 0.0, 39.11, 29.11, 45.69, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["hum", 19.88], ["mains hum", 16.02], ["speech", 15.55]], [["music", 48.21], ["speech", 10.08], ["scary music", 3.6]], [["speech", 51.83], ["music", 11.77], ["dog", 3.2]], null, null, [["music", 43.07], ["speech", 7.58], ["sine wave", 4.14]], [["speech", 66.01], ["music", 8.98], ["inside, small room", 2.12]], [["speech", 60.4], ["cattle, bovinae", 4.21], ["animal", 4.18]], null], "duration": [0.7, 3.15, 1.37, 0.03, 0.11, 0.61, 1.71, 0.51, 1.69, 1.03, 5.98, 4.23, 4.95, 1.27, -0.33, 4.91, 4.27, 2.51, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/kSmAfIP9CoQ_filtered.json b/annotations_filtered/kSmAfIP9CoQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4928f950ca646f4c00d6cdd08218ad887e6e50dd --- /dev/null +++ b/annotations_filtered/kSmAfIP9CoQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.21], [12.0, 12.36], [14.0, 15.16], [19.0, 19.65], [22.0, 25.61], [28.0, 28.49], [30.0, 31.67], [33.0, 33.99], [36.0, 35.82], [39.0, 42.65], [44.0, 49.4], [50.0, 55.34], [57.0, 59.61], [62.0, 83.39], [84.0, 98.46], [102.0, 103.01], [104.0, 103.92], [104.0, 145.23], [146.0, 146.42]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, true, true, false, false, false, false, false, false], "silence_prob": [40.28, 0.0, 0.0, 0.0, 45.11, 0.0, 0.0, 0.0, 0.0, 34.82, 33.4, 33.1, 33.36, 32.42, 34.42, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 64.14], ["pulse", 5.68], ["croak", 2.68]], null, null, null, [["music", 63.73], ["hum", 3.2], ["ambient music", 3.18]], null, null, null, null, [["music", 23.42], ["mains hum", 23.38], ["hum", 18.4]], [["speech", 33.26], ["vehicle", 12.49], ["hum", 8.34]], [["hum", 24.01], ["music", 23.56], ["mains hum", 10.87]], [["music", 45.47], ["whip", 11.61], ["electronic music", 4.0]], [["music", 67.37], ["electronic music", 5.38], ["speech", 5.06]], [["hum", 36.58], ["mains hum", 25.09], ["throbbing", 22.45]], null, null, null, null], "duration": [2.21, 0.36, 1.16, 0.65, 3.61, 0.49, 1.67, 0.99, -0.18, 3.65, 5.4, 5.34, 2.61, 21.39, 14.46, 1.01, -0.08, 41.23, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/kSyIRLpdmlA_filtered.json b/annotations_filtered/kSyIRLpdmlA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aade58806a1d9d782185872505ed2edf27b0a15b --- /dev/null +++ b/annotations_filtered/kSyIRLpdmlA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.11], [20.0, 20.46], [21.0, 22.28], [23.0, 25.1], [26.0, 33.74], [42.0, 52.51], [55.0, 71.37], [73.0, 76.35], [78.0, 80.37], [81.0, 84.03], [87.0, 88.38], [90.0, 93.43], [94.0, 95.35], [99.0, 102.14], [103.0, 103.65], [110.0, 110.84], [114.0, 117.9], [119.0, 120.61], [122.0, 123.58], [125.0, 128.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 98.19, 100.0, 99.99, 100.0, 99.98, 100.0, 100.0, 0.0, 99.97, 0.0, 95.78, 0.0, 0.0, 91.81, 0.0, 0.0, 45.27], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 17.38], ["musical instrument", 10.3], ["drum machine", 8.28]]], "duration": [1.11, 0.46, 1.28, 2.1, 7.74, 10.51, 16.37, 3.35, 2.37, 3.03, 1.38, 3.43, 1.35, 3.14, 0.65, 0.84, 3.9, 1.61, 1.58, 3.24]} \ No newline at end of file diff --git a/annotations_filtered/kTKIACVqDzQ_filtered.json b/annotations_filtered/kTKIACVqDzQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f1f181c05a03e5a12b6b265218e78946adaa706 --- /dev/null +++ b/annotations_filtered/kTKIACVqDzQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 25.17], [26.0, 26.79], [30.0, 32.32], [33.0, 36.19], [37.0, 47.17], [48.0, 56.19], [58.0, 62.95], [64.0, 70.78], [71.0, 73.7], [76.0, 78.98], [81.0, 84.38], [86.0, 90.19], [92.0, 92.57], [95.0, 104.58], [108.0, 109.61], [110.0, 111.69], [112.0, 117.56], [119.0, 122.66], [126.0, 130.81], [132.0, 136.38], [139.0, 145.99], [147.0, 148.27], [151.0, 152.52], [154.0, 157.23], [158.0, 159.24], [161.0, 162.9], [166.0, 166.5], [167.0, 169.55], [170.0, 171.78], [172.0, 171.86], [172.0, 172.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [79.07, 0.0, 99.73, 99.9, 98.99, 74.76, 81.35, 54.97, 97.73, 93.76, 99.48, 88.28, 0.0, 78.04, 0.0, 0.0, 93.91, 91.13, 98.19, 96.17, 91.98, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 57.89, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.17, 0.79, 2.32, 3.19, 10.17, 8.19, 4.95, 6.78, 2.7, 2.98, 3.38, 4.19, 0.57, 9.58, 1.61, 1.69, 5.56, 3.66, 4.81, 4.38, 6.99, 1.27, 1.52, 3.23, 1.24, 1.9, 0.5, 2.55, 1.78, -0.14, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/kTNDYiONld8_filtered.json b/annotations_filtered/kTNDYiONld8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92c5c59500a48559a2e00bf733db7dd1024d33ab --- /dev/null +++ b/annotations_filtered/kTNDYiONld8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 133.96], [134.0, 162.51]], "keep_status": [false, false], "silence_prob": [0.0, 29.04], "audiomae_on_audioset": [null, [["music", 66.75], ["throbbing", 10.65], ["hum", 4.99]]], "duration": [88.96, 28.51]} \ No newline at end of file diff --git a/annotations_filtered/kTUnQubJMoc_filtered.json b/annotations_filtered/kTUnQubJMoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e0d249262e4abf6357525c60032f6c16ba3275c --- /dev/null +++ b/annotations_filtered/kTUnQubJMoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.67], [26.0, 26.38], [31.0, 32.95], [37.0, 39.46], [40.0, 65.6], [66.0, 67.39], [68.0, 71.85], [72.0, 92.94], [94.0, 111.97], [115.0, 116.92], [118.0, 119.89], [121.0, 121.41], [127.0, 127.67], [129.0, 130.49]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 78.55, 34.73, 0.0, 98.8, 96.42, 67.89, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["sine wave", 19.76], ["music", 13.78], ["noise", 11.87]], null, null, null, null, null, null, null, null, null], "duration": [0.67, 0.38, 1.95, 2.46, 25.6, 1.39, 3.85, 20.94, 17.97, 1.92, 1.89, 0.41, 0.67, 1.49]} \ No newline at end of file diff --git a/annotations_filtered/kTXppLCyuOk_filtered.json b/annotations_filtered/kTXppLCyuOk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7969a2d70868506edf2f3c4a64ec68594945bee0 --- /dev/null +++ b/annotations_filtered/kTXppLCyuOk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 39.6], [40.0, 41.4], [44.0, 44.63], [52.0, 59.53], [61.0, 62.88]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 43.03, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 46.98], ["brass instrument", 15.06], ["musical instrument", 6.59]], null], "duration": [-0.4, 1.4, 0.63, 7.53, 1.88]} \ No newline at end of file diff --git a/annotations_filtered/kT_dXxp7eAo_filtered.json b/annotations_filtered/kT_dXxp7eAo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..815c10429a1ce3a949595c895f755e086cb11c91 --- /dev/null +++ b/annotations_filtered/kT_dXxp7eAo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.5], [14.0, 15.01], [16.0, 20.01], [27.0, 30.33], [33.0, 51.02], [52.0, 52.98], [55.0, 56.32], [61.0, 72.25], [76.0, 76.99], [80.0, 92.6], [99.0, 102.03], [103.0, 103.03], [103.0, 103.5], [104.0, 104.53], [105.0, 107.72]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [41.03, 0.0, 31.08, 35.35, 32.07, 0.0, 0.0, 31.71, 0.0, 32.96, 32.59, 0.0, 0.0, 0.0, 31.0], "audiomae_on_audioset": [[["music", 24.34], ["throbbing", 6.82], ["hum", 4.49]], null, [["music", 60.33], ["sidetone", 7.07], ["throbbing", 4.1]], [["music", 75.78], ["sidetone", 3.3], ["electronic music", 2.34]], [["music", 42.78], ["speech", 31.22], ["throbbing", 2.55]], null, null, [["music", 39.62], ["speech", 23.26], ["hum", 10.08]], null, [["music", 72.83], ["speech", 6.01], ["musical instrument", 3.72]], [["music", 44.87], ["electronic music", 10.81], ["throbbing", 7.29]], null, null, null, [["music", 46.46], ["throbbing", 9.1], ["fly, housefly", 4.98]]], "duration": [2.5, 1.01, 4.01, 3.33, 18.02, 0.98, 1.32, 11.25, 0.99, 12.6, 3.03, 0.03, 0.5, 0.53, 2.72]} \ No newline at end of file diff --git a/annotations_filtered/kTk2jXiuo9s_filtered.json b/annotations_filtered/kTk2jXiuo9s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..93966682ac0291a8aeb7240c37fcc707303bbd23 --- /dev/null +++ b/annotations_filtered/kTk2jXiuo9s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.14], [9.0, 10.25], [22.0, 22.91], [24.0, 23.6], [24.0, 23.7]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [1.14, 1.25, 0.91, -0.4, -0.3]} \ No newline at end of file diff --git a/annotations_filtered/kTnEyRLMvqk_filtered.json b/annotations_filtered/kTnEyRLMvqk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a81c08bfcc9b899de6fba423d41ac5a85730770f --- /dev/null +++ b/annotations_filtered/kTnEyRLMvqk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.96], [4.0, 4.89], [7.0, 7.97], [13.0, 20.53], [23.0, 25.62], [27.0, 30.89], [33.0, 39.34], [40.0, 40.41], [41.0, 43.09], [45.0, 52.0], [56.0, 55.75], [56.0, 60.52], [62.0, 71.83], [74.0, 73.94], [83.0, 86.97], [88.0, 88.35], [94.0, 97.8], [99.0, 121.05], [121.0, 122.27], [125.0, 125.17]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 77.87, 90.95, 31.5, 37.02, 0.0, 38.06, 32.2, 0.0, 31.43, 33.22, 0.0, 48.35, 0.0, 29.54, 53.1, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 47.4], ["boing", 34.47], ["musical instrument", 1.36]], [["music", 59.2], ["speech", 14.12], ["musical instrument", 2.0]], null, [["music", 40.08], ["speech", 18.98], ["sidetone", 7.43]], [["moo", 33.98], ["cattle, bovinae", 26.7], ["livestock, farm animals, working animals", 13.77]], null, [["boing", 42.3], ["music", 29.89], ["moo", 5.23]], [["music", 74.23], ["beatboxing", 16.87], ["speech", 1.07]], null, [["music", 31.88], ["speech", 8.1], ["throbbing", 7.49]], null, [["moo", 32.03], ["cattle, bovinae", 27.86], ["livestock, farm animals, working animals", 18.29]], null, null, null], "duration": [-0.04, 0.89, 0.97, 7.53, 2.62, 3.89, 6.34, 0.41, 2.09, 7.0, -0.25, 4.52, 9.83, -0.06, 3.97, 0.35, 3.8, 22.05, 1.27, 0.17]} \ No newline at end of file diff --git a/annotations_filtered/kTtxe4pWpfQ_filtered.json b/annotations_filtered/kTtxe4pWpfQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/kTtxe4pWpfQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/kU5tlt5wTcc_filtered.json b/annotations_filtered/kU5tlt5wTcc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a16cc458a733d8f3f035bb69fe80f64be945242a --- /dev/null +++ b/annotations_filtered/kU5tlt5wTcc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.3], [13.0, 21.15], [23.0, 24.27], [30.0, 31.6], [39.0, 66.56], [69.0, 72.52], [76.0, 86.17], [87.0, 87.84], [88.0, 89.11], [92.0, 92.23], [93.0, 93.95], [95.0, 95.59], [96.0, 105.29], [109.0, 109.36], [109.0, 109.46], [110.0, 112.4], [116.0, 116.29]], "keep_status": [true, false, false, false, true, true, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [30.79, 29.96, 0.0, 0.0, 30.08, 31.32, 30.74, 0.0, 0.0, 0.0, 0.0, 0.0, 32.64, 0.0, 0.0, 39.37, 0.0], "audiomae_on_audioset": [[["speech", 37.52], ["music", 17.69], ["boing", 7.67]], [["speech", 58.38], ["vehicle", 9.83], ["race car, auto racing", 3.21]], null, null, [["music", 30.25], ["speech", 26.82], ["vehicle", 10.94]], [["speech", 38.15], ["vehicle", 13.48], ["hum", 12.62]], [["speech", 54.39], ["vehicle", 14.49], ["music", 6.89]], null, null, null, null, null, [["livestock, farm animals, working animals", 24.73], ["speech", 15.19], ["moo", 13.14]], null, null, [["fireworks", 16.01], ["cattle, bovinae", 11.51], ["speech", 11.44]], null], "duration": [4.3, 8.15, 1.27, 1.6, 27.56, 3.52, 10.17, 0.84, 1.11, 0.23, 0.95, 0.59, 9.29, 0.36, 0.46, 2.4, 0.29]} \ No newline at end of file diff --git a/annotations_filtered/kU74wgKk8lo_filtered.json b/annotations_filtered/kU74wgKk8lo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a204622030dc7c55fb08215cf1576f2c3e4d968 --- /dev/null +++ b/annotations_filtered/kU74wgKk8lo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.56], [18.0, 20.53], [26.0, 26.08], [28.0, 31.11], [32.0, 32.93], [34.0, 35.21], [39.0, 40.83], [43.0, 43.5], [45.0, 45.1], [49.0, 49.86], [51.0, 52.17], [53.0, 61.65], [63.0, 65.04], [65.0, 83.94], [85.0, 89.65], [92.0, 122.61]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 48.95, 0.0, 36.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.51, 29.62, 30.83, 30.03, 0.0], "audiomae_on_audioset": [null, [["speech", 24.99], ["whale vocalization", 13.64], ["fly, housefly", 9.16]], null, [["speech", 53.42], ["hum", 8.01], ["music", 6.09]], null, null, null, null, null, null, null, null, [["music", 65.77], ["breaking", 12.18], ["thump, thud", 3.5]], [["hum", 23.54], ["speech", 14.82], ["music", 10.5]], [["whale vocalization", 50.8], ["livestock, farm animals, working animals", 12.78], ["music", 7.56]], null], "duration": [0.56, 2.53, 0.08, 3.11, 0.93, 1.21, 1.83, 0.5, 0.1, 0.86, 1.17, 8.65, 2.04, 18.94, 4.65, 30.61]} \ No newline at end of file diff --git a/annotations_filtered/kUAXs0LhD6I_filtered.json b/annotations_filtered/kUAXs0LhD6I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..266e057c0b1cf3d14525819afef34de70079475c --- /dev/null +++ b/annotations_filtered/kUAXs0LhD6I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.62], [5.0, 6.25], [9.0, 10.62], [11.0, 11.79], [14.0, 14.54], [15.0, 15.82], [18.0, 19.25], [23.0, 24.21], [25.0, 27.68], [30.0, 31.77], [33.0, 34.3], [35.0, 35.23], [38.0, 38.65], [40.0, 41.08], [42.0, 41.91], [44.0, 44.05], [45.0, 45.01], [45.0, 53.1], [54.0, 54.04], [55.0, 55.38], [56.0, 56.46], [57.0, 59.05], [60.0, 60.45], [62.0, 63.53], [66.0, 66.11], [73.0, 73.06], [73.0, 76.72], [77.0, 78.56], [80.0, 79.98], [80.0, 81.99], [85.0, 88.15], [89.0, 90.56], [91.0, 92.15], [101.0, 102.34], [103.0, 103.71], [105.0, 106.34], [108.0, 108.84], [111.0, 112.28], [113.0, 114.12], [123.0, 125.25], [126.0, 128.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.55, 0.0, 0.0, 0.0, 99.82, 0.0, 0.0, 0.0, 0.0, 60.14, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.64, 99.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.62, 1.25, 1.62, 0.79, 0.54, 0.82, 1.25, 1.21, 2.68, 1.77, 1.3, 0.23, 0.65, 1.08, -0.09, 0.05, 0.01, 8.1, 0.04, 0.38, 0.46, 2.05, 0.45, 1.53, 0.11, 0.06, 3.72, 1.56, -0.02, 1.99, 3.15, 1.56, 1.15, 1.34, 0.71, 1.34, 0.84, 1.28, 1.12, 2.25, 2.11]} \ No newline at end of file diff --git a/annotations_filtered/kV36CHsDZ_c_filtered.json b/annotations_filtered/kV36CHsDZ_c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27b7dac194ae4054466a18dc728e6002d9e6ed96 --- /dev/null +++ b/annotations_filtered/kV36CHsDZ_c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[121.0, 125.14], [127.0, 128.26]], "keep_status": [true, false], "silence_prob": [32.44, 0.0], "audiomae_on_audioset": [[["music", 16.45], ["throbbing", 8.48], ["noise", 6.81]], null], "duration": [4.14, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/kVPIOjjbIpY_filtered.json b/annotations_filtered/kVPIOjjbIpY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd0c090d6765c8a4b3779329f96ebdba4065bbee --- /dev/null +++ b/annotations_filtered/kVPIOjjbIpY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.93], [16.0, 17.2], [20.0, 21.05], [22.0, 22.44], [38.0, 62.68], [64.0, 63.9], [65.0, 65.96], [69.0, 71.05], [75.0, 86.26], [87.0, 94.09], [95.0, 99.79], [103.0, 105.81], [107.0, 113.1], [116.0, 123.87], [125.0, 125.93], [127.0, 127.3], [128.0, 130.74], [131.0, 133.39], [134.0, 134.92], [136.0, 139.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 77.36, 0.0, 0.0, 99.21, 81.71, 81.17, 70.72, 79.24, 88.46, 77.03, 0.0, 0.0, 76.37, 93.29, 0.0, 94.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.93, 1.2, 1.05, 0.44, 24.68, -0.1, 0.96, 2.05, 11.26, 7.09, 4.79, 2.81, 6.1, 7.87, 0.93, 0.3, 2.74, 2.39, 0.92, 3.92]} \ No newline at end of file diff --git a/annotations_filtered/kVXAITzqSgc_filtered.json b/annotations_filtered/kVXAITzqSgc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a0fb0c09f75be9461f15432a6850a5b42ec59b5 --- /dev/null +++ b/annotations_filtered/kVXAITzqSgc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 24.87], [29.0, 44.9], [54.0, 54.67], [61.0, 97.02], [98.0, 100.09], [103.0, 119.5], [120.0, 124.63], [126.0, 127.04], [127.0, 136.58], [137.0, 137.98], [139.0, 140.29], [143.0, 143.33], [144.0, 150.26], [150.0, 150.45], [150.0, 153.12]], "keep_status": [false, true, false, false, true, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 34.48, 0.0, 0.0, 36.83, 34.69, 35.73, 0.0, 38.23, 0.0, 0.0, 0.0, 48.95, 0.0, 45.95], "audiomae_on_audioset": [null, [["music", 26.69], ["cello", 18.84], ["double bass", 16.61]], null, null, [["music", 29.45], ["double bass", 14.56], ["musical instrument", 9.45]], [["music", 46.84], ["foghorn", 19.84], ["double bass", 6.98]], [["music", 56.95], ["double bass", 7.57], ["cello", 6.71]], null, [["music", 53.8], ["foghorn", 7.46], ["synthesizer", 5.79]], null, null, null, [["music", 67.51], ["theremin", 4.85], ["musical instrument", 3.06]], null, [["music", 47.66], ["theremin", 24.68], ["musical instrument", 6.88]]], "duration": [-0.13, 15.9, 0.67, 36.02, 2.09, 16.5, 4.63, 1.04, 9.58, 0.98, 1.29, 0.33, 6.26, 0.45, 3.12]} \ No newline at end of file diff --git a/annotations_filtered/kVbmTKqZ31M_filtered.json b/annotations_filtered/kVbmTKqZ31M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a00a605d4c2710e835281435810e0616cca93e9 --- /dev/null +++ b/annotations_filtered/kVbmTKqZ31M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.94], [11.0, 11.8], [13.0, 17.39], [19.0, 24.17], [25.0, 32.85], [34.0, 35.8], [37.0, 42.87], [47.0, 50.48], [51.0, 55.78], [58.0, 58.92], [61.0, 62.18], [63.0, 64.81], [66.0, 72.2], [73.0, 74.49], [76.0, 76.35], [78.0, 81.51], [86.0, 86.78], [89.0, 93.46]], "keep_status": [true, false, true, true, true, false, true, true, true, false, false, false, true, false, false, true, false, true], "silence_prob": [43.43, 0.0, 44.93, 36.73, 39.91, 0.0, 36.47, 48.74, 35.84, 0.0, 0.0, 0.0, 39.15, 0.0, 0.0, 39.24, 0.0, 41.03], "audiomae_on_audioset": [[["music", 36.62], ["sonar", 25.49], ["whale vocalization", 4.23]], null, [["sine wave", 25.21], ["hum", 24.36], ["chirp tone", 12.02]], [["hum", 18.12], ["sonar", 14.22], ["music", 13.98]], [["sonar", 28.09], ["hum", 26.91], ["music", 11.04]], null, [["throbbing", 22.98], ["rumble", 14.12], ["hum", 14.04]], [["music", 22.65], ["speech", 21.68], ["rumble", 5.53]], [["speech", 38.4], ["music", 9.2], ["hum", 9.15]], null, null, null, [["speech", 31.49], ["gong", 12.54], ["music", 11.5]], null, null, [["speech", 32.32], ["music", 18.91], ["whale vocalization", 5.07]], null, [["music", 53.33], ["musical instrument", 4.39], ["theremin", 4.02]]], "duration": [3.94, 0.8, 4.39, 5.17, 7.85, 1.8, 5.87, 3.48, 4.78, 0.92, 1.18, 1.81, 6.2, 1.49, 0.35, 3.51, 0.78, 4.46]} \ No newline at end of file diff --git a/annotations_filtered/kVujmsfAIUk_filtered.json b/annotations_filtered/kVujmsfAIUk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..effd36ef0659e2f3bf200f7979f89bf4e6bf3904 --- /dev/null +++ b/annotations_filtered/kVujmsfAIUk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.11], [26.0, 27.11], [28.0, 47.75], [48.0, 48.93], [51.0, 51.63], [54.0, 54.55], [55.0, 56.32], [58.0, 64.03], [65.0, 65.74], [70.0, 70.24], [71.0, 71.39], [80.0, 80.15], [82.0, 81.84], [83.0, 87.56], [89.0, 89.67], [99.0, 99.5], [102.0, 102.9], [110.0, 114.91], [117.0, 117.44], [125.0, 125.56], [127.0, 127.68], [131.0, 131.45], [132.0, 136.61], [137.0, 136.71], [137.0, 137.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 54.7, 0.0, 0.0, 0.0, 0.0, 39.82, 0.0, 0.0, 0.0, 0.0, 0.0, 38.35, 0.0, 0.0, 0.0, 41.7, 0.0, 0.0, 0.0, 0.0, 40.55, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 60.48], ["sidetone", 13.09], ["noise", 10.35]], null, null, null, null, null, [["speech", 77.13], ["sidetone", 5.67], ["speech synthesizer", 5.23]], null, null, null, [["speech", 78.7], ["sidetone", 2.03], ["grunt", 1.56]], null, null, null, null, [["speech", 71.56], ["radio", 8.18], ["male speech, man speaking", 3.25]], null, null], "duration": [1.11, 1.11, 19.75, 0.93, 0.63, 0.55, 1.32, 6.03, 0.74, 0.24, 0.39, 0.15, -0.16, 4.56, 0.67, 0.5, 0.9, 4.91, 0.44, 0.56, 0.68, 0.45, 4.61, -0.29, 0.37]} \ No newline at end of file diff --git a/annotations_filtered/kW7IPAaL7I4_filtered.json b/annotations_filtered/kW7IPAaL7I4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d606252d6c1fa2d4083c2b5550a9f989915f1798 --- /dev/null +++ b/annotations_filtered/kW7IPAaL7I4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 40.86], [45.0, 45.3], [46.0, 47.46], [52.0, 52.29], [59.0, 60.37], [65.0, 65.2], [71.0, 71.25], [72.0, 72.12], [74.0, 75.71], [76.0, 76.47], [79.0, 78.65], [81.0, 81.58], [83.0, 84.08], [84.0, 93.04], [96.0, 95.69], [100.0, 100.94], [103.0, 103.62], [104.0, 104.4], [109.0, 111.38], [116.0, 116.67], [120.0, 120.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [70.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.21, 0.0, 0.0, 0.0, 0.0, 98.59, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.86, 0.3, 1.46, 0.29, 1.37, 0.2, 0.25, 0.12, 1.71, 0.47, -0.35, 0.58, 1.08, 9.04, -0.31, 0.94, 0.62, 0.4, 2.38, 0.67, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/kWHOafRR0Sk_filtered.json b/annotations_filtered/kWHOafRR0Sk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9d8bc2e434f279e6266cab8e84d1d625e022cf4 --- /dev/null +++ b/annotations_filtered/kWHOafRR0Sk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 31.95], [33.0, 33.32], [34.0, 37.59], [43.0, 43.44], [47.0, 48.61], [50.0, 52.89], [90.0, 91.0]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.71, 0.0, 0.0, 87.74, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.95, 0.32, 3.59, 0.44, 1.61, 2.89, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/kWPc7z2IMkA_filtered.json b/annotations_filtered/kWPc7z2IMkA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c5c133e957a3e2c13114b2feae601617e9e95b9 --- /dev/null +++ b/annotations_filtered/kWPc7z2IMkA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.22], [3.0, 16.02], [17.0, 18.79], [19.0, 21.14], [22.0, 24.29], [26.0, 28.17], [29.0, 30.16], [31.0, 34.59], [35.0, 40.19], [41.0, 42.85], [44.0, 47.04], [48.0, 51.48], [54.0, 61.38], [62.0, 75.9], [77.0, 79.73], [81.0, 81.5], [84.0, 85.29], [87.0, 87.24], [89.0, 89.06], [91.0, 91.25], [95.0, 97.34], [98.0, 102.17], [103.0, 106.25], [109.0, 111.15], [113.0, 115.38], [123.0, 124.85], [126.0, 126.93], [129.0, 131.04]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false, false, true, true, false, false, false, false, false, true, true, true, true, false, false, false, true], "silence_prob": [37.15, 39.99, 0.0, 61.27, 45.33, 61.97, 0.0, 49.31, 71.14, 0.0, 99.76, 92.8, 99.73, 38.3, 39.54, 0.0, 0.0, 0.0, 0.0, 0.0, 35.85, 35.85, 40.59, 35.74, 33.74, 0.0, 0.0, 35.42], "audiomae_on_audioset": [[["sidetone", 22.16], ["music", 13.24], ["chirp tone", 10.63]], [["music", 57.0], ["speech", 20.57], ["didgeridoo", 4.05]], null, null, [["tuning fork", 57.0], ["speech", 12.95], ["sidetone", 7.39]], null, null, [["music", 51.34], ["musical instrument", 10.27], ["speech", 7.09]], null, null, null, null, null, [["speech", 46.6], ["hum", 8.9], ["mains hum", 8.2]], [["music", 29.82], ["gong", 21.18], ["hum", 11.76]], null, null, null, null, null, [["hum", 39.65], ["music", 16.42], ["throbbing", 8.36]], [["music", 30.39], ["throbbing", 11.13], ["speech", 9.29]], [["music", 38.77], ["hum", 9.29], ["throbbing", 6.25]], [["hum", 22.11], ["music", 18.28], ["throbbing", 8.2]], [["music", 34.7], ["speech", 27.73], ["didgeridoo", 26.21]], null, null, [["music", 44.94], ["sidetone", 11.14], ["effects unit", 8.08]]], "duration": [2.22, 13.02, 1.79, 2.14, 2.29, 2.17, 1.16, 3.59, 5.19, 1.85, 3.04, 3.48, 7.38, 13.9, 2.73, 0.5, 1.29, 0.24, 0.06, 0.25, 2.34, 4.17, 3.25, 2.15, 2.38, 1.85, 0.93, 2.04]} \ No newline at end of file diff --git a/annotations_filtered/kWjZx3bSDHI_filtered.json b/annotations_filtered/kWjZx3bSDHI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ffde3f05147adbe84957341710725397f53e9ec0 --- /dev/null +++ b/annotations_filtered/kWjZx3bSDHI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.61], [19.0, 20.8], [22.0, 24.65], [25.0, 26.57], [28.0, 29.64], [31.0, 34.48], [43.0, 43.21], [49.0, 50.57], [53.0, 56.64], [59.0, 60.62], [61.0, 63.29], [64.0, 65.28], [66.0, 68.47], [69.0, 71.56], [72.0, 73.52], [74.0, 82.31], [84.0, 94.0], [97.0, 97.36], [98.0, 104.65], [110.0, 113.17], [116.0, 116.46], [118.0, 120.04], [121.0, 131.11], [132.0, 138.72], [140.0, 140.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 69.61, 0.0, 0.0, 52.86, 0.0, 0.0, 75.55, 0.0, 53.72, 0.0, 75.55, 77.53, 0.0, 75.07, 65.91, 0.0, 58.22, 83.7, 0.0, 76.53, 78.55, 84.43, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.61, 1.8, 2.65, 1.57, 1.64, 3.48, 0.21, 1.57, 3.64, 1.62, 2.29, 1.28, 2.47, 2.56, 1.52, 8.31, 10.0, 0.36, 6.65, 3.17, 0.46, 2.04, 10.11, 6.72, 0.86]} \ No newline at end of file diff --git a/annotations_filtered/kWoC8yYqPJk_filtered.json b/annotations_filtered/kWoC8yYqPJk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f7fabacb552a8f9fe0ad97960a31541b9082a00 --- /dev/null +++ b/annotations_filtered/kWoC8yYqPJk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.04], [18.0, 20.7], [23.0, 24.48], [28.0, 31.11], [35.0, 37.37], [42.0, 44.47], [45.0, 47.01], [49.0, 51.21], [52.0, 52.47], [66.0, 65.94], [67.0, 68.0], [70.0, 69.89], [71.0, 71.81], [73.0, 73.89], [75.0, 75.39], [77.0, 77.01], [82.0, 83.69], [91.0, 92.23], [93.0, 94.07], [97.0, 97.09]], "keep_status": [false, true, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 43.53, 0.0, 38.4, 41.7, 53.22, 70.44, 32.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["bleat", 27.02], ["sheep", 24.64], ["oink", 9.07]], null, [["thunk", 58.08], ["sheep", 3.32], ["whack, thwack", 3.15]], [["speech", 25.77], ["throbbing", 21.21], ["heart sounds, heartbeat", 9.61]], null, null, [["whack, thwack", 11.05], ["music", 10.54], ["speech", 10.27]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.04, 2.7, 1.48, 3.11, 2.37, 2.47, 2.01, 2.21, 0.47, -0.06, 1.0, -0.11, 0.81, 0.89, 0.39, 0.01, 1.69, 1.23, 1.07, 0.09]} \ No newline at end of file diff --git a/annotations_filtered/kWrOmEtXk0k_filtered.json b/annotations_filtered/kWrOmEtXk0k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d143290f9020a3330f10a3e7c16b99f5a8a9147 --- /dev/null +++ b/annotations_filtered/kWrOmEtXk0k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 36.22], [37.0, 39.36], [40.0, 40.59], [44.0, 45.67], [50.0, 53.22], [57.0, 72.82], [76.0, 116.41], [118.0, 120.34], [122.0, 123.77], [126.0, 128.58], [131.0, 134.86], [136.0, 141.79], [149.0, 153.99], [155.0, 159.43], [160.0, 163.66], [168.0, 173.72]], "keep_status": [true, true, false, false, false, false, false, false, false, false, true, false, false, false, true, true], "silence_prob": [34.51, 35.26, 0.0, 0.0, 31.49, 31.74, 0.0, 89.72, 0.0, 89.54, 43.33, 65.55, 50.41, 55.46, 37.98, 36.86], "audiomae_on_audioset": [[["music", 34.57], ["theremin", 21.44], ["whip", 10.82]], [["music", 31.8], ["guitar", 6.89], ["plucked string instrument", 5.49]], null, null, [["whip", 80.44], ["whack, thwack", 3.09], ["clang", 2.69]], [["music", 79.08], ["musical instrument", 4.66], ["speech", 2.24]], null, null, null, null, [["music", 49.14], ["musical instrument", 6.01], ["theremin", 5.22]], null, null, null, [["music", 50.02], ["throbbing", 8.35], ["hum", 6.04]], [["music", 27.3], ["sigh", 6.13], ["sound effect", 4.87]]], "duration": [23.22, 2.36, 0.59, 1.67, 3.22, 15.82, 40.41, 2.34, 1.77, 2.58, 3.86, 5.79, 4.99, 4.43, 3.66, 5.72]} \ No newline at end of file diff --git a/annotations_filtered/kXXnZuu72DA_filtered.json b/annotations_filtered/kXXnZuu72DA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aaf5cd179e3390457e19e45129f917695172209d --- /dev/null +++ b/annotations_filtered/kXXnZuu72DA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.49], [13.0, 20.41], [21.0, 20.61], [21.0, 20.93], [22.0, 41.2], [42.0, 59.97], [62.0, 78.04], [80.0, 80.22], [81.0, 95.22], [96.0, 96.2], [100.0, 107.42]], "keep_status": [false, true, false, false, false, true, true, false, false, false, true], "silence_prob": [0.0, 30.78, 0.0, 0.0, 31.54, 30.62, 30.74, 0.0, 30.02, 0.0, 30.79], "audiomae_on_audioset": [null, [["music", 43.16], ["didgeridoo", 17.54], ["animal", 7.38]], null, null, [["music", 63.67], ["speech", 16.1], ["whack, thwack", 3.03]], [["music", 52.41], ["speech", 11.34], ["fly, housefly", 4.39]], [["music", 59.38], ["speech", 4.39], ["musical instrument", 4.11]], null, [["music", 66.07], ["animal", 8.24], ["ding", 2.56]], null, [["music", 42.29], ["trombone", 14.86], ["musical instrument", 6.36]]], "duration": [0.49, 7.41, -0.39, -0.07, 19.2, 17.97, 16.04, 0.22, 14.22, 0.2, 7.42]} \ No newline at end of file diff --git a/annotations_filtered/kXvNxXDDHSY_filtered.json b/annotations_filtered/kXvNxXDDHSY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37b88c37d0ab56c0a443e5bda67b1434f32dfe4c --- /dev/null +++ b/annotations_filtered/kXvNxXDDHSY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.59], [21.0, 21.78], [24.0, 24.71], [29.0, 29.74], [32.0, 32.88], [41.0, 41.94], [43.0, 42.99], [52.0, 51.75], [64.0, 64.76], [68.0, 69.13], [73.0, 73.48], [81.0, 80.77], [90.0, 90.44], [102.0, 101.88], [124.0, 124.23], [125.0, 126.55], [149.0, 150.6], [152.0, 151.75], [153.0, 159.73], [163.0, 164.52], [166.0, 166.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.44, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 83.63], ["boing", 3.51], ["theremin", 0.91]], null, null], "duration": [0.59, 0.78, 0.71, 0.74, 0.88, 0.94, -0.01, -0.25, 0.76, 1.13, 0.48, -0.23, 0.44, -0.12, 0.23, 1.55, 1.6, -0.25, 6.73, 1.52, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/kXvfBvua7GY_filtered.json b/annotations_filtered/kXvfBvua7GY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9891a4d892d172e9e8fb779c56c288a7ff9d2f8 --- /dev/null +++ b/annotations_filtered/kXvfBvua7GY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.16], [7.0, 8.18], [36.0, 36.48], [42.0, 42.85], [59.0, 59.54]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.16, 1.18, 0.48, 0.85, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/kYA44FTePNQ_filtered.json b/annotations_filtered/kYA44FTePNQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7eeebb40641c6b12d96e40d20394c6d426c1b978 --- /dev/null +++ b/annotations_filtered/kYA44FTePNQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.29], [15.0, 16.77], [22.0, 24.31], [26.0, 26.74], [28.0, 29.3], [30.0, 31.82], [33.0, 37.15], [38.0, 70.53], [71.0, 76.47], [78.0, 88.45], [89.0, 107.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [62.37, 0.0, 91.64, 0.0, 0.0, 0.0, 59.15, 0.0, 96.66, 93.45, 54.43], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [2.29, 1.77, 2.31, 0.74, 1.3, 1.82, 4.15, 32.53, 5.47, 10.45, 18.96]} \ No newline at end of file diff --git a/annotations_filtered/kYA9hvcLekg_filtered.json b/annotations_filtered/kYA9hvcLekg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9e518fc2cc6c093def5a6cdc42c7b48580f813c --- /dev/null +++ b/annotations_filtered/kYA9hvcLekg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.46], [25.0, 30.06], [33.0, 33.52], [34.0, 35.26], [36.0, 37.59], [39.0, 39.82], [42.0, 41.93], [44.0, 48.17], [49.0, 60.99], [61.0, 69.79], [72.0, 91.13], [94.0, 111.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.01, 0.0, 0.0, 0.0, 0.0, 0.0, 97.0, 87.92, 94.37, 94.07, 98.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.46, 5.06, 0.52, 1.26, 1.59, 0.82, -0.07, 4.17, 11.99, 8.79, 19.13, 17.75]} \ No newline at end of file diff --git a/annotations_filtered/kYFrx0jdcoY_filtered.json b/annotations_filtered/kYFrx0jdcoY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1ab74cb50b00d2bfd9f76042f4c35f7be856d09 --- /dev/null +++ b/annotations_filtered/kYFrx0jdcoY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.52], [13.0, 13.51], [16.0, 16.48], [18.0, 17.85], [26.0, 26.97], [29.0, 31.14], [33.0, 33.47], [37.0, 37.86], [38.0, 38.62], [43.0, 43.33], [50.0, 51.65], [53.0, 56.52], [62.0, 77.62], [83.0, 96.55], [98.0, 97.82], [98.0, 99.23], [100.0, 100.97], [103.0, 103.79], [109.0, 109.56], [110.0, 113.81], [114.0, 116.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 61.47, 0.0, 0.0, 0.0, 0.0, 0.0, 95.91, 36.59, 37.26, 0.0, 0.0, 0.0, 0.0, 0.0, 35.4, 50.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["vehicle", 15.73], ["hum", 13.09], ["car", 9.56]], [["buzz", 21.48], ["hum", 12.0], ["noise", 8.64]], null, null, null, null, null, [["vehicle", 49.06], ["car", 17.53], ["speech", 11.45]], null], "duration": [0.52, 0.51, 0.48, -0.15, 0.97, 2.14, 0.47, 0.86, 0.62, 0.33, 1.65, 3.52, 15.62, 13.55, -0.18, 1.23, 0.97, 0.79, 0.56, 3.81, 2.33]} \ No newline at end of file diff --git a/annotations_filtered/kYHCKF2WLA8_filtered.json b/annotations_filtered/kYHCKF2WLA8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..187aba24236ca892ba200f1828b34d4fd70064ea --- /dev/null +++ b/annotations_filtered/kYHCKF2WLA8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.02], [13.0, 14.35], [17.0, 17.78], [25.0, 26.0], [36.0, 40.15], [47.0, 47.34], [55.0, 55.59], [62.0, 87.03], [87.0, 128.38]], "keep_status": [false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.57, 0.0, 0.0, 32.78, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 61.62], ["rumble", 14.91], ["music", 5.66]], null, null, [["music", 33.64], ["whale vocalization", 15.16], ["singing bowl", 12.73]], null], "duration": [1.02, 1.35, 0.78, 1.0, 4.15, 0.34, 0.59, 25.03, 41.38]} \ No newline at end of file diff --git a/annotations_filtered/kYQkkpRXgP4_filtered.json b/annotations_filtered/kYQkkpRXgP4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a70c0df779e4113c5d4022ed23d26da0f9a04884 --- /dev/null +++ b/annotations_filtered/kYQkkpRXgP4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.79], [9.0, 9.41], [14.0, 13.8], [15.0, 15.67], [18.0, 18.03], [19.0, 20.66], [21.0, 23.6], [25.0, 24.8], [26.0, 26.37], [27.0, 28.68], [30.0, 31.26], [35.0, 35.41], [37.0, 38.52], [43.0, 43.44], [52.0, 53.5], [55.0, 55.44], [56.0, 57.16], [59.0, 60.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.79, 0.41, -0.2, 0.67, 0.03, 1.66, 2.6, -0.2, 0.37, 1.68, 1.26, 0.41, 1.52, 0.44, 1.5, 0.44, 1.16, 1.86]} \ No newline at end of file diff --git a/annotations_filtered/kYcvOPf4GqE_filtered.json b/annotations_filtered/kYcvOPf4GqE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91b3eddcc081b82caf99026fc4d489d8e20b16d0 --- /dev/null +++ b/annotations_filtered/kYcvOPf4GqE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.09], [2.0, 3.13], [3.0, 3.65], [4.0, 5.63], [8.0, 8.53], [9.0, 9.66], [10.0, 10.71], [11.0, 13.24], [14.0, 14.77], [16.0, 16.5], [19.0, 18.94], [28.0, 28.49], [41.0, 41.47], [43.0, 43.19], [44.0, 44.15], [45.0, 46.52], [52.0, 54.68], [55.0, 58.19], [58.0, 61.89], [62.0, 63.14], [66.0, 66.77], [74.0, 76.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.76, 81.17, 67.76, 0.0, 0.0, 42.24], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 80.23], ["chirp tone", 7.38], ["speech", 6.57]]], "duration": [0.09, 1.13, 0.65, 1.63, 0.53, 0.66, 0.71, 2.24, 0.77, 0.5, -0.06, 0.49, 0.47, 0.19, 0.15, 1.52, 2.68, 3.19, 3.89, 1.14, 0.77, 2.52]} \ No newline at end of file diff --git a/annotations_filtered/kYlPBN4yMe0_filtered.json b/annotations_filtered/kYlPBN4yMe0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8163b4b119a07ae8b6f700574394f1a0aa8f8e2b --- /dev/null +++ b/annotations_filtered/kYlPBN4yMe0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 19.25], [35.0, 35.82], [41.0, 69.06], [71.0, 98.56], [102.0, 128.93], [131.0, 147.45], [148.0, 158.33], [158.0, 158.63], [159.0, 159.16], [159.0, 169.26]], "keep_status": [false, false, false, true, true, false, false, false, false, false], "silence_prob": [29.72, 0.0, 29.04, 29.37, 29.64, 29.56, 33.49, 0.0, 0.0, 35.07], "audiomae_on_audioset": [[["speech", 81.07], ["vehicle", 2.46], ["music", 1.8]], null, [["cattle, bovinae", 49.99], ["moo", 28.35], ["livestock, farm animals, working animals", 15.06]], [["hum", 21.72], ["music", 16.97], ["mains hum", 9.18]], [["music", 21.59], ["grunt", 18.12], ["groan", 14.18]], [["speech", 36.24], ["music", 20.36], ["hum", 14.36]], [["hum", 51.9], ["mains hum", 16.49], ["throbbing", 10.49]], null, null, [["music", 33.71], ["grunt", 27.88], ["hum", 12.79]]], "duration": [9.25, 0.82, 28.06, 27.56, 26.93, 16.45, 10.33, 0.63, 0.16, 10.26]} \ No newline at end of file diff --git a/annotations_filtered/kYlPy24WJzU_filtered.json b/annotations_filtered/kYlPy24WJzU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9909761d1a665beb4ed293e10401a6b70c33b92 --- /dev/null +++ b/annotations_filtered/kYlPy24WJzU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.64], [11.0, 14.49], [15.0, 16.85], [18.0, 19.33], [20.0, 22.11], [25.0, 26.49], [30.0, 31.04], [32.0, 32.73], [33.0, 33.69], [34.0, 36.21], [37.0, 37.91], [39.0, 39.68], [51.0, 51.31], [52.0, 53.69], [62.0, 61.91], [65.0, 65.8], [68.0, 68.0], [69.0, 76.64], [78.0, 79.2], [80.0, 82.56], [86.0, 88.96], [101.0, 102.49], [103.0, 103.77], [105.0, 107.18], [110.0, 112.43], [114.0, 113.93], [115.0, 118.17], [119.0, 119.79], [124.0, 123.8], [124.0, 124.51], [125.0, 126.05], [127.0, 126.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 60.6, 0.0, 0.0, 33.66, 0.0, 0.0, 0.0, 0.0, 62.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.19, 0.0, 40.45, 33.03, 0.0, 0.0, 33.47, 47.66, 0.0, 46.26, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 53.14], ["music", 20.38], ["didgeridoo", 3.38]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.33], ["speech", 26.11], ["fly, housefly", 2.8]], null, [["speech", 27.55], ["music", 17.5], ["fly, housefly", 7.05]], [["mains hum", 9.1], ["hum", 8.46], ["music", 7.09]], null, null, [["fart", 46.63], ["speech", 30.97], ["fly, housefly", 4.27]], [["music", 25.41], ["didgeridoo", 12.67], ["speech", 7.27]], null, [["speech", 23.02], ["music", 16.38], ["musical instrument", 4.24]], null, null, null, null, null], "duration": [1.64, 3.49, 1.85, 1.33, 2.11, 1.49, 1.04, 0.73, 0.69, 2.21, 0.91, 0.68, 0.31, 1.69, -0.09, 0.8, 0.0, 7.64, 1.2, 2.56, 2.96, 1.49, 0.77, 2.18, 2.43, -0.07, 3.17, 0.79, -0.2, 0.51, 1.05, -0.14]} \ No newline at end of file diff --git a/annotations_filtered/kZCgrTDVRbI_filtered.json b/annotations_filtered/kZCgrTDVRbI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2beb562a57f7a67e8c0eefae0b495df85962ae9b --- /dev/null +++ b/annotations_filtered/kZCgrTDVRbI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.21], [6.0, 6.76], [8.0, 9.34], [11.0, 11.82], [12.0, 14.25], [19.0, 20.33], [22.0, 23.45], [28.0, 29.66], [38.0, 47.33], [50.0, 51.12], [64.0, 68.96], [76.0, 76.5], [77.0, 76.71], [77.0, 77.26], [88.0, 94.07], [108.0, 111.08], [112.0, 112.75], [114.0, 116.11], [118.0, 118.22], [127.0, 130.18], [135.0, 135.58], [136.0, 137.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [67.63, 0.0, 0.0, 0.0, 91.47, 0.0, 0.0, 0.0, 73.36, 0.0, 48.87, 0.0, 0.0, 0.0, 98.99, 91.98, 0.0, 99.62, 0.0, 56.63, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 80.04], ["speech synthesizer", 6.6], ["music", 3.05]], null, null, null, null, null, null, null, null, null, null, null], "duration": [2.21, 0.76, 1.34, 0.82, 2.25, 1.33, 1.45, 1.66, 9.33, 1.12, 4.96, 0.5, -0.29, 0.26, 6.07, 3.08, 0.75, 2.11, 0.22, 3.18, 0.58, 1.22]} \ No newline at end of file diff --git a/annotations_filtered/kZMKLwtkLrI_filtered.json b/annotations_filtered/kZMKLwtkLrI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f65047bd7a1044829a752b4645ed67cf3a696e64 --- /dev/null +++ b/annotations_filtered/kZMKLwtkLrI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 28.58], [31.0, 33.39], [37.0, 38.42], [41.0, 40.93], [41.0, 41.0], [41.0, 41.28], [41.0, 45.47], [47.0, 52.0], [56.0, 73.53], [74.0, 75.95], [78.0, 81.36], [82.0, 87.44], [95.0, 96.48], [99.0, 99.74], [106.0, 106.35], [107.0, 108.26], [109.0, 110.19], [111.0, 116.06], [116.0, 120.19], [122.0, 125.39], [126.0, 128.02], [131.0, 131.87], [132.0, 134.99], [139.0, 139.21], [140.0, 145.23], [148.0, 150.89], [154.0, 155.93]], "keep_status": [false, false, false, false, false, false, true, true, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 77.7, 0.0, 0.0, 0.0, 0.0, 32.61, 28.37, 31.38, 0.0, 32.69, 30.06, 0.0, 0.0, 0.0, 0.0, 0.0, 73.82, 58.81, 100.0, 99.92, 0.0, 61.87, 0.0, 74.76, 30.67, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 31.48], ["electric shaver, electric razor", 22.45], ["music", 6.13]], [["music", 18.46], ["speech", 16.44], ["livestock, farm animals, working animals", 14.4]], [["speech", 29.85], ["electric shaver, electric razor", 21.58], ["music", 8.82]], null, [["music", 54.19], ["cacophony", 4.39], ["hum", 3.91]], [["speech", 38.57], ["music", 14.12], ["hum", 11.02]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["baby cry, infant cry", 18.08], ["wail, moan", 14.77], ["whimper", 14.22]], null], "duration": [-0.42, 2.39, 1.42, -0.07, 0.0, 0.28, 4.47, 5.0, 17.53, 1.95, 3.36, 5.44, 1.48, 0.74, 0.35, 1.26, 1.19, 5.06, 4.19, 3.39, 2.02, 0.87, 2.99, 0.21, 5.23, 2.89, 1.93]} \ No newline at end of file diff --git a/annotations_filtered/kZQwVWTB2hI_filtered.json b/annotations_filtered/kZQwVWTB2hI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d1c4cc80ae3c9bcbdca164e7c740fa5ef7be6a2 --- /dev/null +++ b/annotations_filtered/kZQwVWTB2hI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 23.25], [30.0, 41.72], [46.0, 45.69], [46.0, 51.95], [54.0, 55.48], [57.0, 63.59], [65.0, 73.43], [75.0, 76.77], [79.0, 82.36], [84.0, 106.71], [108.0, 119.55], [142.0, 144.44]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [30.37, 30.44, 0.0, 30.81, 0.0, 30.36, 30.34, 0.0, 30.55, 30.27, 30.26, 30.07], "audiomae_on_audioset": [[["music", 71.89], ["musical instrument", 9.03], ["synthesizer", 2.6]], [["music", 68.76], ["musical instrument", 5.2], ["hum", 2.98]], null, [["music", 69.01], ["trombone", 4.95], ["musical instrument", 4.0]], null, [["music", 73.49], ["musical instrument", 5.37], ["didgeridoo", 2.49]], [["music", 64.23], ["musical instrument", 10.35], ["synthesizer", 2.1]], null, [["hum", 19.53], ["mains hum", 12.64], ["gong", 9.15]], [["speech", 18.52], ["vehicle", 11.53], ["music", 9.38]], [["music", 57.3], ["brass instrument", 8.79], ["trombone", 6.61]], [["brass instrument", 28.52], ["music", 25.28], ["trombone", 20.52]]], "duration": [13.25, 11.72, -0.31, 5.95, 1.48, 6.59, 8.43, 1.77, 3.36, 22.71, 11.55, 2.44]} \ No newline at end of file diff --git a/annotations_filtered/kZRq9scxIWM_filtered.json b/annotations_filtered/kZRq9scxIWM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..05d036e702ff0ebef5649fc0ae24f93b0528e920 --- /dev/null +++ b/annotations_filtered/kZRq9scxIWM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 14.93], [32.0, 33.67], [40.0, 40.53], [41.0, 41.25], [44.0, 44.73], [45.0, 46.3], [57.0, 58.83], [74.0, 74.01], [108.0, 109.22], [110.0, 110.76], [113.0, 113.0], [124.0, 124.83], [128.0, 128.75], [164.0, 164.61], [167.0, 167.51], [174.0, 175.71], [180.0, 182.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.07, 1.67, 0.53, 0.25, 0.73, 1.3, 1.83, 0.01, 1.22, 0.76, 0.0, 0.83, 0.75, 0.61, 0.51, 1.71, 2.75]} \ No newline at end of file diff --git a/annotations_filtered/kZcr7bw6k_k_filtered.json b/annotations_filtered/kZcr7bw6k_k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d86a09dfa3c735603059b0f572082a2cb57a126d --- /dev/null +++ b/annotations_filtered/kZcr7bw6k_k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.17], [19.0, 19.92], [21.0, 21.51], [22.0, 23.53], [25.0, 27.84], [30.0, 29.86], [34.0, 34.23], [36.0, 36.36], [41.0, 41.27], [42.0, 42.74], [44.0, 46.45], [48.0, 48.0], [49.0, 49.42], [54.0, 54.14], [57.0, 57.03], [61.0, 63.83], [66.0, 74.65], [75.0, 82.59], [87.0, 88.33], [89.0, 92.25], [100.0, 100.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 70.3, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 0.0, 0.0, 0.0, 56.03, 88.46, 87.37, 0.0, 94.95, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.17, 0.92, 0.51, 1.53, 2.84, -0.14, 0.23, 0.36, 0.27, 0.74, 2.45, 0.0, 0.42, 0.14, 0.03, 2.83, 8.65, 7.59, 1.33, 3.25, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/kZg0_oypRpU_filtered.json b/annotations_filtered/kZg0_oypRpU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddaefe35dcd25b67c13ca117f2c1e54464331273 --- /dev/null +++ b/annotations_filtered/kZg0_oypRpU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.09], [7.0, 6.88], [9.0, 8.85], [13.0, 13.68], [20.0, 20.7], [21.0, 22.27], [24.0, 23.79], [26.0, 27.35], [32.0, 31.85], [32.0, 35.23], [38.0, 39.07], [41.0, 41.18], [42.0, 42.36], [46.0, 46.74], [50.0, 50.33], [53.0, 53.86], [54.0, 54.53], [55.0, 54.92], [58.0, 58.08], [59.0, 59.95], [61.0, 61.15], [62.0, 63.05], [71.0, 73.11], [74.0, 74.41], [76.0, 76.38], [77.0, 78.53], [80.0, 83.07], [87.0, 87.44], [88.0, 89.09], [94.0, 94.53], [98.0, 98.15], [99.0, 100.89], [102.0, 102.84], [104.0, 104.23], [108.0, 108.7], [114.0, 114.45], [117.0, 119.21], [121.0, 124.58], [129.0, 133.68], [142.0, 142.62], [147.0, 148.85], [151.0, 152.25], [152.0, 154.77], [159.0, 161.01], [167.0, 168.99]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.54, 0.0, 0.0, 0.0, 33.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.89, 55.11, 40.48, 0.0, 0.0, 0.0, 97.33, 40.41, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["hammer", 22.37], ["speech", 18.2], ["tuning fork", 9.96]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 50.76], ["music", 11.47], ["groan", 6.02]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 60.05], ["music", 9.66], ["noise", 7.97]], null, null, null, null, [["beatboxing", 37.12], ["speech", 26.11], ["music", 8.98]], null], "duration": [1.09, -0.12, -0.15, 0.68, 0.7, 1.27, -0.21, 1.35, -0.15, 3.23, 1.07, 0.18, 0.36, 0.74, 0.33, 0.86, 0.53, -0.08, 0.08, 0.95, 0.15, 1.05, 2.11, 0.41, 0.38, 1.53, 3.07, 0.44, 1.09, 0.53, 0.15, 1.89, 0.84, 0.23, 0.7, 0.45, 2.21, 3.58, 4.68, 0.62, 1.85, 1.25, 2.77, 2.01, 1.99]} \ No newline at end of file diff --git a/annotations_filtered/kZgE_sUrXFY_filtered.json b/annotations_filtered/kZgE_sUrXFY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f7d0aba3f2417155c6c78fd68b7d34d186cbd55 --- /dev/null +++ b/annotations_filtered/kZgE_sUrXFY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.52], [7.0, 8.4], [10.0, 10.27], [11.0, 11.48], [13.0, 13.83], [14.0, 14.32], [15.0, 16.53], [18.0, 20.12], [22.0, 22.03], [23.0, 23.3], [25.0, 26.54], [31.0, 31.72], [32.0, 32.95], [33.0, 34.1], [34.0, 34.94], [36.0, 36.51], [37.0, 37.84], [39.0, 39.14], [42.0, 43.44], [44.0, 44.31], [44.0, 44.42], [45.0, 45.82], [48.0, 50.62], [53.0, 54.73], [56.0, 56.35], [57.0, 57.13], [58.0, 58.18], [59.0, 60.45], [62.0, 63.41], [68.0, 67.85], [75.0, 74.95], [78.0, 81.28], [83.0, 83.73], [99.0, 100.11], [101.0, 102.51], [103.0, 104.23], [105.0, 105.81], [119.0, 121.04], [126.0, 127.14], [134.0, 135.63], [136.0, 137.76], [139.0, 140.46], [142.0, 142.15], [144.0, 144.07], [148.0, 148.2], [153.0, 153.71], [154.0, 155.28], [157.0, 158.36], [159.0, 159.41], [161.0, 161.3], [162.0, 163.05], [165.0, 165.81]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.51, 0.0, 0.0, 0.0, 0.0, 0.0, 76.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["radio", 28.72], ["mains hum", 18.73], ["speech", 16.05]], null, null, null, null, null, null, [["hum", 16.26], ["sidetone", 9.55], ["didgeridoo", 9.54]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 43.22], ["speech", 27.27], ["fly, housefly", 4.68]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.52, 1.4, 0.27, 0.48, 0.83, 0.32, 1.53, 2.12, 0.03, 0.3, 1.54, 0.72, 0.95, 1.1, 0.94, 0.51, 0.84, 0.14, 1.44, 0.31, 0.42, 0.82, 2.62, 1.73, 0.35, 0.13, 0.18, 1.45, 1.41, -0.15, -0.05, 3.28, 0.73, 1.11, 1.51, 1.23, 0.81, 2.04, 1.14, 1.63, 1.76, 1.46, 0.15, 0.07, 0.2, 0.71, 1.28, 1.36, 0.41, 0.3, 1.05, 0.81]} \ No newline at end of file diff --git a/annotations_filtered/kZgaz49f5aE_filtered.json b/annotations_filtered/kZgaz49f5aE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..452baa522bc814f59183f2398f13b0afb05ab864 --- /dev/null +++ b/annotations_filtered/kZgaz49f5aE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 27.21], [33.0, 34.33], [44.0, 44.91], [47.0, 47.83], [49.0, 49.35], [51.0, 58.21], [61.0, 62.09], [64.0, 76.77], [77.0, 77.87], [80.0, 80.42], [82.0, 82.36], [83.0, 84.38], [87.0, 93.68], [98.0, 98.52], [117.0, 124.12], [124.0, 124.16], [125.0, 128.55], [130.0, 135.28], [136.0, 136.56], [141.0, 141.47], [145.0, 145.47], [147.0, 148.34], [153.0, 153.08], [157.0, 158.65]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.12, 0.0, 0.0, 0.0, 0.0, 28.57, 0.0, 28.79, 0.0, 0.0, 0.0, 0.0, 29.51, 0.0, 39.98, 0.0, 56.25, 63.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 45.21], ["speech", 24.04], ["didgeridoo", 15.02]], null, null, null, null, [["music", 60.51], ["electronic music", 5.51], ["didgeridoo", 5.18]], null, [["music", 48.22], ["throbbing", 8.11], ["electronic music", 7.59]], null, null, null, null, [["vehicle", 25.93], ["car", 21.02], ["throbbing", 10.87]], null, [["beatboxing", 45.46], ["speech", 35.07], ["music", 2.04]], null, null, null, null, null, null, null, null, null], "duration": [17.21, 1.33, 0.91, 0.83, 0.35, 7.21, 1.09, 12.77, 0.87, 0.42, 0.36, 1.38, 6.68, 0.52, 7.12, 0.16, 3.55, 5.28, 0.56, 0.47, 0.47, 1.34, 0.08, 1.65]} \ No newline at end of file diff --git a/annotations_filtered/kZz5k_xsG0Q_filtered.json b/annotations_filtered/kZz5k_xsG0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ccaa95c94fd2439df6f852111ca5eb3efa94696c --- /dev/null +++ b/annotations_filtered/kZz5k_xsG0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.73], [6.0, 10.22], [11.0, 12.11], [14.0, 13.96], [14.0, 15.23], [16.0, 45.69], [48.0, 48.12], [50.0, 55.12], [57.0, 57.94], [60.0, 66.14], [67.0, 68.42], [69.0, 80.74], [86.0, 91.67], [96.0, 104.67], [105.0, 106.79], [107.0, 107.96], [111.0, 112.72], [113.0, 114.72], [120.0, 120.72], [125.0, 125.15], [125.0, 126.01], [127.0, 128.38], [129.0, 130.33], [132.0, 133.02]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.65, 0.0, 0.0, 0.0, 28.58, 0.0, 36.15, 0.0, 33.19, 0.0, 33.25, 29.23, 29.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 19.72], ["throbbing", 13.41], ["music", 11.04]], null, null, null, [["speech", 48.77], ["buzz", 13.77], ["music", 9.21]], null, [["speech", 38.03], ["hum", 12.02], ["music", 11.92]], null, [["speech", 74.58], ["hum", 5.05], ["mains hum", 4.42]], null, [["hum", 49.07], ["mains hum", 26.03], ["throbbing", 11.99]], [["music", 27.48], ["throbbing", 22.89], ["hum", 15.73]], [["music", 24.04], ["speech", 20.11], ["sidetone", 5.97]], null, null, null, null, null, null, null, null, null, null], "duration": [1.73, 4.22, 1.11, -0.04, 1.23, 29.69, 0.12, 5.12, 0.94, 6.14, 1.42, 11.74, 5.67, 8.67, 1.79, 0.96, 1.72, 1.72, 0.72, 0.15, 1.01, 1.38, 1.33, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/k_pB_zV6kVw_filtered.json b/annotations_filtered/k_pB_zV6kVw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a580bec3bce1ac5ee14072781a4ff138cf2625ba --- /dev/null +++ b/annotations_filtered/k_pB_zV6kVw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.72], [5.0, 12.87], [15.0, 16.73], [20.0, 21.17], [22.0, 25.32], [28.0, 29.32], [31.0, 34.06], [37.0, 36.86], [39.0, 39.39], [42.0, 42.72], [44.0, 46.09], [48.0, 60.02], [64.0, 65.64], [69.0, 68.98], [72.0, 72.1], [73.0, 75.05], [77.0, 76.6], [79.0, 79.22], [82.0, 82.07], [84.0, 85.31], [87.0, 87.51], [89.0, 90.39], [92.0, 92.28], [94.0, 96.28], [98.0, 98.98], [100.0, 100.57], [102.0, 105.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 63.1, 0.0, 0.0, 62.27, 0.0, 78.38, 0.0, 0.0, 0.0, 86.27, 41.16, 0.0, 0.0, 0.0, 72.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.36, 0.0, 0.0, 91.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 23.17], ["electric shaver, electric razor", 10.89], ["mosquito", 7.3]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.72, 7.87, 1.73, 1.17, 3.32, 1.32, 3.06, -0.14, 0.39, 0.72, 2.09, 12.02, 1.64, -0.02, 0.1, 2.05, -0.4, 0.22, 0.07, 1.31, 0.51, 1.39, 0.28, 2.28, 0.98, 0.57, 3.26]} \ No newline at end of file diff --git a/annotations_filtered/k_uINM_XI6I_filtered.json b/annotations_filtered/k_uINM_XI6I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..03291e233be04268b8a0e1bebb2bd95fcbb3e8ed --- /dev/null +++ b/annotations_filtered/k_uINM_XI6I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.42], [6.0, 7.05], [7.0, 7.59], [9.0, 13.34], [16.0, 17.63], [24.0, 24.76], [27.0, 31.09], [33.0, 34.33], [36.0, 38.67], [39.0, 40.07], [42.0, 42.35], [46.0, 46.03], [48.0, 49.79], [51.0, 53.33], [54.0, 55.29], [57.0, 59.0], [63.0, 64.3], [66.0, 68.66], [71.0, 79.56], [84.0, 85.94], [88.0, 95.34], [97.0, 99.35], [104.0, 104.57], [105.0, 108.67], [110.0, 111.23], [112.0, 112.31], [114.0, 115.82], [118.0, 119.6], [121.0, 126.03]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.17, 0.0, 0.0, 30.31, 0.0, 30.57, 0.0, 0.0, 0.0, 0.0, 31.76, 0.0, 40.36, 0.0, 37.15, 29.94, 0.0, 31.88, 29.32, 0.0, 31.65, 0.0, 0.0, 0.0, 0.0, 29.59], "audiomae_on_audioset": [null, null, null, [["mains hum", 29.44], ["hum", 26.45], ["music", 13.38]], null, null, [["music", 31.75], ["mains hum", 16.02], ["hum", 11.13]], null, [["gong", 90.28], ["music", 3.55], ["reverberation", 1.99]], null, null, null, null, [["mains hum", 55.19], ["hum", 17.34], ["music", 8.4]], null, [["mains hum", 24.71], ["sidetone", 18.29], ["speech", 11.86]], null, [["music", 30.14], ["mains hum", 14.29], ["hum", 11.61]], [["music", 77.68], ["speech", 6.34], ["foghorn", 2.14]], null, [["theremin", 54.57], ["music", 25.29], ["musical instrument", 2.3]], [["music", 37.05], ["theremin", 36.61], ["ambient music", 4.48]], null, [["music", 34.56], ["theremin", 32.88], ["keyboard (musical)", 2.49]], null, null, null, null, [["theremin", 53.66], ["music", 26.25], ["musical instrument", 3.27]]], "duration": [0.42, 1.05, 0.59, 4.34, 1.63, 0.76, 4.09, 1.33, 2.67, 1.07, 0.35, 0.03, 1.79, 2.33, 1.29, 2.0, 1.3, 2.66, 8.56, 1.94, 7.34, 2.35, 0.57, 3.67, 1.23, 0.31, 1.82, 1.6, 5.03]} \ No newline at end of file diff --git a/annotations_filtered/kaJbWpMZdwM_filtered.json b/annotations_filtered/kaJbWpMZdwM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c0547d1c2657e30c3d9298ef4a594b65e7c7fc1d --- /dev/null +++ b/annotations_filtered/kaJbWpMZdwM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.21], [7.0, 7.2], [8.0, 9.85], [10.0, 16.5], [17.0, 63.44], [70.0, 83.84], [87.0, 123.28]], "keep_status": [true, false, false, true, false, false, false], "silence_prob": [47.43, 0.0, 0.0, 38.43, 0.0, 28.82, 0.0], "audiomae_on_audioset": [[["music", 13.27], ["hum", 13.02], ["mains hum", 9.72]], null, null, [["speech", 46.15], ["mains hum", 15.08], ["hum", 8.56]], null, [["speech", 52.71], ["music", 14.31], ["fireworks", 3.7]], null], "duration": [2.21, 0.2, 1.85, 6.5, 46.44, 13.84, 36.28]} \ No newline at end of file diff --git a/annotations_filtered/kaJv6L8vF-Y_filtered.json b/annotations_filtered/kaJv6L8vF-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1785ce0f2a0cdb1b717d1b1b67494e3ff475383 --- /dev/null +++ b/annotations_filtered/kaJv6L8vF-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.46], [11.0, 12.87], [15.0, 18.86], [24.0, 27.73], [32.0, 31.82], [32.0, 31.99], [32.0, 33.59], [35.0, 34.87], [39.0, 39.6], [40.0, 100.77], [101.0, 101.7], [104.0, 104.72], [110.0, 111.16], [115.0, 120.46], [122.0, 122.54], [126.0, 126.32]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 88.1, 47.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 43.6], ["brass instrument", 14.65], ["trombone", 8.4]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.46, 1.87, 3.86, 3.73, -0.18, -0.01, 1.59, -0.13, 0.6, 60.77, 0.7, 0.72, 1.16, 5.46, 0.54, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/kaQPejxLNRw_filtered.json b/annotations_filtered/kaQPejxLNRw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f28501b83f44f054e4f4fe67286907a9a6a0eadb --- /dev/null +++ b/annotations_filtered/kaQPejxLNRw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.0], [3.0, 27.82], [29.0, 29.88], [31.0, 30.81], [32.0, 33.52], [35.0, 36.32], [37.0, 37.72], [43.0, 44.17], [46.0, 46.75], [47.0, 50.65], [52.0, 54.18], [55.0, 64.4], [67.0, 69.3], [70.0, 71.36], [72.0, 72.25], [74.0, 74.68], [79.0, 80.16], [81.0, 81.62], [82.0, 83.2], [84.0, 85.16], [86.0, 89.9], [92.0, 92.82], [94.0, 104.25], [109.0, 120.28], [128.0, 129.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.53, 56.03, 49.22, 51.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.38, 0.0, 31.3, 31.92, 0.0], "audiomae_on_audioset": [null, [["music", 62.36], ["didgeridoo", 17.0], ["synthesizer", 2.7]], null, null, null, null, null, null, null, null, null, [["music", 68.54], ["musical instrument", 5.48], ["throbbing", 4.63]], null, null, null, null, null, null, null, null, [["music", 70.3], ["synthesizer", 7.16], ["musical instrument", 4.43]], null, [["music", 84.45], ["sampler", 3.63], ["musical instrument", 1.67]], [["music", 78.46], ["funk", 1.92], ["disco", 1.89]], null], "duration": [1.0, 24.82, 0.88, -0.19, 1.52, 1.32, 0.72, 1.17, 0.75, 3.65, 2.18, 9.4, 2.3, 1.36, 0.25, 0.68, 1.16, 0.62, 1.2, 1.16, 3.9, 0.82, 10.25, 11.28, 1.09]} \ No newline at end of file diff --git a/annotations_filtered/kaWU7XlPxV4_filtered.json b/annotations_filtered/kaWU7XlPxV4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad08ebcc5f985482a1a6088a504cea59a2c14fab --- /dev/null +++ b/annotations_filtered/kaWU7XlPxV4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 61.08], [61.0, 86.1], [87.0, 95.34], [101.0, 100.89], [101.0, 113.02], [116.0, 118.2], [119.0, 123.21], [124.0, 128.82], [131.0, 132.0], [135.0, 135.4]], "keep_status": [false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.18, 41.62, 0.0, 64.75, 98.44, 99.93, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 34.82], ["hum", 28.45], ["mains hum", 18.73]], [["music", 29.12], ["shatter", 12.35], ["breaking", 11.75]], null, null, null, null, null, null, null], "duration": [32.08, 25.1, 8.34, -0.11, 12.02, 2.2, 4.21, 4.82, 1.0, 0.4]} \ No newline at end of file diff --git a/annotations_filtered/kaXM8DMSm-g_filtered.json b/annotations_filtered/kaXM8DMSm-g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2baeed316a6ba710fab68eb8ec73f5031d54e71d --- /dev/null +++ b/annotations_filtered/kaXM8DMSm-g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.59], [20.0, 21.25], [23.0, 23.57], [26.0, 26.69], [35.0, 35.97], [37.0, 37.37], [38.0, 41.2], [44.0, 46.57], [61.0, 62.85], [64.0, 66.01], [70.0, 70.01], [82.0, 83.51], [85.0, 85.85], [88.0, 88.96], [104.0, 105.95], [108.0, 109.32], [112.0, 112.13], [114.0, 115.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.42, 96.77, 0.0, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.59, 1.25, 0.57, 0.69, 0.97, 0.37, 3.2, 2.57, 1.85, 2.01, 0.01, 1.51, 0.85, 0.96, 1.95, 1.32, 0.13, 1.84]} \ No newline at end of file diff --git a/annotations_filtered/kaZ87rTNkDA_filtered.json b/annotations_filtered/kaZ87rTNkDA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c15f72b59e60f04ea48795b933ba4d978c2f72db --- /dev/null +++ b/annotations_filtered/kaZ87rTNkDA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 37.4], [41.0, 41.12], [48.0, 48.12], [55.0, 55.17], [56.0, 56.51], [57.0, 57.38], [59.0, 60.78], [64.0, 64.45], [65.0, 64.89], [67.0, 68.15], [69.0, 68.88], [70.0, 70.5], [71.0, 71.19], [72.0, 72.5], [74.0, 74.49], [75.0, 78.24], [85.0, 86.31], [97.0, 99.87], [107.0, 108.09], [118.0, 118.98], [119.0, 119.5], [120.0, 120.26], [120.0, 121.2], [123.0, 125.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.55, 0.0, 43.35, 0.0, 0.0, 0.0, 0.0, 0.0, 34.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 30.49], ["moo", 27.31], ["livestock, farm animals, working animals", 18.63]], null, [["speech", 20.69], ["music", 9.77], ["cattle, bovinae", 8.08]], null, null, null, null, null, [["speech", 42.28], ["music", 9.33], ["hum", 6.79]]], "duration": [0.4, 0.12, 0.12, 0.17, 0.51, 0.38, 1.78, 0.45, -0.11, 1.15, -0.12, 0.5, 0.19, 0.5, 0.49, 3.24, 1.31, 2.87, 1.09, 0.98, 0.5, 0.26, 1.2, 2.19]} \ No newline at end of file diff --git a/annotations_filtered/kb4jEHmH_kU_filtered.json b/annotations_filtered/kb4jEHmH_kU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9464e04de5f139801d547fc394e1b9fb2ec98283 --- /dev/null +++ b/annotations_filtered/kb4jEHmH_kU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.67], [5.0, 7.3], [12.0, 15.5], [21.0, 22.96], [25.0, 31.87], [36.0, 41.61], [44.0, 54.51], [58.0, 59.46], [60.0, 63.59], [64.0, 66.39], [67.0, 69.6], [71.0, 72.18], [73.0, 75.02], [78.0, 79.57], [81.0, 82.22], [84.0, 85.21], [88.0, 90.05], [91.0, 95.25], [97.0, 100.53], [101.0, 103.1], [104.0, 107.0], [108.0, 136.05], [141.0, 142.2], [143.0, 144.0], [146.0, 147.19], [148.0, 149.61], [151.0, 152.19], [153.0, 154.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 90.43, 88.83, 0.0, 81.53, 48.19, 77.53, 0.0, 99.05, 94.22, 98.44, 0.0, 97.43, 0.0, 0.0, 0.0, 99.68, 99.56, 99.99, 90.78, 99.99, 83.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 64.65], ["musical instrument", 6.02], ["theremin", 4.21]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.67, 2.3, 3.5, 1.96, 6.87, 5.61, 10.51, 1.46, 3.59, 2.39, 2.6, 1.18, 2.02, 1.57, 1.22, 1.21, 2.05, 4.25, 3.53, 2.1, 3.0, 28.05, 1.2, 1.0, 1.19, 1.61, 1.19, 1.63]} \ No newline at end of file diff --git a/annotations_filtered/kb7T9oK0tF8_filtered.json b/annotations_filtered/kb7T9oK0tF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd39b72ca377f4d566acc0f9f6cb991979381bc2 --- /dev/null +++ b/annotations_filtered/kb7T9oK0tF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 31.35], [35.0, 95.12]], "keep_status": [false, false], "silence_prob": [36.61, 0.0], "audiomae_on_audioset": [[["music", 62.26], ["hum", 4.74], ["throbbing", 4.16]], null], "duration": [15.35, 60.12]} \ No newline at end of file diff --git a/annotations_filtered/kbGvnI1qIz8_filtered.json b/annotations_filtered/kbGvnI1qIz8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d85d315fb83c3a60a9bb5b3d57f41c6afce5d144 --- /dev/null +++ b/annotations_filtered/kbGvnI1qIz8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.47], [3.0, 3.75], [6.0, 7.06], [8.0, 8.33], [11.0, 11.64], [13.0, 13.29], [16.0, 18.23], [19.0, 20.29], [22.0, 22.33], [25.0, 25.27], [27.0, 27.28], [32.0, 32.66], [35.0, 35.67], [37.0, 38.03], [40.0, 40.34], [45.0, 45.18], [46.0, 46.89], [48.0, 48.32], [51.0, 51.61], [63.0, 64.0], [64.0, 64.74], [66.0, 66.61], [69.0, 68.86], [71.0, 71.41], [74.0, 74.17], [75.0, 76.87], [79.0, 81.31], [84.0, 84.37], [91.0, 93.6], [95.0, 95.47], [96.0, 96.9], [99.0, 99.59], [102.0, 103.05], [105.0, 105.34], [106.0, 107.18], [108.0, 111.2], [112.0, 113.12], [114.0, 122.07], [123.0, 123.63], [125.0, 126.81], [129.0, 129.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.38, 0.0, 44.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.85, 0.0, 74.92, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 58.63], ["radio", 12.8], ["noise", 5.35]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 0.75, 1.06, 0.33, 0.64, 0.29, 2.23, 1.29, 0.33, 0.27, 0.28, 0.66, 0.67, 1.03, 0.34, 0.18, 0.89, 0.32, 0.61, 1.0, 0.74, 0.61, -0.14, 0.41, 0.17, 1.87, 2.31, 0.37, 2.6, 0.47, 0.9, 0.59, 1.05, 0.34, 1.18, 3.2, 1.12, 8.07, 0.63, 1.81, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/kbVtjc-ygTM_filtered.json b/annotations_filtered/kbVtjc-ygTM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e44bd2a883cf8a6a655992ca378ab4602696724a --- /dev/null +++ b/annotations_filtered/kbVtjc-ygTM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.13], [8.0, 7.65], [12.0, 12.36], [15.0, 15.79], [32.0, 32.95], [34.0, 36.09], [37.0, 38.01], [50.0, 51.17], [55.0, 58.58], [60.0, 60.18], [66.0, 66.65], [70.0, 70.83], [73.0, 72.57], [77.0, 77.99], [85.0, 85.21], [97.0, 98.41], [100.0, 101.29], [102.0, 102.02], [103.0, 104.18], [113.0, 113.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 86.82, 0.0, 0.0, 90.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.13, -0.35, 0.36, 0.79, 0.95, 2.09, 1.01, 1.17, 3.58, 0.18, 0.65, 0.83, -0.43, 0.99, 0.21, 1.41, 1.29, 0.02, 1.18, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/kbb1MUQmusU_filtered.json b/annotations_filtered/kbb1MUQmusU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbe21a1be9cba0714761614041403f610e5755f7 --- /dev/null +++ b/annotations_filtered/kbb1MUQmusU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 17.29], [21.0, 25.15], [28.0, 31.4], [34.0, 58.26], [59.0, 78.19], [81.0, 82.49], [83.0, 84.21], [88.0, 88.91], [92.0, 92.69], [96.0, 98.78], [100.0, 103.87], [104.0, 107.86], [109.0, 109.86], [112.0, 113.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [85.72, 66.15, 85.72, 73.51, 51.94, 0.0, 0.0, 0.0, 0.0, 72.16, 45.3, 41.6, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 50.74], ["musical instrument", 4.15], ["synthesizer", 4.01]], [["music", 30.29], ["speech", 21.79], ["theremin", 7.42]], null, null], "duration": [2.29, 4.15, 3.4, 24.26, 19.19, 1.49, 1.21, 0.91, 0.69, 2.78, 3.87, 3.86, 0.86, 1.78]} \ No newline at end of file diff --git a/annotations_filtered/kbpdM9ORaI8_filtered.json b/annotations_filtered/kbpdM9ORaI8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..478be32f2a89df6ae48e30dd1d2a9da88116af9d --- /dev/null +++ b/annotations_filtered/kbpdM9ORaI8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 23.67], [25.0, 45.87], [47.0, 60.96], [62.0, 75.93]], "keep_status": [false, true, true, false], "silence_prob": [33.5, 31.53, 31.9, 30.35], "audiomae_on_audioset": [[["music", 78.52], ["speech", 3.7], ["musical instrument", 2.03]], [["music", 34.62], ["whack, thwack", 9.97], ["mosquito", 8.9]], [["music", 64.99], ["musical instrument", 2.47], ["whack, thwack", 2.32]], [["music", 57.23], ["synthesizer", 7.47], ["electronic music", 5.48]]], "duration": [11.67, 20.87, 13.96, 13.93]} \ No newline at end of file diff --git a/annotations_filtered/kcDEHkSgpuw_filtered.json b/annotations_filtered/kcDEHkSgpuw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf4117b0298c77a8d9ff7ffda688c0363cb814ff --- /dev/null +++ b/annotations_filtered/kcDEHkSgpuw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 14.07], [18.0, 19.74], [21.0, 21.73], [25.0, 46.75], [48.0, 49.76], [53.0, 57.6], [59.0, 58.95], [59.0, 67.76], [69.0, 69.28], [71.0, 71.91], [74.0, 75.14], [85.0, 85.04], [85.0, 89.07], [91.0, 93.78]], "keep_status": [true, false, false, false, false, true, false, true, false, false, false, false, true, false], "silence_prob": [30.0, 0.0, 0.0, 29.49, 0.0, 46.64, 0.0, 41.07, 0.0, 0.0, 0.0, 0.0, 30.86, 30.42], "audiomae_on_audioset": [[["mains hum", 24.35], ["hum", 23.66], ["sidetone", 16.49]], null, null, [["hum", 29.18], ["mains hum", 29.07], ["music", 19.83]], null, [["music", 31.79], ["hum", 18.65], ["mains hum", 7.1]], null, [["music", 24.9], ["hum", 22.56], ["mains hum", 10.28]], null, null, null, null, [["whip", 14.82], ["electric shaver, electric razor", 10.83], ["music", 9.78]], [["music", 59.59], ["musical instrument", 14.11], ["didgeridoo", 4.3]]], "duration": [13.07, 1.74, 0.73, 21.75, 1.76, 4.6, -0.05, 8.76, 0.28, 0.91, 1.14, 0.04, 4.07, 2.78]} \ No newline at end of file diff --git a/annotations_filtered/kcYN8phvjSY_filtered.json b/annotations_filtered/kcYN8phvjSY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74905a17ca322b13573ae9050bef295aa855deea --- /dev/null +++ b/annotations_filtered/kcYN8phvjSY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.57], [20.0, 21.34], [34.0, 39.53], [47.0, 100.36], [101.0, 102.2], [103.0, 113.61]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 63.42, 0.0, 0.0, 32.61], "audiomae_on_audioset": [null, null, null, null, null, [["music", 77.45], ["theremin", 9.63], ["effects unit", 1.16]]], "duration": [0.57, 1.34, 5.53, 53.36, 1.2, 10.61]} \ No newline at end of file diff --git a/annotations_filtered/kcrHhDoUS1k_filtered.json b/annotations_filtered/kcrHhDoUS1k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce5ca57329adb24780167781bf584447628ff360 --- /dev/null +++ b/annotations_filtered/kcrHhDoUS1k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 12.5], [17.0, 17.27], [19.0, 19.2], [24.0, 36.24], [37.0, 37.32], [39.0, 40.32], [46.0, 46.75], [50.0, 49.92], [52.0, 52.39], [64.0, 66.7], [70.0, 70.7], [75.0, 75.17], [76.0, 78.76], [82.0, 90.22], [94.0, 106.05], [106.0, 113.63], [116.0, 125.34], [127.0, 132.02], [138.0, 139.31], [140.0, 141.3], [143.0, 151.41], [152.0, 153.0], [153.0, 154.14], [160.0, 164.19], [165.0, 173.96]], "keep_status": [true, false, false, true, false, false, false, false, false, true, false, false, false, false, true, false, false, true, false, false, true, false, false, true, false], "silence_prob": [35.4, 0.0, 0.0, 28.8, 0.0, 0.0, 0.0, 0.0, 0.0, 32.15, 0.0, 0.0, 41.81, 34.64, 32.4, 33.91, 30.98, 29.3, 0.0, 0.0, 29.89, 0.0, 0.0, 33.56, 29.76], "audiomae_on_audioset": [[["music", 54.57], ["hum", 4.46], ["musical instrument", 3.39]], null, null, [["music", 23.42], ["cattle, bovinae", 17.76], ["livestock, farm animals, working animals", 12.74]], null, null, null, null, null, [["music", 48.75], ["theremin", 12.44], ["hum", 5.71]], null, null, [["throbbing", 46.85], ["hum", 24.3], ["music", 17.93]], [["throbbing", 51.63], ["hum", 19.73], ["music", 17.62]], [["music", 31.84], ["whack, thwack", 12.06], ["hum", 8.24]], [["hum", 41.16], ["mains hum", 17.27], ["throbbing", 13.5]], [["hum", 38.41], ["throbbing", 24.23], ["mains hum", 22.77]], [["breaking", 13.54], ["whack, thwack", 8.52], ["music", 6.02]], null, null, [["music", 25.38], ["didgeridoo", 10.24], ["livestock, farm animals, working animals", 5.98]], null, null, [["music", 40.89], ["whale vocalization", 13.92], ["throbbing", 5.92]], [["speech", 54.21], ["music", 14.46], ["fly, housefly", 8.31]]], "duration": [9.5, 0.27, 0.2, 12.24, 0.32, 1.32, 0.75, -0.08, 0.39, 2.7, 0.7, 0.17, 2.76, 8.22, 12.05, 7.63, 9.34, 5.02, 1.31, 1.3, 8.41, 1.0, 1.14, 4.19, 8.96]} \ No newline at end of file diff --git a/annotations_filtered/kd01w5eLVwo_filtered.json b/annotations_filtered/kd01w5eLVwo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..846b12ff166215eed7e5268d962b083229a71a3c --- /dev/null +++ b/annotations_filtered/kd01w5eLVwo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 97.68], [98.0, 102.05], [103.0, 104.85], [106.0, 107.2], [108.0, 112.28], [113.0, 114.78], [115.0, 117.36], [118.0, 122.81], [123.0, 125.24], [126.0, 129.1], [130.0, 133.08], [134.0, 137.2], [138.0, 142.67], [144.0, 148.34], [149.0, 151.33], [152.0, 153.77], [155.0, 158.08], [159.0, 167.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.95, 0.0, 0.0, 99.26, 0.0, 78.21, 99.05, 98.73, 99.87, 97.33, 97.43, 95.64, 99.56, 99.88, 0.0, 99.92, 94.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [70.68, 4.05, 1.85, 1.2, 4.28, 1.78, 2.36, 4.81, 2.24, 3.1, 3.08, 3.2, 4.67, 4.34, 2.33, 1.77, 3.08, 8.0]} \ No newline at end of file diff --git a/annotations_filtered/kdDH7Ynw5Lc_filtered.json b/annotations_filtered/kdDH7Ynw5Lc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/kdDH7Ynw5Lc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/kdTfLDIbwow_filtered.json b/annotations_filtered/kdTfLDIbwow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1eeb9ed2f48e6f7f2cb703d7e2606e12b194f14 --- /dev/null +++ b/annotations_filtered/kdTfLDIbwow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.63], [23.0, 23.6], [44.0, 44.22], [45.0, 46.84], [51.0, 52.54], [55.0, 57.92], [61.0, 64.69], [66.0, 66.51], [105.0, 106.19], [118.0, 119.79]], "keep_status": [false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 42.46, 34.46, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 51.49], ["hum", 7.81], ["rumble", 5.08]], [["fly, housefly", 19.89], ["speech", 13.17], ["insect", 11.23]], null, null, null], "duration": [0.63, 0.6, 0.22, 1.84, 1.54, 2.92, 3.69, 0.51, 1.19, 1.79]} \ No newline at end of file diff --git a/annotations_filtered/kdW1wdpEP4Y_filtered.json b/annotations_filtered/kdW1wdpEP4Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0d3854c4669efea84dea0b6385fd87a82fcc5c9 --- /dev/null +++ b/annotations_filtered/kdW1wdpEP4Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.41], [17.0, 19.2], [20.0, 20.95], [27.0, 27.28], [28.0, 28.85]], "keep_status": [true, false, false, false, false], "silence_prob": [33.67, 60.51, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 33.49], ["didgeridoo", 9.9], ["cattle, bovinae", 7.61]], null, null, null, null], "duration": [5.41, 2.2, 0.95, 0.28, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/kdbGqJtHWQg_filtered.json b/annotations_filtered/kdbGqJtHWQg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c127b6d039bf6b5f5ac8feaad9f2dc32ca4d8e86 --- /dev/null +++ b/annotations_filtered/kdbGqJtHWQg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 93.68], [98.0, 99.47], [100.0, 100.36], [101.0, 102.22], [103.0, 104.72]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [83.68, 1.47, 0.36, 1.22, 1.72]} \ No newline at end of file diff --git a/annotations_filtered/kdbRwpxZHJY_filtered.json b/annotations_filtered/kdbRwpxZHJY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e89f00d8346f5731ae19cc5053c5be8b4b97ff2 --- /dev/null +++ b/annotations_filtered/kdbRwpxZHJY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.69], [17.0, 17.56], [31.0, 32.1], [44.0, 44.34], [73.0, 72.91]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.69, 0.56, 1.1, 0.34, -0.09]} \ No newline at end of file diff --git a/annotations_filtered/kdkVnZsOgJA_filtered.json b/annotations_filtered/kdkVnZsOgJA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40818de37ee1fe8ed8ccac3412bdfdd19ce2a4f9 --- /dev/null +++ b/annotations_filtered/kdkVnZsOgJA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.31], [9.0, 10.4], [11.0, 11.53], [15.0, 15.23], [16.0, 16.5], [17.0, 17.31], [18.0, 18.67], [22.0, 21.83], [34.0, 34.96], [40.0, 40.61], [42.0, 43.09], [44.0, 44.64], [47.0, 46.8], [48.0, 48.91], [50.0, 51.39], [54.0, 54.36], [59.0, 58.9], [60.0, 59.73], [62.0, 63.05], [64.0, 64.59], [67.0, 68.4], [74.0, 77.5], [79.0, 79.71], [83.0, 83.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.31, 1.4, 0.53, 0.23, 0.5, 0.31, 0.67, -0.17, 0.96, 0.61, 1.09, 0.64, -0.2, 0.91, 1.39, 0.36, -0.1, -0.27, 1.05, 0.59, 1.4, 3.5, 0.71, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/kdrPUm5zBqA_filtered.json b/annotations_filtered/kdrPUm5zBqA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84852f4aeb7d3237cf26f75d9a551e8af3807a77 --- /dev/null +++ b/annotations_filtered/kdrPUm5zBqA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.1], [11.0, 11.53], [18.0, 18.52], [49.0, 51.16], [54.0, 56.56], [62.0, 65.16], [68.0, 71.76], [75.0, 80.86], [81.0, 82.27], [89.0, 89.78], [92.0, 92.53], [93.0, 93.95], [106.0, 108.97], [113.0, 125.81], [134.0, 134.45], [137.0, 138.77], [139.0, 139.56], [146.0, 146.18], [150.0, 151.21], [151.0, 159.75]], "keep_status": [false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.92, 36.66, 39.82, 37.75, 35.77, 0.0, 0.0, 0.0, 0.0, 33.39, 34.63, 0.0, 0.0, 0.0, 0.0, 0.0, 36.18], "audiomae_on_audioset": [null, null, null, [["speech", 30.5], ["music", 22.85], ["didgeridoo", 7.93]], [["music", 60.27], ["electronic music", 5.68], ["grunt", 3.88]], [["music", 52.89], ["throbbing", 18.92], ["synthesizer", 6.98]], [["music", 47.14], ["speech", 10.46], ["didgeridoo", 8.91]], [["music", 58.9], ["throbbing", 12.44], ["speech", 8.63]], null, null, null, null, [["fart", 76.89], ["music", 16.16], ["fly, housefly", 0.78]], [["music", 82.33], ["electronic music", 1.7], ["synthesizer", 1.34]], null, null, null, null, null, [["music", 70.88], ["electronic music", 4.01], ["didgeridoo", 2.85]]], "duration": [1.1, 0.53, 0.52, 2.16, 2.56, 3.16, 3.76, 5.86, 1.27, 0.78, 0.53, 0.95, 2.97, 12.81, 0.45, 1.77, 0.56, 0.18, 1.21, 8.75]} \ No newline at end of file diff --git a/annotations_filtered/kearXmroxUM_filtered.json b/annotations_filtered/kearXmroxUM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4fb34eda9c620894f27b368bf9ad91362640e97 --- /dev/null +++ b/annotations_filtered/kearXmroxUM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.31], [18.0, 27.51], [29.0, 30.87], [32.0, 32.66], [34.0, 35.7], [36.0, 36.64], [37.0, 39.95], [42.0, 48.88], [49.0, 50.35], [51.0, 51.51], [52.0, 54.06], [56.0, 59.12], [60.0, 64.35], [66.0, 68.42], [70.0, 73.72], [75.0, 83.08], [84.0, 84.42], [85.0, 87.0], [89.0, 90.48], [91.0, 92.25], [97.0, 97.56], [98.0, 99.13], [100.0, 100.53], [102.0, 102.14], [105.0, 106.32], [108.0, 108.6], [110.0, 112.11], [113.0, 113.75], [114.0, 114.86], [116.0, 117.69], [118.0, 118.81], [123.0, 122.88], [125.0, 126.66], [128.0, 128.78], [134.0, 134.1]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.12, 0.0, 0.0, 0.0, 0.0, 56.33, 61.97, 0.0, 0.0, 42.55, 36.3, 57.72, 61.37, 88.28, 62.78, 0.0, 39.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["noise", 10.24], ["telephone", 8.53], ["radio", 7.54]], null, null, null, null, null, null, null, null, [["speech", 37.6], ["sidetone", 8.4], ["radio", 7.99]], [["speech", 29.37], ["chirp tone", 25.88], ["burping, eructation", 8.41]], null, null, null, null, null, [["speech", 21.91], ["telephone dialing, dtmf", 6.37], ["music", 5.27]], null, null, null, null, null, null, null, null, [["speech", 23.25], ["dial tone", 17.98], ["busy signal", 15.56]], null, null, null, null, null, null, null, null], "duration": [1.31, 9.51, 1.87, 0.66, 1.7, 0.64, 2.95, 6.88, 1.35, 0.51, 2.06, 3.12, 4.35, 2.42, 3.72, 8.08, 0.42, 2.0, 1.48, 1.25, 0.56, 1.13, 0.53, 0.14, 1.32, 0.6, 2.11, 0.75, 0.86, 1.69, 0.81, -0.12, 1.66, 0.78, 0.1]} \ No newline at end of file diff --git a/annotations_filtered/kevJJDQloNE_filtered.json b/annotations_filtered/kevJJDQloNE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f972268705b2f9e15b2ba85254af46e3d59e3fae --- /dev/null +++ b/annotations_filtered/kevJJDQloNE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 13.93], [20.0, 22.0], [25.0, 77.46], [82.0, 85.62]], "keep_status": [false, false, false, false], "silence_prob": [31.08, 30.34, 0.0, 30.44], "audiomae_on_audioset": [[["music", 80.83], ["disco", 3.47], ["synthesizer", 2.05]], [["music", 69.23], ["house music", 4.88], ["electronic music", 2.14]], null, [["music", 71.98], ["disco", 4.47], ["house music", 2.47]]], "duration": [12.93, 2.0, 52.46, 3.62]} \ No newline at end of file diff --git a/annotations_filtered/kf8NklFXAd4_filtered.json b/annotations_filtered/kf8NklFXAd4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04ac69b2b7e11766d0c113c94964a6d325bd68b6 --- /dev/null +++ b/annotations_filtered/kf8NklFXAd4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.56], [3.0, 3.74], [6.0, 6.83], [8.0, 9.32], [20.0, 20.61], [23.0, 28.58], [30.0, 34.03], [38.0, 61.05], [62.0, 63.44], [64.0, 72.74], [75.0, 113.88]], "keep_status": [false, false, false, false, false, true, true, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 33.4, 33.26, 31.65, 0.0, 31.09, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 32.45], ["radio", 6.0], ["music", 5.36]], [["speech", 54.88], ["vehicle", 3.17], ["hum", 2.84]], [["music", 30.18], ["speech", 20.07], ["radio", 4.84]], null, [["speech", 29.0], ["vehicle", 13.12], ["car", 7.86]], null], "duration": [1.56, 0.74, 0.83, 1.32, 0.61, 5.58, 4.03, 23.05, 1.44, 8.74, 38.88]} \ No newline at end of file diff --git a/annotations_filtered/kfdeG-hRX7A_filtered.json b/annotations_filtered/kfdeG-hRX7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9ab5868578811130dd3e79a6f4a27b080c47759 --- /dev/null +++ b/annotations_filtered/kfdeG-hRX7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.02], [10.0, 10.83], [11.0, 11.79], [13.0, 14.45], [27.0, 26.69], [29.0, 29.29], [30.0, 30.5], [32.0, 32.97], [34.0, 37.0], [37.0, 39.02], [44.0, 46.47], [47.0, 47.63], [49.0, 49.1], [50.0, 50.45], [51.0, 54.92], [58.0, 58.26], [59.0, 60.79], [67.0, 69.9], [71.0, 72.15], [73.0, 89.94], [97.0, 106.03], [107.0, 108.94], [116.0, 117.8], [118.0, 119.1], [120.0, 120.39], [131.0, 139.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.84, 50.71, 83.7, 0.0, 0.0, 0.0, 34.86, 0.0, 0.0, 29.65, 0.0, 32.77, 32.29, 0.0, 0.0, 0.0, 0.0, 30.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["throbbing", 31.78], ["hum", 25.41], ["music", 13.98]], null, null, [["music", 52.86], ["speech", 14.29], ["synthesizer", 9.4]], null, [["music", 69.73], ["musical instrument", 6.68], ["effects unit", 5.37]], [["music", 81.91], ["boing", 2.44], ["rock and roll", 1.91]], null, null, null, null, [["hum", 36.83], ["throbbing", 31.31], ["music", 14.75]]], "duration": [0.02, 0.83, 0.79, 1.45, -0.31, 0.29, 0.5, 0.97, 3.0, 2.02, 2.47, 0.63, 0.1, 0.45, 3.92, 0.26, 1.79, 2.9, 1.15, 16.94, 9.03, 1.94, 1.8, 1.1, 0.39, 8.72]} \ No newline at end of file diff --git a/annotations_filtered/kflvHGnIkoA_filtered.json b/annotations_filtered/kflvHGnIkoA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebde837af0ceda41e5d29250ef1be68bde437ab2 --- /dev/null +++ b/annotations_filtered/kflvHGnIkoA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.77], [15.0, 17.83], [41.0, 41.74], [51.0, 52.49], [63.0, 63.22], [65.0, 65.5], [75.0, 75.34], [79.0, 84.1], [85.0, 86.71], [91.0, 92.74], [93.0, 94.74], [95.0, 94.78]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 30.73, 0.0, 0.0, 0.0, 0.0, 0.0, 30.74, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 24.21], ["speech", 17.41], ["hum", 16.41]], null, null, null, null, null, [["music", 46.56], ["theremin", 14.5], ["musical instrument", 3.78]], null, null, null, null], "duration": [0.77, 2.83, 0.74, 1.49, 0.22, 0.5, 0.34, 5.1, 1.71, 1.74, 1.74, -0.22]} \ No newline at end of file diff --git a/annotations_filtered/kg2o35acq4c_filtered.json b/annotations_filtered/kg2o35acq4c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27772631567c93481d7f8b360dd9df3d2bb35e52 --- /dev/null +++ b/annotations_filtered/kg2o35acq4c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.53], [11.0, 13.51], [15.0, 15.97], [18.0, 20.22], [21.0, 25.14], [30.0, 30.47], [36.0, 38.1], [40.0, 40.73], [42.0, 43.98], [45.0, 46.28], [51.0, 50.75], [53.0, 55.81], [58.0, 70.23], [71.0, 71.12], [73.0, 74.83], [78.0, 80.13], [83.0, 85.78], [88.0, 88.86], [89.0, 90.49], [92.0, 94.85], [98.0, 98.15], [103.0, 104.19], [106.0, 106.1], [110.0, 112.38], [114.0, 114.59], [115.0, 115.57], [119.0, 120.72], [122.0, 131.67], [140.0, 141.1], [141.0, 142.77], [150.0, 150.36], [151.0, 151.11], [153.0, 152.88], [155.0, 155.06], [158.0, 157.76], [160.0, 159.81], [160.0, 161.7], [163.0, 163.32], [164.0, 164.34], [165.0, 165.86], [167.0, 167.71], [174.0, 175.07], [176.0, 176.71], [177.0, 178.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 66.03, 0.0, 69.07, 47.98, 0.0, 78.21, 0.0, 0.0, 0.0, 0.0, 53.22, 68.02, 0.0, 0.0, 50.26, 57.97, 0.0, 0.0, 43.87, 0.0, 0.0, 0.0, 83.16, 0.0, 0.0, 0.0, 35.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 71.13], ["hum", 7.24], ["rumble", 2.97]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.56], ["music", 12.17], ["gong", 10.63]], null, null, null, null, null, null, null, [["whale vocalization", 43.73], ["noise", 16.35], ["animal", 4.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 2.51, 0.97, 2.22, 4.14, 0.47, 2.1, 0.73, 1.98, 1.28, -0.25, 2.81, 12.23, 0.12, 1.83, 2.13, 2.78, 0.86, 1.49, 2.85, 0.15, 1.19, 0.1, 2.38, 0.59, 0.57, 1.72, 9.67, 1.1, 1.77, 0.36, 0.11, -0.12, 0.06, -0.24, -0.19, 1.7, 0.32, 0.34, 0.86, 0.71, 1.07, 0.71, 1.55]} \ No newline at end of file diff --git a/annotations_filtered/kg3erAXOz34_filtered.json b/annotations_filtered/kg3erAXOz34_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9c663706f98f58d0ccb5d7592b430166716d8a6 --- /dev/null +++ b/annotations_filtered/kg3erAXOz34_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.23], [14.0, 14.49], [19.0, 19.6], [32.0, 33.66], [41.0, 40.76], [41.0, 44.09], [49.0, 51.34], [61.0, 61.35], [63.0, 63.73], [64.0, 64.03], [67.0, 67.88], [72.0, 72.77], [74.0, 74.39], [74.0, 74.87], [78.0, 79.3], [88.0, 96.92], [103.0, 103.6], [106.0, 106.59], [108.0, 108.3], [109.0, 110.57], [113.0, 113.27], [114.0, 115.52], [117.0, 118.2], [124.0, 124.16], [126.0, 127.75], [139.0, 139.43], [140.0, 142.87], [149.0, 149.12], [151.0, 150.79], [152.0, 152.93], [155.0, 155.24], [157.0, 158.04], [159.0, 160.51], [161.0, 164.66], [165.0, 168.05]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.12, 29.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.87, 32.94], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 31.99], ["music", 26.49], ["hum", 6.42]], [["music", 33.41], ["speech", 12.31], ["cattle, bovinae", 10.94]], null, null, null, null, null, null, null, null, [["boing", 66.74], ["music", 26.36], ["speech", 4.43]], null, null, null, null, null, null, null, null, null, null, [["music", 41.2], ["speech", 33.44], ["boing", 16.41]], null, null, null, null, null, null, [["music", 23.53], ["bleat", 20.84], ["sheep", 17.24]], [["speech", 58.24], ["electric shaver, electric razor", 18.36], ["music", 4.6]]], "duration": [0.23, 0.49, 0.6, 1.66, -0.24, 3.09, 2.34, 0.35, 0.73, 0.03, 0.88, 0.77, 0.39, 0.87, 1.3, 8.92, 0.6, 0.59, 0.3, 1.57, 0.27, 1.52, 1.2, 0.16, 1.75, 0.43, 2.87, 0.12, -0.21, 0.93, 0.24, 1.04, 1.51, 3.66, 3.05]} \ No newline at end of file diff --git a/annotations_filtered/kg7goEASO5E_filtered.json b/annotations_filtered/kg7goEASO5E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..454a6f90d17d28834b8d752eef6227ca9fb7fd42 --- /dev/null +++ b/annotations_filtered/kg7goEASO5E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.42], [8.0, 9.21], [10.0, 11.08], [12.0, 13.24], [16.0, 23.6], [24.0, 25.0], [27.0, 48.46], [49.0, 59.95], [64.0, 65.77], [68.0, 68.13], [69.0, 69.03], [72.0, 72.42], [73.0, 73.58], [77.0, 77.68], [79.0, 80.37], [83.0, 83.49], [85.0, 86.66], [90.0, 89.99], [93.0, 95.01], [97.0, 98.37], [99.0, 112.95]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.38, 0.0, 33.46, 31.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.03, 0.0, 35.31], "audiomae_on_audioset": [null, null, null, null, [["vehicle", 33.05], ["car", 13.45], ["race car, auto racing", 6.78]], null, [["music", 66.66], ["speech", 7.34], ["vehicle", 6.62]], [["speech", 46.34], ["vehicle", 14.76], ["music", 6.57]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.84], ["speech", 12.57], ["musical instrument", 8.98]]], "duration": [0.42, 1.21, 1.08, 1.24, 7.6, 1.0, 21.46, 10.95, 1.77, 0.13, 0.03, 0.42, 0.58, 0.68, 1.37, 0.49, 1.66, -0.01, 2.01, 1.37, 13.95]} \ No newline at end of file diff --git a/annotations_filtered/kgNMy-k2VnA_filtered.json b/annotations_filtered/kgNMy-k2VnA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..163c59969f537fb19a77b6187829c58a6932bbd7 --- /dev/null +++ b/annotations_filtered/kgNMy-k2VnA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.06], [8.0, 8.33], [10.0, 11.42], [12.0, 13.74], [14.0, 14.32], [15.0, 15.9], [16.0, 17.76], [20.0, 20.68], [22.0, 22.25], [25.0, 24.83], [26.0, 28.39], [30.0, 30.45], [31.0, 33.62], [34.0, 35.82], [36.0, 39.51], [40.0, 41.94], [45.0, 46.58], [48.0, 48.83], [49.0, 49.94], [51.0, 53.45], [54.0, 57.21], [59.0, 59.97], [65.0, 66.83], [68.0, 70.33], [72.0, 75.12], [81.0, 107.76], [108.0, 111.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 57.97, 0.0, 96.77, 0.0, 0.0, 0.0, 0.0, 99.78, 99.96, 0.0, 0.0, 100.0, 100.0, 78.55, 89.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.06, 0.33, 1.42, 1.74, 0.32, 0.9, 1.76, 0.68, 0.25, -0.17, 2.39, 0.45, 2.62, 1.82, 3.51, 1.94, 1.58, 0.83, 0.94, 2.45, 3.21, 0.97, 1.83, 2.33, 3.12, 26.76, 3.03]} \ No newline at end of file diff --git a/annotations_filtered/kgRlzeYc1nk_filtered.json b/annotations_filtered/kgRlzeYc1nk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..155a8e22cf3bcea9d105c928a6ab9d9b24babf0a --- /dev/null +++ b/annotations_filtered/kgRlzeYc1nk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[111.0, 127.23], [130.0, 130.28]], "keep_status": [false, false], "silence_prob": [77.7, 0.0], "audiomae_on_audioset": [null, null], "duration": [16.23, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/kgSDN6_VyR0_filtered.json b/annotations_filtered/kgSDN6_VyR0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62a4d9a7ead5ae7b1163d7d99d6a76a955ded298 --- /dev/null +++ b/annotations_filtered/kgSDN6_VyR0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.97], [18.0, 18.32], [20.0, 26.4], [26.0, 28.59], [30.0, 31.33], [39.0, 47.65], [49.0, 52.39], [53.0, 54.48], [56.0, 56.35], [57.0, 61.65], [62.0, 61.69], [64.0, 64.07], [67.0, 67.39], [68.0, 79.66], [81.0, 86.43], [87.0, 88.28], [97.0, 97.02], [98.0, 102.76], [103.0, 104.28], [106.0, 122.17], [123.0, 123.21]], "keep_status": [false, false, true, true, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false], "silence_prob": [73.51, 0.0, 41.5, 37.5, 0.0, 42.98, 55.39, 0.0, 0.0, 43.25, 0.0, 0.0, 0.0, 38.28, 33.96, 0.0, 0.0, 68.54, 0.0, 37.57, 0.0], "audiomae_on_audioset": [null, null, [["livestock, farm animals, working animals", 36.52], ["cattle, bovinae", 23.48], ["moo", 8.21]], [["livestock, farm animals, working animals", 45.04], ["music", 7.0], ["cattle, bovinae", 6.69]], null, [["whale vocalization", 52.12], ["fly, housefly", 11.82], ["mosquito", 4.83]], null, null, null, [["speech", 82.02], ["effects unit", 1.92], ["radio", 1.67]], null, null, null, [["livestock, farm animals, working animals", 33.14], ["cattle, bovinae", 31.54], ["moo", 31.48]], [["speech", 10.9], ["music", 9.58], ["crowd", 5.72]], null, null, null, null, [["liquid", 25.37], ["water", 15.36], ["glass", 15.26]], null], "duration": [3.97, 0.32, 6.4, 2.59, 1.33, 8.65, 3.39, 1.48, 0.35, 4.65, -0.31, 0.07, 0.39, 11.66, 5.43, 1.28, 0.02, 4.76, 1.28, 16.17, 0.21]} \ No newline at end of file diff --git a/annotations_filtered/kgdr5vmYZLw_filtered.json b/annotations_filtered/kgdr5vmYZLw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..450ef79263950590eeabbcaae585a565b505359e --- /dev/null +++ b/annotations_filtered/kgdr5vmYZLw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.75], [10.0, 14.84], [21.0, 42.99], [45.0, 45.0], [47.0, 48.46], [53.0, 53.4], [56.0, 57.81], [64.0, 65.2], [73.0, 73.79], [76.0, 77.52], [79.0, 81.43], [83.0, 83.62], [87.0, 89.01], [98.0, 100.5], [108.0, 111.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 81.0, 96.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 88.46, 83.34, 84.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.75, 4.84, 21.99, 0.0, 1.46, 0.4, 1.81, 1.2, 0.79, 1.52, 2.43, 0.62, 2.01, 2.5, 3.21]} \ No newline at end of file diff --git a/annotations_filtered/kgfgiLlW-yw_filtered.json b/annotations_filtered/kgfgiLlW-yw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cad183e7fe8b888210b7f09e188ca61e8dab9163 --- /dev/null +++ b/annotations_filtered/kgfgiLlW-yw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.87], [6.0, 5.86], [6.0, 6.0], [6.0, 6.44], [7.0, 6.67], [8.0, 8.23], [9.0, 10.08], [13.0, 14.99], [15.0, 17.29], [18.0, 19.25], [21.0, 28.07], [30.0, 31.06], [36.0, 37.5], [38.0, 61.4], [64.0, 64.66], [66.0, 68.47], [69.0, 69.28], [70.0, 81.23], [83.0, 84.27], [89.0, 90.12], [91.0, 91.2], [92.0, 92.48], [95.0, 96.15], [99.0, 100.03], [101.0, 103.23], [104.0, 104.41], [106.0, 105.7], [106.0, 106.59], [108.0, 108.6], [110.0, 110.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.35, 0.0, 45.27, 0.0, 0.0, 37.52, 0.0, 84.43, 0.0, 53.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.43, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["animal", 39.54], ["dog", 25.08], ["domestic animals, pets", 16.42]], null, [["speech", 15.28], ["eruption", 14.94], ["clip-clop", 10.85]], null, null, [["speech", 45.33], ["radio", 25.72], ["sidetone", 3.65]], null, null, null, null, null, null, null, null, null, null, [["speech", 50.41], ["music", 7.53], ["civil defense siren", 3.71]], null, null, null, null, null], "duration": [1.87, -0.14, 0.0, 0.44, -0.33, 0.23, 1.08, 1.99, 2.29, 1.25, 7.07, 1.06, 1.5, 23.4, 0.66, 2.47, 0.28, 11.23, 1.27, 1.12, 0.2, 0.48, 1.15, 1.03, 2.23, 0.41, -0.3, 0.59, 0.6, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/kghbSGoV1kE_filtered.json b/annotations_filtered/kghbSGoV1kE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abc539d941017d6f1677cc437b3de8ea983dcf7b --- /dev/null +++ b/annotations_filtered/kghbSGoV1kE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.37], [7.0, 8.55], [11.0, 11.13], [12.0, 12.97], [14.0, 15.15], [18.0, 18.59], [23.0, 24.09], [35.0, 39.53], [45.0, 47.21], [55.0, 84.94], [87.0, 88.2], [89.0, 92.92], [97.0, 100.7], [103.0, 105.98], [107.0, 107.57], [110.0, 110.2], [112.0, 112.46]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.3, 32.78, 30.31, 0.0, 45.43, 50.36, 44.29, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 43.49], ["moo", 6.9], ["livestock, farm animals, working animals", 6.76]], [["speech", 79.18], ["field recording", 1.56], ["male speech, man speaking", 1.44]], [["speech", 41.51], ["music", 5.68], ["buzz", 3.64]], null, [["sidetone", 55.54], ["speech", 23.55], ["music", 8.92]], null, [["music", 39.38], ["speech", 21.83], ["theremin", 3.16]], null, null, null], "duration": [1.37, 1.55, 0.13, 0.97, 1.15, 0.59, 1.09, 4.53, 2.21, 29.94, 1.2, 3.92, 3.7, 2.98, 0.57, 0.2, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/kglWIEtKSXY_filtered.json b/annotations_filtered/kglWIEtKSXY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..661ed6f8b54ee7cd078b92ac1d21868d273d2d16 --- /dev/null +++ b/annotations_filtered/kglWIEtKSXY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 52.52], [56.0, 73.04], [75.0, 80.92], [81.0, 92.25], [93.0, 112.21]], "keep_status": [false, false, true, true, false], "silence_prob": [58.22, 48.91, 38.74, 41.56, 47.74], "audiomae_on_audioset": [null, [["music", 57.47], ["synthesizer", 8.78], ["gong", 6.4]], [["hum", 25.36], ["music", 23.78], ["mains hum", 20.81]], [["music", 45.71], ["synthesizer", 18.02], ["domestic animals, pets", 5.49]], [["music", 57.1], ["hum", 12.39], ["mains hum", 5.93]]], "duration": [4.52, 17.04, 5.92, 11.25, 19.21]} \ No newline at end of file diff --git a/annotations_filtered/kgu59EAXbic_filtered.json b/annotations_filtered/kgu59EAXbic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa6052e71e815b1fb72ccac0f1184c74e1b777ca --- /dev/null +++ b/annotations_filtered/kgu59EAXbic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 28.63], [30.0, 29.84], [33.0, 33.12], [35.0, 35.82], [38.0, 38.11], [40.0, 40.04], [53.0, 54.97], [56.0, 69.63], [70.0, 71.15], [72.0, 72.91], [78.0, 86.83], [87.0, 92.85], [95.0, 105.33], [106.0, 106.39], [107.0, 106.93], [107.0, 111.57], [112.0, 111.64], [112.0, 115.86], [119.0, 124.14], [125.0, 137.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [29.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.47, 0.0, 0.0, 53.78, 41.98, 51.77, 0.0, 0.0, 47.08, 0.0, 71.57, 65.09, 29.63], "audiomae_on_audioset": [[["speech", 55.82], ["explosion", 18.69], ["burst, pop", 5.28]], null, null, null, null, null, null, [["machine gun", 71.84], ["gunshot, gunfire", 19.9], ["fusillade", 1.2]], null, null, null, [["speech", 54.21], ["music", 8.9], ["hum", 7.22]], null, null, null, [["music", 30.32], ["speech", 29.87], ["electronic music", 3.51]], null, null, null, [["music", 11.35], ["buzz", 10.28], ["fart", 7.79]]], "duration": [10.63, -0.16, 0.12, 0.82, 0.11, 0.04, 1.97, 13.63, 1.15, 0.91, 8.83, 5.85, 10.33, 0.39, -0.07, 4.57, -0.36, 3.86, 5.14, 12.79]} \ No newline at end of file diff --git a/annotations_filtered/kgwjR-pQ29o_filtered.json b/annotations_filtered/kgwjR-pQ29o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..532c89c29beeeba1707ba53f923e58ce1fb3ee40 --- /dev/null +++ b/annotations_filtered/kgwjR-pQ29o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.5], [8.0, 8.92], [10.0, 10.81], [15.0, 29.35], [34.0, 37.32], [43.0, 43.23], [46.0, 45.98], [57.0, 57.96], [66.0, 66.72], [67.0, 69.84], [82.0, 82.31], [85.0, 85.83], [87.0, 90.81], [94.0, 97.01], [145.0, 146.31], [149.0, 150.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.31, 31.1, 0.0, 0.0, 0.0, 0.0, 31.73, 0.0, 0.0, 28.89, 31.59, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 47.27], ["music", 26.29], ["vehicle", 4.47]], [["music", 78.07], ["synthesizer", 4.43], ["musical instrument", 3.96]], null, null, null, null, [["speech", 53.53], ["boing", 30.73], ["fart", 2.19]], null, null, [["speech", 53.38], ["vehicle", 15.2], ["car", 5.69]], [["fly, housefly", 19.55], ["hum", 12.25], ["insect", 4.87]], null, null], "duration": [0.5, 0.92, 0.81, 14.35, 3.32, 0.23, -0.02, 0.96, 0.72, 2.84, 0.31, 0.83, 3.81, 3.01, 1.31, 1.16]} \ No newline at end of file diff --git a/annotations_filtered/kh0exWqvxeI_filtered.json b/annotations_filtered/kh0exWqvxeI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97a1b5209b6d5733075a4dfe4d3a3cebf771d8e5 --- /dev/null +++ b/annotations_filtered/kh0exWqvxeI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.62], [5.0, 5.97], [7.0, 7.97], [9.0, 11.45], [13.0, 13.39], [16.0, 17.15], [18.0, 18.55], [19.0, 20.85], [23.0, 26.37], [28.0, 28.83], [29.0, 30.48], [31.0, 32.32], [34.0, 34.4], [37.0, 37.57], [41.0, 41.4], [42.0, 42.7], [43.0, 44.69], [45.0, 46.77], [50.0, 50.46], [52.0, 53.86], [55.0, 57.7], [64.0, 66.55], [70.0, 73.01], [77.0, 79.37], [83.0, 83.88], [89.0, 89.75], [91.0, 94.37], [97.0, 98.68], [99.0, 101.01], [102.0, 102.79], [107.0, 109.11], [112.0, 117.86], [123.0, 123.38], [126.0, 127.74]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 46.02, 0.0, 0.0, 0.0, 0.0, 33.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.6, 47.31, 38.63, 41.87, 0.0, 0.0, 70.44, 0.0, 46.72, 0.0, 33.23, 45.14, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 27.76], ["radio", 24.28], ["music", 6.51]], null, null, null, null, [["speech", 53.67], ["radio", 8.33], ["livestock, farm animals, working animals", 4.48]], null, null, null, null, null, null, null, null, null, null, null, null, [["radio", 19.2], ["noise", 13.88], ["hum", 10.45]], [["mains hum", 17.6], ["hum", 12.87], ["mosquito", 11.73]], [["speech", 11.73], ["music", 6.28], ["crowd", 4.56]], null, null, null, null, [["music", 22.41], ["speech", 11.57], ["musical instrument", 3.9]], null, [["speech", 34.78], ["sidetone", 28.8], ["boing", 8.68]], [["noise", 45.24], ["hum", 5.67], ["radio", 5.19]], null, null], "duration": [0.62, 0.97, 0.97, 2.45, 0.39, 1.15, 0.55, 1.85, 3.37, 0.83, 1.48, 1.32, 0.4, 0.57, 0.4, 0.7, 1.69, 1.77, 0.46, 1.86, 2.7, 2.55, 3.01, 2.37, 0.88, 0.75, 3.37, 1.68, 2.01, 0.79, 2.11, 5.86, 0.38, 1.74]} \ No newline at end of file diff --git a/annotations_filtered/kh1sYuFgUAM_filtered.json b/annotations_filtered/kh1sYuFgUAM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc7f4c5c4999d675e9f0d88abe1de11bdb2e4339 --- /dev/null +++ b/annotations_filtered/kh1sYuFgUAM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.55], [5.0, 7.35], [13.0, 15.15], [16.0, 18.18], [21.0, 25.93], [27.0, 29.76], [32.0, 37.17], [38.0, 48.9], [49.0, 50.18], [54.0, 54.33], [55.0, 60.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 96.17, 92.48, 93.29, 93.76, 95.37, 90.25, 45.69, 0.0, 0.0, 54.04], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 68.21], ["ambient music", 8.59], ["synthesizer", 4.46]], null, null, null], "duration": [1.55, 2.35, 2.15, 2.18, 4.93, 2.76, 5.17, 10.9, 1.18, 0.33, 5.49]} \ No newline at end of file diff --git a/annotations_filtered/kh62SjGdI0s_filtered.json b/annotations_filtered/kh62SjGdI0s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d002de32d01d442a1d260315d72b70b72fb8389 --- /dev/null +++ b/annotations_filtered/kh62SjGdI0s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.57], [15.0, 16.66], [19.0, 20.68], [22.0, 25.61], [28.0, 29.81], [38.0, 39.73], [41.0, 41.13], [42.0, 43.43], [44.0, 44.93], [48.0, 48.49], [53.0, 54.33], [56.0, 57.03], [60.0, 60.45], [61.0, 63.39], [70.0, 70.46], [73.0, 74.46], [78.0, 79.17], [81.0, 81.77], [85.0, 84.57], [85.0, 84.6], [89.0, 90.19], [91.0, 92.3], [97.0, 97.51], [104.0, 104.33], [106.0, 107.15], [116.0, 116.75], [122.0, 121.91], [126.0, 126.74], [129.0, 128.82], [134.0, 140.53], [142.0, 142.64], [144.0, 144.22], [145.0, 146.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.41, 0.0, 0.0, 81.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.57, 1.66, 1.68, 3.61, 1.81, 1.73, 0.13, 1.43, 0.93, 0.49, 1.33, 1.03, 0.45, 2.39, 0.46, 1.46, 1.17, 0.77, -0.43, -0.4, 1.19, 1.3, 0.51, 0.33, 1.15, 0.75, -0.09, 0.74, -0.18, 6.53, 0.64, 0.22, 1.35]} \ No newline at end of file diff --git a/annotations_filtered/khX9fjqlf40_filtered.json b/annotations_filtered/khX9fjqlf40_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e1d1f37640d20e611971ffab2f20a101f9662dc --- /dev/null +++ b/annotations_filtered/khX9fjqlf40_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.33], [5.0, 6.3], [8.0, 8.41], [14.0, 17.93], [21.0, 22.74], [25.0, 26.72], [29.0, 29.69], [32.0, 32.86], [35.0, 40.46], [41.0, 43.31], [44.0, 46.99], [48.0, 51.41], [52.0, 53.1], [55.0, 57.75], [60.0, 62.83], [65.0, 66.99], [68.0, 69.35], [72.0, 76.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 41.3, 0.0, 0.0, 0.0, 0.0, 74.76, 60.23, 72.16, 67.63, 0.0, 71.29, 44.96, 0.0, 0.0, 40.24], "audiomae_on_audioset": [null, null, null, [["speech", 49.47], ["hum", 15.12], ["mains hum", 6.71]], null, null, null, null, null, null, null, null, null, null, [["speech", 39.22], ["hum", 15.79], ["whale vocalization", 7.46]], null, null, [["whale vocalization", 90.38], ["hum", 4.57], ["mains hum", 1.25]]], "duration": [0.33, 1.3, 0.41, 3.93, 1.74, 1.72, 0.69, 0.86, 5.46, 2.31, 2.99, 3.41, 1.1, 2.75, 2.83, 1.99, 1.35, 4.87]} \ No newline at end of file diff --git a/annotations_filtered/kheP3iy8-6E_filtered.json b/annotations_filtered/kheP3iy8-6E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5650aab3292e0c99d50674ac17c1124336355ca6 --- /dev/null +++ b/annotations_filtered/kheP3iy8-6E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.24], [10.0, 10.15], [11.0, 11.85], [13.0, 14.22], [15.0, 15.11], [19.0, 20.01], [20.0, 21.9], [24.0, 24.11], [25.0, 25.71], [27.0, 28.0], [30.0, 30.62], [33.0, 33.22], [34.0, 34.65], [45.0, 44.73], [46.0, 47.34], [52.0, 53.18], [55.0, 55.86], [61.0, 61.16], [63.0, 63.41], [64.0, 67.09], [67.0, 69.28], [70.0, 71.56], [73.0, 73.53], [77.0, 83.96], [88.0, 97.7], [99.0, 99.33], [101.0, 104.43], [108.0, 108.14], [119.0, 119.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.54, 62.89, 0.0, 0.0, 61.57, 38.74, 0.0, 56.1, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.92], ["brass instrument", 10.79], ["trombone", 8.27]], null, null, null, null], "duration": [5.24, 0.15, 0.85, 1.22, 0.11, 1.01, 1.9, 0.11, 0.71, 1.0, 0.62, 0.22, 0.65, -0.27, 1.34, 1.18, 0.86, 0.16, 0.41, 3.09, 2.28, 1.56, 0.53, 6.96, 9.7, 0.33, 3.43, 0.14, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/khfeRoRCp7c_filtered.json b/annotations_filtered/khfeRoRCp7c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5faf07af4dda4d2873969a25a1651322dafaa0f --- /dev/null +++ b/annotations_filtered/khfeRoRCp7c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.92], [5.0, 5.19], [6.0, 9.64], [11.0, 13.58], [15.0, 15.97], [17.0, 18.28], [20.0, 21.61], [24.0, 26.22], [27.0, 29.19], [30.0, 30.55], [36.0, 39.45], [47.0, 48.07], [53.0, 58.16], [61.0, 61.94], [63.0, 66.58], [72.0, 77.08], [82.0, 82.49], [83.0, 82.97], [84.0, 84.96], [86.0, 89.94], [92.0, 93.56], [98.0, 113.97], [115.0, 116.87], [118.0, 120.53], [122.0, 125.79], [127.0, 128.51], [130.0, 145.42], [147.0, 146.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 67.63, 99.71, 0.0, 0.0, 0.0, 60.14, 58.72, 0.0, 39.6, 0.0, 35.66, 0.0, 61.67, 34.98, 0.0, 0.0, 0.0, 46.5, 0.0, 60.98, 0.0, 98.19, 98.44, 0.0, 37.1, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 61.26], ["humming", 5.06], ["singing", 3.37]], null, [["music", 65.37], ["humming", 7.98], ["lullaby", 3.75]], null, null, [["music", 73.61], ["theremin", 14.78], ["opera", 1.94]], null, null, null, [["music", 67.9], ["opera", 4.95], ["theremin", 3.97]], null, null, null, null, null, null, [["electric shaver, electric razor", 34.96], ["music", 20.44], ["hum", 5.57]], null], "duration": [0.92, 0.19, 3.64, 2.58, 0.97, 1.28, 1.61, 2.22, 2.19, 0.55, 3.45, 1.07, 5.16, 0.94, 3.58, 5.08, 0.49, -0.03, 0.96, 3.94, 1.56, 15.97, 1.87, 2.53, 3.79, 1.51, 15.42, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/khg8XoyKzs4_filtered.json b/annotations_filtered/khg8XoyKzs4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cc22dfe625c94c7a4aba1a162d039aba7d460d0 --- /dev/null +++ b/annotations_filtered/khg8XoyKzs4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 16.5], [21.0, 22.28], [26.0, 25.73], [28.0, 30.33], [31.0, 32.0], [33.0, 33.69], [39.0, 49.37], [51.0, 53.2], [59.0, 60.13], [67.0, 70.19], [71.0, 71.66], [72.0, 74.82], [78.0, 83.12], [84.0, 86.88], [104.0, 103.89], [105.0, 105.75], [107.0, 107.87], [112.0, 112.73], [121.0, 122.77]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.28, 0.0, 0.0, 33.68, 0.0, 0.0, 32.34, 35.08, 0.0, 33.01, 0.0, 32.82, 32.55, 32.11, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 39.06], ["speech", 34.34], ["musical instrument", 2.32]], null, null, [["music", 77.61], ["didgeridoo", 2.97], ["musical instrument", 2.75]], null, null, [["music", 87.58], ["musical instrument", 2.47], ["guitar", 2.23]], [["music", 54.6], ["musical instrument", 8.04], ["guitar", 3.77]], null, [["music", 77.36], ["synthetic singing", 3.27], ["musical instrument", 3.16]], null, [["music", 68.17], ["musical instrument", 3.39], ["guitar", 1.63]], [["music", 77.99], ["musical instrument", 4.13], ["guitar", 3.41]], [["music", 73.24], ["musical instrument", 6.31], ["guitar", 4.7]], null, null, null, null, null], "duration": [2.5, 1.28, -0.27, 2.33, 1.0, 0.69, 10.37, 2.2, 1.13, 3.19, 0.66, 2.82, 5.12, 2.88, -0.11, 0.75, 0.87, 0.73, 1.77]} \ No newline at end of file diff --git a/annotations_filtered/khz9zIg_2sc_filtered.json b/annotations_filtered/khz9zIg_2sc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d5feca230216b5023bf7b63bb19f737c4ccf3e4 --- /dev/null +++ b/annotations_filtered/khz9zIg_2sc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.23], [17.0, 17.51], [21.0, 31.56], [32.0, 37.13], [37.0, 38.52], [42.0, 42.47], [50.0, 52.03], [67.0, 68.03], [76.0, 76.1], [76.0, 90.32], [93.0, 96.58]], "keep_status": [false, false, false, true, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 30.71, 49.45, 0.0, 0.0, 45.69, 0.0, 0.0, 63.53, 39.15], "audiomae_on_audioset": [null, null, [["music", 65.53], ["drum", 3.33], ["swing music", 3.09]], [["speech", 36.27], ["music", 14.06], ["throbbing", 12.11]], null, null, [["speech", 25.82], ["music", 7.11], ["hum", 6.78]], null, null, null, [["speech", 50.21], ["music", 8.76], ["theremin", 4.7]]], "duration": [0.23, 0.51, 10.56, 5.13, 1.52, 0.47, 2.03, 1.03, 0.1, 14.32, 3.58]} \ No newline at end of file diff --git a/annotations_filtered/ki3zzZ-GsGI_filtered.json b/annotations_filtered/ki3zzZ-GsGI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e50730b605d427a9d81f5e17b37cff458c57528 --- /dev/null +++ b/annotations_filtered/ki3zzZ-GsGI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 19.92], [21.0, 26.84], [28.0, 62.01], [63.0, 65.64], [67.0, 67.95], [69.0, 72.67], [75.0, 78.66], [82.0, 83.17], [84.0, 85.72], [91.0, 102.52], [104.0, 105.49], [107.0, 107.6], [110.0, 118.72], [122.0, 156.78], [158.0, 158.62], [159.0, 160.1]], "keep_status": [true, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.11, 65.44, 0.0, 30.5, 0.0, 30.22, 30.46, 0.0, 0.0, 29.92, 0.0, 0.0, 30.06, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["applause", 22.77], ["crowd", 19.05], ["speech", 9.91]], null, null, [["music", 55.48], ["trombone", 5.73], ["musical instrument", 4.7]], null, [["music", 43.87], ["reggae", 9.09], ["swing music", 6.45]], [["music", 64.27], ["saxophone", 7.33], ["swing music", 6.93]], null, null, [["music", 72.08], ["musical instrument", 3.54], ["harmonica", 2.06]], null, null, [["music", 79.78], ["brass instrument", 2.34], ["reggae", 1.87]], null, null, null], "duration": [15.92, 5.84, 34.01, 2.64, 0.95, 3.67, 3.66, 1.17, 1.72, 11.52, 1.49, 0.6, 8.72, 34.78, 0.62, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/kiEe33aAucU_filtered.json b/annotations_filtered/kiEe33aAucU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb21935d1c311df2f5a02c13454c92d7a3f215a7 --- /dev/null +++ b/annotations_filtered/kiEe33aAucU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.01], [14.0, 20.97], [23.0, 31.83], [32.0, 51.58]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 32.53, 32.76, 30.46], "audiomae_on_audioset": [null, [["speech", 73.6], ["fireworks", 3.7], ["eruption", 3.14]], [["speech", 79.16], ["animal", 3.97], ["music", 2.69]], [["music", 53.31], ["speech", 23.43], ["hum", 9.0]]], "duration": [0.01, 6.97, 8.83, 19.58]} \ No newline at end of file diff --git a/annotations_filtered/kicjYh3v1FI_filtered.json b/annotations_filtered/kicjYh3v1FI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..437fd53cc681642f131282f9344a3fccca9c845f --- /dev/null +++ b/annotations_filtered/kicjYh3v1FI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.82], [9.0, 9.05], [23.0, 23.13], [31.0, 34.06], [37.0, 37.2], [39.0, 39.63], [40.0, 41.05], [49.0, 50.62], [54.0, 60.42], [64.0, 64.49], [65.0, 66.02], [75.0, 75.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 91.64, 0.0, 0.0, 0.0, 0.0, 95.23, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.82, 0.05, 0.13, 3.06, 0.2, 0.63, 1.05, 1.62, 6.42, 0.49, 1.02, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/kjLqB63ihJE_filtered.json b/annotations_filtered/kjLqB63ihJE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4265bf6d62e1003bd7da59e2874be61ce129dfa1 --- /dev/null +++ b/annotations_filtered/kjLqB63ihJE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 24.68], [26.0, 49.84], [52.0, 53.94], [55.0, 58.5], [60.0, 64.61], [66.0, 74.92], [79.0, 82.68], [91.0, 93.06], [95.0, 97.43], [99.0, 102.81], [110.0, 111.38], [113.0, 114.54], [115.0, 118.69]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [32.75, 37.49, 0.0, 46.94, 53.4, 30.47, 30.39, 33.57, 49.0, 41.24, 0.0, 0.0, 32.85], "audiomae_on_audioset": [[["hum", 41.08], ["throbbing", 25.91], ["music", 8.3]], [["music", 36.57], ["hum", 29.31], ["throbbing", 22.82]], null, [["music", 50.97], ["speech", 16.83], ["throbbing", 5.76]], null, [["music", 18.86], ["speech", 17.63], ["throbbing", 16.42]], [["music", 68.08], ["musical instrument", 3.63], ["throbbing", 3.15]], [["music", 54.6], ["speech", 26.21], ["throbbing", 5.39]], [["music", 62.31], ["quack", 7.12], ["fart", 3.04]], [["music", 40.83], ["throbbing", 17.62], ["hum", 9.39]], null, null, [["music", 57.33], ["speech", 10.61], ["throbbing", 7.92]]], "duration": [13.68, 23.84, 1.94, 3.5, 4.61, 8.92, 3.68, 2.06, 2.43, 3.81, 1.38, 1.54, 3.69]} \ No newline at end of file diff --git a/annotations_filtered/kjd3eUIBSj0_filtered.json b/annotations_filtered/kjd3eUIBSj0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3ba9abf22e5c4cef0ed91e6a176ccc9b43a40bc --- /dev/null +++ b/annotations_filtered/kjd3eUIBSj0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.94], [18.0, 18.17], [20.0, 20.78], [25.0, 25.66], [30.0, 30.94], [37.0, 63.21], [68.0, 68.91], [81.0, 80.84]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 34.91, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 88.82], ["synthesizer", 1.65], ["electronic music", 1.27]], null, null], "duration": [0.94, 0.17, 0.78, 0.66, 0.94, 26.21, 0.91, -0.16]} \ No newline at end of file diff --git a/annotations_filtered/kjtPUnPa0LQ_filtered.json b/annotations_filtered/kjtPUnPa0LQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2457c0166b620f8d99b4ea11da8df9b287890557 --- /dev/null +++ b/annotations_filtered/kjtPUnPa0LQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[85.0, 135.7], [138.0, 147.65], [148.0, 150.36], [151.0, 150.63], [151.0, 153.06]], "keep_status": [false, true, false, false, false], "silence_prob": [0.0, 34.68, 46.26, 0.0, 84.07], "audiomae_on_audioset": [null, [["music", 30.61], ["hum", 16.86], ["explosion", 9.22]], [["fly, housefly", 36.72], ["insect", 33.35], ["bee, wasp, etc.", 9.07]], null, null], "duration": [50.7, 9.65, 2.36, -0.37, 2.06]} \ No newline at end of file diff --git a/annotations_filtered/kjzRZCxQ1EE_filtered.json b/annotations_filtered/kjzRZCxQ1EE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20bfa496de138fdabc1ae279863859543b07307a --- /dev/null +++ b/annotations_filtered/kjzRZCxQ1EE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.63], [6.0, 7.59], [11.0, 12.02], [14.0, 14.61], [16.0, 17.58], [18.0, 18.71], [20.0, 20.07], [21.0, 22.2], [24.0, 25.27], [26.0, 26.94], [28.0, 28.31], [30.0, 31.11], [31.0, 32.7], [40.0, 40.73], [42.0, 44.04], [45.0, 46.18], [49.0, 50.63], [51.0, 53.01], [54.0, 54.28], [58.0, 58.68], [60.0, 61.01], [64.0, 64.49], [67.0, 67.44], [69.0, 70.28], [71.0, 71.9], [72.0, 73.68], [75.0, 76.0], [77.0, 77.97], [78.0, 78.98], [81.0, 81.51], [82.0, 83.24], [84.0, 85.43], [86.0, 87.76], [89.0, 91.03], [92.0, 93.6], [96.0, 96.62], [98.0, 97.75], [100.0, 100.72], [102.0, 102.47], [104.0, 104.31], [106.0, 111.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.85], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.63, 1.59, 1.02, 0.61, 1.58, 0.71, 0.07, 1.2, 1.27, 0.94, 0.31, 1.11, 1.7, 0.73, 2.04, 1.18, 1.63, 2.01, 0.28, 0.68, 1.01, 0.49, 0.44, 1.28, 0.9, 1.68, 1.0, 0.97, 0.98, 0.51, 1.24, 1.43, 1.76, 2.03, 1.6, 0.62, -0.25, 0.72, 0.47, 0.31, 5.7]} \ No newline at end of file diff --git a/annotations_filtered/kk0vH1qJPHk_filtered.json b/annotations_filtered/kk0vH1qJPHk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f4da6b0c88aa31fec27230a657458f9431cb87e --- /dev/null +++ b/annotations_filtered/kk0vH1qJPHk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.29], [12.0, 32.44], [36.0, 79.08], [82.0, 92.62], [95.0, 100.94], [102.0, 114.02], [116.0, 118.39]], "keep_status": [false, true, false, false, false, true, true], "silence_prob": [0.0, 31.27, 0.0, 34.66, 65.2, 40.12, 33.22], "audiomae_on_audioset": [null, [["music", 22.15], ["buzz", 18.72], ["vehicle", 5.44]], null, [["gong", 86.18], ["hum", 2.56], ["music", 2.51]], null, [["hum", 34.83], ["music", 16.53], ["mains hum", 13.31]], [["speech", 18.85], ["music", 16.4], ["hum", 13.1]]], "duration": [1.29, 20.44, 43.08, 10.62, 5.94, 12.02, 2.39]} \ No newline at end of file diff --git a/annotations_filtered/kk2HQ0hCGTE_filtered.json b/annotations_filtered/kk2HQ0hCGTE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be110b91f2affc7787a52baa2806f820847fc192 --- /dev/null +++ b/annotations_filtered/kk2HQ0hCGTE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 3.69], [9.0, 10.44], [12.0, 12.85], [15.0, 15.3], [21.0, 23.35], [24.0, 27.36], [29.0, 29.52], [31.0, 30.97], [31.0, 31.87], [33.0, 33.62], [35.0, 35.58], [38.0, 41.69], [42.0, 42.42], [43.0, 45.89], [48.0, 48.02], [48.0, 49.35], [52.0, 52.51], [54.0, 55.02], [56.0, 67.0], [68.0, 73.75], [74.0, 74.58], [76.0, 76.76], [79.0, 79.46], [84.0, 85.43], [86.0, 87.84], [89.0, 93.55], [95.0, 95.59], [97.0, 98.42], [100.0, 107.35], [109.0, 109.11], [112.0, 115.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [86.82, 0.0, 0.0, 0.0, 83.16, 64.52, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 69.47, 0.0, 0.0, 0.0, 0.0, 57.72, 63.85, 0.0, 0.0, 0.0, 0.0, 0.0, 73.36, 0.0, 0.0, 46.61, 0.0, 36.52], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 83.44], ["synthesizer", 2.72], ["theremin", 1.77]], null, [["mains hum", 31.56], ["hum", 20.03], ["music", 15.34]]], "duration": [3.69, 1.44, 0.85, 0.3, 2.35, 3.36, 0.52, -0.03, 0.87, 0.62, 0.58, 3.69, 0.42, 2.89, 0.02, 1.35, 0.51, 1.02, 11.0, 5.75, 0.58, 0.76, 0.46, 1.43, 1.84, 4.55, 0.59, 1.42, 7.35, 0.11, 3.1]} \ No newline at end of file diff --git a/annotations_filtered/kk8MNQHBJkY_filtered.json b/annotations_filtered/kk8MNQHBJkY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3640b00eec12d0f446c94ce2ddccaf80c0926f23 --- /dev/null +++ b/annotations_filtered/kk8MNQHBJkY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.1], [14.0, 14.44], [20.0, 20.8], [23.0, 22.84], [24.0, 24.48], [27.0, 27.26], [29.0, 29.34], [32.0, 32.83], [34.0, 35.19], [50.0, 51.61], [54.0, 54.87], [56.0, 59.0], [60.0, 60.57], [62.0, 62.58], [63.0, 63.76], [69.0, 72.28], [76.0, 85.28], [90.0, 90.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.86, 0.0, 0.0, 0.0, 35.11, 35.65, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 29.34], ["mains hum", 18.37], ["hum", 10.56]], [["hum", 53.53], ["mains hum", 26.38], ["throbbing", 7.21]], null], "duration": [1.1, 0.44, 0.8, -0.16, 0.48, 0.26, 0.34, 0.83, 1.19, 1.61, 0.87, 3.0, 0.57, 0.58, 0.76, 3.28, 9.28, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/klnVwzouc_k_filtered.json b/annotations_filtered/klnVwzouc_k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..598539a48ebd4f2a72de72c4c54f38daab95c305 --- /dev/null +++ b/annotations_filtered/klnVwzouc_k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.51], [10.0, 11.33], [15.0, 20.63], [22.0, 25.27], [26.0, 27.73], [31.0, 42.11], [43.0, 50.77], [55.0, 56.1], [58.0, 59.16], [60.0, 62.4], [65.0, 64.99], [70.0, 70.77], [72.0, 72.22], [74.0, 75.93], [87.0, 87.39], [97.0, 96.85], [100.0, 100.33], [107.0, 108.08], [116.0, 116.61], [122.0, 123.04], [128.0, 129.09], [138.0, 138.92], [144.0, 144.64], [150.0, 150.3], [152.0, 153.32]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.59, 0.0, 96.42, 44.55, 0.0, 99.36, 43.53, 0.0, 0.0, 92.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 33.64], ["thunk", 5.58], ["cello", 5.47]], null, null, [["music", 19.42], ["hum", 16.76], ["mains hum", 15.3]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.51, 1.33, 5.63, 3.27, 1.73, 11.11, 7.77, 1.1, 1.16, 2.4, -0.01, 0.77, 0.22, 1.93, 0.39, -0.15, 0.33, 1.08, 0.61, 1.04, 1.09, 0.92, 0.64, 0.3, 1.32]} \ No newline at end of file diff --git a/annotations_filtered/klpN-W3Z8Cw_filtered.json b/annotations_filtered/klpN-W3Z8Cw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72db48ed7064c22f99dfd8192fbe8b7ded122c78 --- /dev/null +++ b/annotations_filtered/klpN-W3Z8Cw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 37.91], [40.0, 45.15], [46.0, 59.56], [60.0, 81.24], [84.0, 96.33], [97.0, 97.71], [98.0, 99.94], [100.0, 117.19], [118.0, 119.25], [120.0, 123.72]], "keep_status": [true, false, true, true, true, false, false, true, false, false], "silence_prob": [31.34, 31.91, 31.19, 31.2, 30.84, 0.0, 0.0, 31.91, 0.0, 33.83], "audiomae_on_audioset": [[["music", 53.57], ["cacophony", 7.97], ["throbbing", 7.2]], [["music", 35.98], ["speech", 30.12], ["mains hum", 8.88]], [["cacophony", 33.08], ["music", 23.9], ["throbbing", 6.69]], [["music", 30.39], ["speech", 22.68], ["machine gun", 10.96]], [["music", 36.14], ["machine gun", 20.2], ["cacophony", 9.56]], null, null, [["music", 35.53], ["speech", 12.28], ["hum", 7.37]], null, [["music", 40.5], ["throbbing", 16.05], ["pulse", 14.44]]], "duration": [17.91, 5.15, 13.56, 21.24, 12.33, 0.71, 1.94, 17.19, 1.25, 3.72]} \ No newline at end of file diff --git a/annotations_filtered/klt86blKwaA_filtered.json b/annotations_filtered/klt86blKwaA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65a679ddab6ec10813b431ab3550573251d9ffcc --- /dev/null +++ b/annotations_filtered/klt86blKwaA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.88], [12.0, 17.49], [19.0, 19.52], [28.0, 29.74], [31.0, 31.8], [37.0, 37.27], [43.0, 44.93], [48.0, 48.05], [49.0, 49.81], [58.0, 69.2], [77.0, 77.23], [78.0, 78.39], [79.0, 79.12], [82.0, 82.7], [85.0, 84.91], [86.0, 86.71], [88.0, 89.07], [91.0, 91.98], [93.0, 92.94], [94.0, 96.13], [97.0, 98.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 83.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.71, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.12, 5.49, 0.52, 1.74, 0.8, 0.27, 1.93, 0.05, 0.81, 11.2, 0.23, 0.39, 0.12, 0.7, -0.09, 0.71, 1.07, 0.98, -0.06, 2.13, 1.36]} \ No newline at end of file diff --git a/annotations_filtered/km3VtR6mqmg_filtered.json b/annotations_filtered/km3VtR6mqmg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c58a43e5a8cff9351edf4e0ce24dafeabafeddc --- /dev/null +++ b/annotations_filtered/km3VtR6mqmg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.61], [3.0, 2.74], [3.0, 2.89], [6.0, 18.66], [26.0, 50.84], [56.0, 90.19], [91.0, 94.39], [96.0, 102.2], [106.0, 107.74], [108.0, 107.77], [108.0, 108.33], [109.0, 111.57], [112.0, 113.36], [114.0, 128.39], [130.0, 132.38]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.12, 30.97, 0.0, 36.83, 30.02, 0.0, 0.0, 0.0, 36.2, 0.0, 30.3, 32.81], "audiomae_on_audioset": [null, null, null, [["music", 33.57], ["skidding", 22.02], ["vehicle", 16.49]], [["music", 44.11], ["throbbing", 14.74], ["vehicle", 7.88]], null, [["hum", 37.61], ["speech", 17.74], ["mains hum", 15.12]], [["music", 23.78], ["hum", 15.62], ["throbbing", 15.46]], null, null, null, [["music", 62.96], ["throbbing", 17.68], ["hum", 9.71]], null, [["music", 66.06], ["vehicle", 6.61], ["speech", 3.82]], [["music", 47.26], ["hum", 16.65], ["throbbing", 14.79]]], "duration": [-0.39, -0.26, -0.11, 12.66, 24.84, 34.19, 3.39, 6.2, 1.74, -0.23, 0.33, 2.57, 1.36, 14.39, 2.38]} \ No newline at end of file diff --git a/annotations_filtered/km7CMB9s8ok_filtered.json b/annotations_filtered/km7CMB9s8ok_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a8050dff27b1e1d11796a5c60db3cc2cdcf4c91 --- /dev/null +++ b/annotations_filtered/km7CMB9s8ok_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.57], [11.0, 11.8], [13.0, 13.36], [18.0, 17.85], [20.0, 20.56], [21.0, 21.3], [23.0, 24.78], [31.0, 33.0], [35.0, 36.26], [37.0, 39.18], [48.0, 48.32], [49.0, 49.4], [51.0, 51.93], [52.0, 63.41], [97.0, 97.65], [98.0, 98.17], [98.0, 98.39], [98.0, 98.42], [98.0, 98.69], [99.0, 104.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.07, 0.0, 91.47, 0.0, 0.0, 0.0, 63.85, 0.0, 0.0, 0.0, 0.0, 0.0, 58.38], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.57, 0.8, 0.36, -0.15, 0.56, 0.3, 1.78, 2.0, 1.26, 2.18, 0.32, 0.4, 0.93, 11.41, 0.65, 0.17, 0.39, 0.42, 0.69, 5.52]} \ No newline at end of file diff --git a/annotations_filtered/kmgRv2V_7P4_filtered.json b/annotations_filtered/kmgRv2V_7P4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9054ef8023ee7ba6f8295798dc561f8e748b4660 --- /dev/null +++ b/annotations_filtered/kmgRv2V_7P4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.74], [21.0, 37.37], [47.0, 48.95], [57.0, 57.57], [92.0, 93.39], [97.0, 97.39], [103.0, 103.91], [107.0, 108.24], [110.0, 114.56], [116.0, 120.06]], "keep_status": [false, true, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 29.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.75, 55.81], "audiomae_on_audioset": [null, [["music", 31.58], ["hum", 22.27], ["speech", 15.23]], null, null, null, null, null, null, [["hum", 32.78], ["mains hum", 15.99], ["wind chime", 4.63]], null], "duration": [1.74, 16.37, 1.95, 0.57, 1.39, 0.39, 0.91, 1.24, 4.56, 4.06]} \ No newline at end of file diff --git a/annotations_filtered/kmjblNu2_6M_filtered.json b/annotations_filtered/kmjblNu2_6M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e58bfce9141958991e593148b47181e5215fa6b --- /dev/null +++ b/annotations_filtered/kmjblNu2_6M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.45], [7.0, 13.12], [14.0, 14.98], [18.0, 19.43], [25.0, 28.54], [32.0, 49.74], [53.0, 53.77], [55.0, 67.29], [69.0, 71.71], [76.0, 80.38], [83.0, 112.09], [113.0, 122.94]], "keep_status": [false, true, false, false, true, false, false, false, true, false, false, true], "silence_prob": [93.45, 36.6, 0.0, 0.0, 30.18, 31.91, 0.0, 30.85, 30.74, 31.83, 31.03, 34.36], "audiomae_on_audioset": [null, [["music", 16.22], ["thunk", 10.18], ["speech", 9.32]], null, null, [["music", 28.6], ["speech", 22.01], ["fart", 12.81]], [["music", 44.64], ["speech", 32.16], ["fart", 8.69]], null, [["music", 66.79], ["speech", 7.47], ["musical instrument", 2.97]], [["music", 27.06], ["speech", 22.85], ["explosion", 7.79]], [["music", 43.66], ["speech", 26.82], ["boing", 3.17]], [["music", 38.45], ["speech", 32.02], ["didgeridoo", 4.0]], [["music", 29.62], ["throbbing", 11.79], ["speech", 10.37]]], "duration": [2.45, 6.12, 0.98, 1.43, 3.54, 17.74, 0.77, 12.29, 2.71, 4.38, 29.09, 9.94]} \ No newline at end of file diff --git a/annotations_filtered/kmr68ZevIrM_filtered.json b/annotations_filtered/kmr68ZevIrM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e4b0d076544a42f2ceee6983570f4bbb8f2a65c --- /dev/null +++ b/annotations_filtered/kmr68ZevIrM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.43], [4.0, 6.52], [9.0, 8.82], [11.0, 13.64], [15.0, 15.3], [20.0, 20.58], [22.0, 22.74], [24.0, 23.87], [25.0, 25.89], [29.0, 31.28], [39.0, 40.86], [44.0, 49.0], [51.0, 52.0], [54.0, 53.94], [55.0, 55.71], [58.0, 58.29], [62.0, 62.09], [64.0, 64.83], [66.0, 67.95], [72.0, 73.3], [88.0, 88.21], [95.0, 96.09], [99.0, 100.11], [104.0, 104.36], [106.0, 107.69], [109.0, 109.63], [116.0, 117.96], [122.0, 122.74], [131.0, 132.07], [135.0, 137.24], [139.0, 139.06], [141.0, 141.51], [144.0, 144.24], [146.0, 145.61], [148.0, 149.84], [151.0, 154.7], [157.0, 157.77], [160.0, 161.47], [164.0, 166.46], [168.0, 168.24], [170.0, 171.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 91.98, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 0.0, 91.64, 0.0, 68.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 79.76, 0.0, 0.0, 93.45, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.43, 2.52, -0.18, 2.64, 0.3, 0.58, 0.74, -0.13, 0.89, 2.28, 1.86, 5.0, 1.0, -0.06, 0.71, 0.29, 0.09, 0.83, 1.95, 1.3, 0.21, 1.09, 1.11, 0.36, 1.69, 0.63, 1.96, 0.74, 1.07, 2.24, 0.06, 0.51, 0.24, -0.39, 1.84, 3.7, 0.77, 1.47, 2.46, 0.24, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/kn5Sc8o9YTM_filtered.json b/annotations_filtered/kn5Sc8o9YTM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d93969d00524eae5c281d63c01aea389d645970 --- /dev/null +++ b/annotations_filtered/kn5Sc8o9YTM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.66], [3.0, 8.01], [10.0, 11.65], [12.0, 13.19], [15.0, 15.45], [19.0, 19.95], [20.0, 21.68], [27.0, 31.13], [32.0, 33.67], [40.0, 40.53], [49.0, 50.53], [58.0, 62.04], [63.0, 64.07], [64.0, 64.77], [66.0, 66.83], [68.0, 69.28], [70.0, 71.51], [73.0, 73.38], [74.0, 74.38], [75.0, 75.88], [78.0, 78.8], [81.0, 81.84], [83.0, 84.25], [90.0, 91.18], [92.0, 92.37], [94.0, 94.76], [95.0, 96.58], [99.0, 100.28], [103.0, 105.21], [107.0, 108.67], [112.0, 112.77], [129.0, 129.91], [137.0, 138.94]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 47.7, 0.0, 0.0, 0.0, 0.0, 0.0, 73.82, 0.0, 0.0, 0.0, 46.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.56, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 33.76], ["music", 19.3], ["hum", 7.77]], null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 27.17], ["cattle, bovinae", 23.86], ["moo", 18.57]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["moo", 34.07], ["cattle, bovinae", 31.59], ["music", 11.23]], null, null, null, null], "duration": [0.66, 5.01, 1.65, 1.19, 0.45, 0.95, 1.68, 4.13, 1.67, 0.53, 1.53, 4.04, 1.07, 0.77, 0.83, 1.28, 1.51, 0.38, 0.38, 0.88, 0.8, 0.84, 1.25, 1.18, 0.37, 0.76, 1.58, 1.28, 2.21, 1.67, 0.77, 0.91, 1.94]} \ No newline at end of file diff --git a/annotations_filtered/kn8k_ox5OXs_filtered.json b/annotations_filtered/kn8k_ox5OXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b400ac6ef875deef23b694b3ae5eceaf3e96a17 --- /dev/null +++ b/annotations_filtered/kn8k_ox5OXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 14.66], [18.0, 32.29], [36.0, 38.3], [40.0, 50.01], [51.0, 52.35], [53.0, 52.84], [53.0, 53.0], [53.0, 55.34], [56.0, 56.88], [63.0, 64.47], [67.0, 78.58], [81.0, 97.46], [101.0, 107.06], [108.0, 111.91], [115.0, 115.1], [117.0, 117.09], [121.0, 121.54], [123.0, 123.94], [125.0, 132.22], [134.0, 149.37], [151.0, 163.14]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [41.18, 36.01, 35.59, 36.17, 0.0, 0.0, 0.0, 38.4, 0.0, 0.0, 33.29, 32.09, 32.92, 56.55, 0.0, 0.0, 0.0, 0.0, 39.99, 32.92, 31.6], "audiomae_on_audioset": [[["music", 64.74], ["didgeridoo", 11.36], ["musical instrument", 8.03]], [["music", 40.31], ["hum", 14.26], ["mains hum", 6.46]], [["music", 34.92], ["hum", 22.39], ["throbbing", 7.14]], [["music", 62.4], ["theremin", 12.16], ["hum", 5.94]], null, null, null, [["music", 64.49], ["speech", 6.45], ["musical instrument", 3.79]], null, null, [["music", 69.68], ["theremin", 5.64], ["electronic music", 5.23]], [["throbbing", 39.31], ["hum", 27.91], ["music", 20.49]], [["music", 53.25], ["throbbing", 6.82], ["ambient music", 5.98]], null, null, null, null, null, [["mains hum", 36.62], ["hum", 19.6], ["music", 16.37]], [["music", 29.16], ["hum", 21.48], ["speech", 11.74]], [["music", 66.89], ["cello", 3.61], ["bowed string instrument", 2.59]]], "duration": [6.66, 14.29, 2.3, 10.01, 1.35, -0.16, 0.0, 2.34, 0.88, 1.47, 11.58, 16.46, 6.06, 3.91, 0.1, 0.09, 0.54, 0.94, 7.22, 15.37, 12.14]} \ No newline at end of file diff --git a/annotations_filtered/knJ438gN25k_filtered.json b/annotations_filtered/knJ438gN25k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4ceb7a680ac45ba5815ddf4064351c7aecf2eed --- /dev/null +++ b/annotations_filtered/knJ438gN25k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.01], [14.0, 14.27], [20.0, 20.34], [24.0, 24.6], [25.0, 25.68], [28.0, 38.16], [39.0, 39.36], [42.0, 69.84], [71.0, 77.82], [80.0, 80.08], [80.0, 80.67]], "keep_status": [false, false, false, false, false, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 38.54, 0.0, 41.85, 46.61, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 21.3], ["hum", 20.85], ["mains hum", 9.88]], null, [["music", 49.83], ["flute", 6.59], ["wind instrument, woodwind instrument", 4.73]], [["music", 53.13], ["musical instrument", 3.75], ["theremin", 3.18]], null, null], "duration": [1.01, 0.27, 0.34, 0.6, 0.68, 10.16, 0.36, 27.84, 6.82, 0.08, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/knL5zY1LRqw_filtered.json b/annotations_filtered/knL5zY1LRqw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f19684697a1b01140f97f0760f98b8cab716b31 --- /dev/null +++ b/annotations_filtered/knL5zY1LRqw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.77], [13.0, 15.57], [17.0, 17.39], [21.0, 21.51], [26.0, 30.91], [35.0, 35.16], [37.0, 38.25], [39.0, 40.71], [43.0, 43.26], [45.0, 46.26], [47.0, 49.08], [50.0, 51.07], [51.0, 52.37], [53.0, 53.45], [63.0, 63.95], [65.0, 67.17], [71.0, 71.59], [77.0, 80.57], [82.0, 82.36], [89.0, 92.89], [94.0, 94.73], [99.0, 99.17], [116.0, 116.33], [127.0, 127.43]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 62.07, 0.0, 0.0, 30.72, 0.0, 0.0, 0.0, 0.0, 0.0, 58.81, 0.0, 0.0, 0.0, 0.0, 42.26, 0.0, 31.01, 0.0, 33.63, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["tuning fork", 15.09], ["music", 12.32], ["sound effect", 9.92]], null, null, null, null, null, null, null, null, null, null, [["music", 22.83], ["throbbing", 22.43], ["hum", 11.11]], null, [["music", 67.69], ["frog", 4.05], ["musical instrument", 3.74]], null, [["thunk", 30.67], ["stomach rumble", 17.58], ["music", 14.3]], null, null, null, null], "duration": [1.77, 2.57, 0.39, 0.51, 4.91, 0.16, 1.25, 1.71, 0.26, 1.26, 2.08, 1.07, 1.37, 0.45, 0.95, 2.17, 0.59, 3.57, 0.36, 3.89, 0.73, 0.17, 0.33, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/kndeWhsNlJs_filtered.json b/annotations_filtered/kndeWhsNlJs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c88eb13346cbccce33abba2f3db98c2a72ce13c --- /dev/null +++ b/annotations_filtered/kndeWhsNlJs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 26.27], [27.0, 34.91], [35.0, 37.89], [39.0, 46.13], [47.0, 47.66], [49.0, 54.68], [56.0, 83.25], [84.0, 93.07], [93.0, 106.81]], "keep_status": [true, true, true, false, false, false, false, false, true], "silence_prob": [31.14, 32.42, 31.4, 39.33, 0.0, 30.99, 30.93, 60.89, 29.56], "audiomae_on_audioset": [[["music", 26.4], ["mains hum", 22.18], ["hum", 19.79]], [["didgeridoo", 30.29], ["music", 24.04], ["musical instrument", 6.59]], [["speech", 34.12], ["music", 16.65], ["didgeridoo", 10.41]], [["music", 55.93], ["didgeridoo", 11.42], ["musical instrument", 4.93]], null, [["music", 83.61], ["musical instrument", 4.02], ["guitar", 2.8]], [["music", 60.2], ["didgeridoo", 12.35], ["musical instrument", 6.52]], null, [["music", 28.39], ["mains hum", 17.26], ["hum", 8.75]]], "duration": [19.27, 7.91, 2.89, 7.13, 0.66, 5.68, 27.25, 9.07, 13.81]} \ No newline at end of file diff --git a/annotations_filtered/kntQNeSge5s_filtered.json b/annotations_filtered/kntQNeSge5s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e24fbf30bf462a9dc04cec5388e6e1becc3c23e8 --- /dev/null +++ b/annotations_filtered/kntQNeSge5s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.92], [31.0, 31.55], [33.0, 37.2], [43.0, 44.73], [66.0, 71.76], [78.0, 78.93], [86.0, 86.34], [91.0, 91.62], [93.0, 93.6], [104.0, 130.18], [133.0, 135.01], [136.0, 141.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.44, 0.0, 31.07, 0.0, 0.0, 0.0, 0.0, 30.83, 77.36, 43.69], "audiomae_on_audioset": [null, null, [["music", 76.4], ["crowd", 2.13], ["musical instrument", 2.04]], null, [["music", 84.28], ["electronic music", 1.81], ["throbbing", 1.8]], null, null, null, null, [["music", 89.05], ["electronic music", 1.48], ["house music", 0.79]], null, [["hum", 56.06], ["mains hum", 17.22], ["throbbing", 10.34]]], "duration": [0.92, 0.55, 4.2, 1.73, 5.76, 0.93, 0.34, 0.62, 0.6, 26.18, 2.01, 5.52]} \ No newline at end of file diff --git a/annotations_filtered/koPEnaz0Qm8_filtered.json b/annotations_filtered/koPEnaz0Qm8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5337fff59f6d981eb7a06b54013646128e6d2659 --- /dev/null +++ b/annotations_filtered/koPEnaz0Qm8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.1], [11.0, 12.46], [19.0, 33.27], [35.0, 36.54], [41.0, 42.53], [46.0, 46.47], [48.0, 48.63], [50.0, 50.26], [51.0, 51.17]], "keep_status": [true, false, true, false, false, false, false, false, false], "silence_prob": [31.56, 0.0, 31.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 20.98], ["fart", 12.37], ["cacophony", 7.47]], null, [["speech", 47.66], ["music", 15.16], ["buzz", 7.0]], null, null, null, null, null, null], "duration": [2.1, 1.46, 14.27, 1.54, 1.53, 0.47, 0.63, 0.26, 0.17]} \ No newline at end of file diff --git a/annotations_filtered/koWVPnRRGlA_filtered.json b/annotations_filtered/koWVPnRRGlA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2c99e344f22cf5373120830184d6c088fc34f5a --- /dev/null +++ b/annotations_filtered/koWVPnRRGlA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.97], [8.0, 18.77], [21.0, 100.28], [101.0, 101.55], [102.0, 102.64], [104.0, 106.2], [108.0, 109.49], [110.0, 110.4]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 28.8, 0.0, 0.0, 0.0, 41.52, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 84.42], ["explosion", 4.39], ["burst, pop", 1.88]], null, null, null, [["beatboxing", 71.81], ["music", 5.04], ["vocal music", 4.59]], null, null], "duration": [0.97, 10.77, 79.28, 0.55, 0.64, 2.2, 1.49, 0.4]} \ No newline at end of file diff --git a/annotations_filtered/koWhZSL1Kwo_filtered.json b/annotations_filtered/koWhZSL1Kwo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae006cd0ff6c35added2ce2cb61c71bdc0ad782e --- /dev/null +++ b/annotations_filtered/koWhZSL1Kwo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.1], [10.0, 10.05], [33.0, 33.03], [35.0, 35.88], [37.0, 37.39], [40.0, 40.17], [42.0, 42.31], [59.0, 62.16], [68.0, 70.85], [71.0, 71.32], [72.0, 72.17], [72.0, 73.43], [75.0, 75.24], [76.0, 76.38], [81.0, 81.14], [83.0, 89.23], [93.0, 96.43], [97.0, 101.6], [102.0, 104.87], [105.0, 116.04], [118.0, 118.18], [122.0, 123.08], [129.0, 129.41], [134.0, 134.15]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [64.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.44, 40.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.52, 80.11, 57.81, 69.88, 37.22, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 18.35], ["roaring cats (lions, tigers)", 15.65], ["whale vocalization", 14.59]], null, null, null, null, null, null, [["music", 42.52], ["theremin", 12.47], ["animal", 6.37]], null, null, null, [["grunt", 20.22], ["music", 7.77], ["sound effect", 7.22]], null, null, null, null], "duration": [4.1, 0.05, 0.03, 0.88, 0.39, 0.17, 0.31, 3.16, 2.85, 0.32, 0.17, 1.43, 0.24, 0.38, 0.14, 6.23, 3.43, 4.6, 2.87, 11.04, 0.18, 1.08, 0.41, 0.15]} \ No newline at end of file diff --git a/annotations_filtered/koX0RDUQHFs_filtered.json b/annotations_filtered/koX0RDUQHFs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62b7832d14d19a314e076a73de4de41cb3aec644 --- /dev/null +++ b/annotations_filtered/koX0RDUQHFs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 25.95], [26.0, 27.03], [29.0, 29.12], [30.0, 37.44], [46.0, 51.49], [54.0, 54.58], [56.0, 55.93], [58.0, 58.9], [60.0, 59.95], [63.0, 62.87], [64.0, 65.21], [68.0, 72.37], [75.0, 74.82], [77.0, 77.52], [81.0, 86.46], [87.0, 88.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [41.3, 0.0, 0.0, 53.72, 67.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.25, 0.0, 0.0, 81.89, 0.0], "audiomae_on_audioset": [[["music", 31.13], ["speech", 22.57], ["synthesizer", 21.46]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [23.95, 1.03, 0.12, 7.44, 5.49, 0.58, -0.07, 0.9, -0.05, -0.13, 1.21, 4.37, -0.18, 0.52, 5.46, 1.5]} \ No newline at end of file diff --git a/annotations_filtered/koZie6TLz3s_filtered.json b/annotations_filtered/koZie6TLz3s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ee5d533b4d40b00d279dbdbc66fccdb77c3f4f1 --- /dev/null +++ b/annotations_filtered/koZie6TLz3s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.21], [13.0, 12.93], [16.0, 16.06], [17.0, 17.17], [17.0, 17.78], [20.0, 20.71], [22.0, 22.05], [22.0, 22.72], [25.0, 25.34], [25.0, 25.46], [26.0, 26.49], [27.0, 28.16], [30.0, 31.78], [33.0, 34.77], [39.0, 39.26], [46.0, 45.66], [47.0, 48.69], [50.0, 52.0], [54.0, 54.06], [80.0, 81.63], [90.0, 90.07], [125.0, 125.78], [143.0, 143.78], [145.0, 146.31], [147.0, 153.96], [155.0, 156.61], [157.0, 157.71], [167.0, 168.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.81, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.21, -0.07, 0.06, 0.17, 0.78, 0.71, 0.05, 0.72, 0.34, 0.46, 0.49, 1.16, 1.78, 1.77, 0.26, -0.34, 1.69, 2.0, 0.06, 1.63, 0.07, 0.78, 0.78, 1.31, 6.96, 1.61, 0.71, 1.62]} \ No newline at end of file diff --git a/annotations_filtered/kokQDLJ1104_filtered.json b/annotations_filtered/kokQDLJ1104_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/kokQDLJ1104_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/komxaWgJ8O4_filtered.json b/annotations_filtered/komxaWgJ8O4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec3130ec5a64853e269be89a06db18c89aa6984a --- /dev/null +++ b/annotations_filtered/komxaWgJ8O4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 20.04], [21.0, 21.24], [22.0, 48.93], [50.0, 50.38], [52.0, 53.59], [55.0, 91.99], [94.0, 102.29], [104.0, 126.08], [127.0, 136.44], [138.0, 145.89]], "keep_status": [true, false, false, false, false, false, true, false, true, true], "silence_prob": [43.25, 0.0, 34.43, 0.0, 0.0, 0.0, 31.53, 31.67, 39.34, 37.27], "audiomae_on_audioset": [[["music", 48.7], ["hum", 8.34], ["speech", 6.34]], null, [["music", 48.43], ["didgeridoo", 16.63], ["buzz", 7.92]], null, null, null, [["speech", 20.01], ["fly, housefly", 19.71], ["music", 18.41]], [["speech", 65.14], ["vehicle", 5.45], ["music", 4.51]], [["music", 23.41], ["hum", 17.4], ["electric shaver, electric razor", 8.37]], [["fly, housefly", 20.38], ["buzz", 16.42], ["insect", 12.83]]], "duration": [5.04, 0.24, 26.93, 0.38, 1.59, 36.99, 8.29, 22.08, 9.44, 7.89]} \ No newline at end of file diff --git a/annotations_filtered/kp2UhFQQb_k_filtered.json b/annotations_filtered/kp2UhFQQb_k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7a101faf43d7b9beb5e7cc155e89af89dc95549 --- /dev/null +++ b/annotations_filtered/kp2UhFQQb_k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.66], [12.0, 13.78], [18.0, 19.21], [22.0, 23.45], [25.0, 25.88], [27.0, 27.57]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.66, 1.78, 1.21, 1.45, 0.88, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/kp3HaaTqYP0_filtered.json b/annotations_filtered/kp3HaaTqYP0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bbfd2bc9a7b0873701672c959222523b7f967398 --- /dev/null +++ b/annotations_filtered/kp3HaaTqYP0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.91], [9.0, 14.99], [15.0, 23.41], [28.0, 39.51], [42.0, 63.56], [65.0, 65.5], [69.0, 81.14], [83.0, 83.52], [86.0, 100.45], [106.0, 107.08], [108.0, 110.46], [111.0, 127.7]], "keep_status": [false, false, true, true, false, false, true, false, true, false, false, true], "silence_prob": [0.0, 32.1, 31.97, 31.16, 31.82, 0.0, 33.14, 0.0, 35.26, 0.0, 63.96, 31.13], "audiomae_on_audioset": [null, [["music", 40.25], ["boing", 26.54], ["speech", 16.33]], [["music", 31.1], ["speech", 13.02], ["fly, housefly", 9.21]], [["music", 57.25], ["speech", 3.59], ["musical instrument", 3.37]], [["music", 67.72], ["throbbing", 6.81], ["smash, crash", 5.21]], null, [["music", 21.08], ["speech", 19.63], ["cacophony", 17.12]], null, [["music", 27.66], ["theremin", 11.61], ["hum", 5.2]], null, null, [["music", 55.84], ["didgeridoo", 6.86], ["speech", 3.13]]], "duration": [1.91, 5.99, 8.41, 11.51, 21.56, 0.5, 12.14, 0.52, 14.45, 1.08, 2.46, 16.7]} \ No newline at end of file diff --git a/annotations_filtered/kpFSJhQ_30c_filtered.json b/annotations_filtered/kpFSJhQ_30c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8fdfe69110d837a068441ffcf16421a2af9ec6eb --- /dev/null +++ b/annotations_filtered/kpFSJhQ_30c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.08], [17.0, 22.17], [24.0, 24.49], [27.0, 27.87], [31.0, 31.87], [33.0, 95.32], [95.0, 95.4], [95.0, 96.31], [97.0, 116.09], [126.0, 127.31], [131.0, 131.58], [142.0, 142.69]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [32.84, 31.49, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.46, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 33.9], ["music", 17.61], ["vehicle", 7.63]], [["cattle, bovinae", 44.25], ["livestock, farm animals, working animals", 29.92], ["moo", 22.94]], null, null, null, null, null, null, [["speech", 34.55], ["vehicle", 22.33], ["motorcycle", 6.8]], null, null, null], "duration": [5.08, 5.17, 0.49, 0.87, 0.87, 62.32, 0.4, 1.31, 19.09, 1.31, 0.58, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/kpS1Pghejt8_filtered.json b/annotations_filtered/kpS1Pghejt8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62c8e1fb5d61aea8baa81a80c8700ae5dadcbc89 --- /dev/null +++ b/annotations_filtered/kpS1Pghejt8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[59.0, 58.75]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [-0.25]} \ No newline at end of file diff --git a/annotations_filtered/kpYZ4G1AQ0c_filtered.json b/annotations_filtered/kpYZ4G1AQ0c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7531ddad88061528d66d31e69a7fd91c8be2bd5d --- /dev/null +++ b/annotations_filtered/kpYZ4G1AQ0c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.51], [21.0, 22.6], [24.0, 26.92], [31.0, 37.03], [37.0, 38.15], [39.0, 49.49], [54.0, 54.68], [55.0, 66.99], [68.0, 76.44], [79.0, 80.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 71.43, 57.09, 0.0, 61.67, 0.0, 58.05, 60.32, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.51, 1.6, 2.92, 6.03, 1.15, 10.49, 0.68, 11.99, 8.44, 1.28]} \ No newline at end of file diff --git a/annotations_filtered/kpjWox_c9Ig_filtered.json b/annotations_filtered/kpjWox_c9Ig_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1f13fe20a18d5cab65a1076ab0091c2b6068a32 --- /dev/null +++ b/annotations_filtered/kpjWox_c9Ig_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.95], [19.0, 21.71], [22.0, 24.75], [26.0, 27.46], [29.0, 30.32], [31.0, 32.78], [35.0, 35.5], [36.0, 37.23], [38.0, 39.46], [40.0, 43.95], [44.0, 45.76], [48.0, 48.37], [49.0, 49.79], [51.0, 52.68], [54.0, 54.82], [56.0, 57.0], [58.0, 59.58], [61.0, 61.6], [63.0, 64.0], [65.0, 64.99], [66.0, 67.56], [68.0, 69.62], [71.0, 71.39], [73.0, 73.04], [75.0, 75.2], [75.0, 78.06], [78.0, 79.2], [80.0, 81.13], [82.0, 83.84], [86.0, 87.59], [92.0, 93.5], [96.0, 96.06], [98.0, 99.01], [100.0, 100.84], [101.0, 101.6], [103.0, 112.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 100.0, 98.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.43], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whack, thwack", 26.46], ["music", 25.36], ["speech", 9.65]]], "duration": [1.95, 2.71, 2.75, 1.46, 1.32, 1.78, 0.5, 1.23, 1.46, 3.95, 1.76, 0.37, 0.79, 1.68, 0.82, 1.0, 1.58, 0.6, 1.0, -0.01, 1.56, 1.62, 0.39, 0.04, 0.2, 3.06, 1.2, 1.13, 1.84, 1.59, 1.5, 0.06, 1.01, 0.84, 0.6, 9.21]} \ No newline at end of file diff --git a/annotations_filtered/kptIt3LwGWc_filtered.json b/annotations_filtered/kptIt3LwGWc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa0a939c4c7e9978a46ddfe0eebbd2a2a7cb1d5b --- /dev/null +++ b/annotations_filtered/kptIt3LwGWc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.51], [8.0, 7.82], [9.0, 9.69], [10.0, 15.23], [19.0, 20.38], [21.0, 22.03], [26.0, 26.67], [28.0, 28.81], [30.0, 33.39], [34.0, 36.26], [37.0, 39.43], [41.0, 49.35], [52.0, 62.99], [64.0, 64.99], [69.0, 69.36], [70.0, 72.44], [83.0, 89.55], [94.0, 94.98], [96.0, 96.06], [97.0, 97.09], [101.0, 101.09], [102.0, 116.14], [118.0, 117.64], [118.0, 119.74], [123.0, 127.5], [129.0, 129.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 57.17, 0.0, 0.0, 0.0, 0.0, 58.81, 87.37, 97.73, 74.13, 64.75, 0.0, 0.0, 95.91, 42.79, 0.0, 0.0, 0.0, 0.0, 40.12, 0.0, 0.0, 69.34, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.25], ["theremin", 17.47], ["speech", 15.67]], null, null, null, null, [["music", 30.44], ["speech", 16.83], ["theremin", 8.04]], null, null, null, null], "duration": [0.51, -0.18, 0.69, 5.23, 1.38, 1.03, 0.67, 0.81, 3.39, 2.26, 2.43, 8.35, 10.99, 0.99, 0.36, 2.44, 6.55, 0.98, 0.06, 0.09, 0.09, 14.14, -0.36, 1.74, 4.5, 0.86]} \ No newline at end of file diff --git a/annotations_filtered/kq-GLDVKqMU_filtered.json b/annotations_filtered/kq-GLDVKqMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f5c56c9c49bbe29b2dfc3b26492d3ce8e16979e --- /dev/null +++ b/annotations_filtered/kq-GLDVKqMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.13], [20.0, 20.95], [23.0, 23.79], [28.0, 28.48], [29.0, 29.89], [38.0, 39.58], [42.0, 43.14], [44.0, 61.38], [63.0, 65.91], [68.0, 69.92], [74.0, 78.16], [84.0, 86.76], [88.0, 94.73]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.67, 40.68, 0.0, 31.98, 32.01, 87.74], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["gong", 40.28], ["music", 21.2], ["hum", 15.42]], [["music", 38.14], ["hum", 22.08], ["mains hum", 4.23]], null, [["music", 73.6], ["throbbing", 11.52], ["hum", 3.52]], [["music", 43.51], ["throbbing", 4.3], ["synthesizer", 4.22]], null], "duration": [0.13, 0.95, 0.79, 0.48, 0.89, 1.58, 1.14, 17.38, 2.91, 1.92, 4.16, 2.76, 6.73]} \ No newline at end of file diff --git a/annotations_filtered/kq0YESApfvs_filtered.json b/annotations_filtered/kq0YESApfvs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8b2ac7d80bbe9efc07fbaf10000c0ec9f9bf6c --- /dev/null +++ b/annotations_filtered/kq0YESApfvs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 53.99], [56.0, 64.94], [67.0, 68.5], [74.0, 74.31], [76.0, 77.6]], "keep_status": [false, true, false, false, false], "silence_prob": [0.0, 35.87, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 55.68], ["sidetone", 8.03], ["synthesizer", 5.86]], null, null, null], "duration": [36.99, 8.94, 1.5, 0.31, 1.6]} \ No newline at end of file diff --git a/annotations_filtered/kqBMHRX-c-4_filtered.json b/annotations_filtered/kqBMHRX-c-4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a2ace522b73e148434aff52778646d545e5cc768 --- /dev/null +++ b/annotations_filtered/kqBMHRX-c-4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.28], [9.0, 9.44], [11.0, 11.25], [14.0, 15.9], [18.0, 18.52], [20.0, 20.14], [28.0, 29.73], [35.0, 35.36], [40.0, 40.41], [45.0, 45.2], [50.0, 50.5], [53.0, 53.47], [59.0, 60.3], [61.0, 62.14], [67.0, 67.2], [74.0, 75.02], [78.0, 79.02], [84.0, 85.08], [88.0, 88.26], [92.0, 92.11], [94.0, 94.36], [101.0, 101.85], [103.0, 104.04], [107.0, 107.57], [133.0, 133.42], [136.0, 137.32], [143.0, 143.94], [149.0, 149.3], [151.0, 151.6], [160.0, 160.54], [162.0, 162.51], [165.0, 166.06], [172.0, 173.58], [175.0, 179.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.28, 0.44, 0.25, 1.9, 0.52, 0.14, 1.73, 0.36, 0.41, 0.2, 0.5, 0.47, 1.3, 1.14, 0.2, 1.02, 1.02, 1.08, 0.26, 0.11, 0.36, 0.85, 1.04, 0.57, 0.42, 1.32, 0.94, 0.3, 0.6, 0.54, 0.51, 1.06, 1.58, 4.37]} \ No newline at end of file diff --git a/annotations_filtered/kqFgnN10khg_filtered.json b/annotations_filtered/kqFgnN10khg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..665bb053537e1646bbbdd9b067c06c1d5dc89794 --- /dev/null +++ b/annotations_filtered/kqFgnN10khg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.81], [11.0, 24.63], [26.0, 79.44], [84.0, 84.5], [87.0, 87.52], [88.0, 100.45], [101.0, 102.41], [110.0, 112.77], [114.0, 121.1], [121.0, 121.24], [124.0, 123.92], [125.0, 128.09], [129.0, 160.61], [164.0, 164.84], [168.0, 179.51], [181.0, 183.3], [184.0, 185.26], [186.0, 187.66], [189.0, 189.9], [192.0, 193.5]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [37.51, 31.01, 0.0, 0.0, 0.0, 34.81, 0.0, 45.62, 34.95, 0.0, 0.0, 42.42, 0.0, 0.0, 61.08, 57.48, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["throbbing", 34.31], ["music", 26.49], ["hum", 22.85]], [["music", 53.59], ["hum", 14.66], ["throbbing", 11.3]], null, null, null, [["speech", 26.84], ["music", 15.76], ["thunk", 11.35]], null, [["speech", 27.59], ["music", 18.96], ["hum", 4.95]], [["speech", 54.5], ["single-lens reflex camera", 11.74], ["music", 9.97]], null, null, [["speech", 31.56], ["music", 19.38], ["sheep", 6.21]], null, null, null, null, null, null, null, null], "duration": [4.81, 13.63, 53.44, 0.5, 0.52, 12.45, 1.41, 2.77, 7.1, 0.24, -0.08, 3.09, 31.61, 0.84, 11.51, 2.3, 1.26, 1.66, 0.9, 1.5]} \ No newline at end of file diff --git a/annotations_filtered/kqc4KyCYA0Q_filtered.json b/annotations_filtered/kqc4KyCYA0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..93b500ee628022b4b60ff7d051fd3d692553364d --- /dev/null +++ b/annotations_filtered/kqc4KyCYA0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 45.45], [46.0, 47.34], [48.0, 51.8], [52.0, 54.8], [57.0, 87.02], [90.0, 91.45]], "keep_status": [false, false, true, true, false, false], "silence_prob": [32.4, 0.0, 38.91, 33.17, 0.0, 0.0], "audiomae_on_audioset": [[["music", 60.18], ["mosquito", 9.96], ["fly, housefly", 4.9]], null, [["music", 28.32], ["hum", 15.28], ["speech", 5.03]], [["music", 44.37], ["theremin", 9.22], ["noise", 8.38]], null, null], "duration": [14.45, 1.34, 3.8, 2.8, 30.02, 1.45]} \ No newline at end of file diff --git a/annotations_filtered/kr2k20G3hCc_filtered.json b/annotations_filtered/kr2k20G3hCc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c4a84c59421e6c4fc02fb3f8d0d320b0d330c2f --- /dev/null +++ b/annotations_filtered/kr2k20G3hCc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.49], [2.0, 2.83], [4.0, 4.97], [9.0, 12.02], [13.0, 14.25], [14.0, 15.5], [17.0, 20.83], [22.0, 23.9], [26.0, 26.89], [34.0, 35.31], [41.0, 41.35], [43.0, 43.73], [45.0, 45.42], [51.0, 51.33], [62.0, 62.18], [63.0, 68.74], [69.0, 72.39], [74.0, 74.21], [77.0, 78.58], [79.0, 85.6], [92.0, 93.34], [98.0, 99.49], [104.0, 113.1], [113.0, 115.99], [120.0, 121.24], [122.0, 129.27], [131.0, 133.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 74.44, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.03, 46.54, 0.0, 0.0, 34.42, 0.0, 0.0, 30.2, 32.91, 0.0, 30.83, 68.15], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 26.66], ["speech", 24.71], ["hum", 4.76]], null, null, [["speech", 46.35], ["hum", 15.73], ["music", 7.43]], null, null, [["speech", 43.19], ["music", 11.93], ["fart", 4.85]], [["speech", 20.05], ["music", 13.17], ["cattle, bovinae", 11.78]], null, [["music", 15.83], ["rumble", 12.41], ["siren", 5.68]], null], "duration": [0.49, 0.83, 0.97, 3.02, 1.25, 1.5, 3.83, 1.9, 0.89, 1.31, 0.35, 0.73, 0.42, 0.33, 0.18, 5.74, 3.39, 0.21, 1.58, 6.6, 1.34, 1.49, 9.1, 2.99, 1.24, 7.27, 2.89]} \ No newline at end of file diff --git a/annotations_filtered/kr5skPIftSY_filtered.json b/annotations_filtered/kr5skPIftSY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d28e6c45564670efcfc164b0ad2d771927495c11 --- /dev/null +++ b/annotations_filtered/kr5skPIftSY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 55.98], [58.0, 63.04], [64.0, 73.68], [75.0, 75.78], [77.0, 77.63], [79.0, 79.0], [81.0, 85.36]], "keep_status": [false, true, true, false, false, false, true], "silence_prob": [0.0, 30.06, 30.6, 0.0, 0.0, 0.0, 36.02], "audiomae_on_audioset": [null, [["speech", 19.71], ["music", 11.49], ["cattle, bovinae", 11.31]], [["whale vocalization", 20.11], ["hum", 11.83], ["noise", 8.93]], null, null, null, [["music", 34.0], ["whale vocalization", 17.92], ["hum", 13.08]]], "duration": [46.98, 5.04, 9.68, 0.78, 0.63, 0.0, 4.36]} \ No newline at end of file diff --git a/annotations_filtered/krBjSShSxu0_filtered.json b/annotations_filtered/krBjSShSxu0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..649e742b440c8eec1bbbc2fb8a1eb9e07ab326ab --- /dev/null +++ b/annotations_filtered/krBjSShSxu0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.83], [14.0, 19.5], [20.0, 21.22], [24.0, 28.93], [35.0, 37.66], [51.0, 53.42], [54.0, 72.42], [74.0, 75.9], [77.0, 77.95], [79.0, 85.45], [87.0, 88.33], [96.0, 96.63], [103.0, 103.84], [104.0, 104.4], [105.0, 105.97], [108.0, 108.57], [112.0, 114.67], [116.0, 117.68], [119.0, 125.46], [126.0, 133.14], [136.0, 140.73], [145.0, 148.59], [150.0, 149.89], [152.0, 152.12], [154.0, 154.36], [156.0, 156.03], [159.0, 160.84]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 28.7, 0.0, 30.85, 39.31, 28.83, 30.61, 0.0, 0.0, 40.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.87, 0.0, 33.4, 29.57, 28.92, 29.18, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 26.48], ["race car, auto racing", 12.67], ["car", 7.7]], null, [["speech", 38.16], ["music", 24.03], ["throbbing", 19.48]], [["music", 77.59], ["throbbing", 7.27], ["hum", 2.59]], [["music", 70.44], ["throbbing", 10.49], ["hum", 3.48]], [["music", 43.51], ["speech", 18.17], ["throbbing", 9.33]], null, null, [["music", 40.37], ["throbbing", 32.29], ["hum", 8.48]], null, null, null, null, null, null, null, null, [["music", 46.64], ["throbbing", 14.14], ["hum", 11.27]], [["music", 54.25], ["speech", 10.95], ["cacophony", 3.89]], [["music", 43.67], ["speech", 25.94], ["hum", 8.52]], [["hum", 25.22], ["music", 20.74], ["throbbing", 9.77]], null, null, null, null, null], "duration": [-0.17, 5.5, 1.22, 4.93, 2.66, 2.42, 18.42, 1.9, 0.95, 6.45, 1.33, 0.63, 0.84, 0.4, 0.97, 0.57, 2.67, 1.68, 6.46, 7.14, 4.73, 3.59, -0.11, 0.12, 0.36, 0.03, 1.84]} \ No newline at end of file diff --git a/annotations_filtered/kr_z37TgQO4_filtered.json b/annotations_filtered/kr_z37TgQO4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bfb50d524829496f19ed1a42677349e8670cf10 --- /dev/null +++ b/annotations_filtered/kr_z37TgQO4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.83], [8.0, 9.14], [10.0, 10.66], [11.0, 12.01], [13.0, 13.8], [14.0, 15.8], [16.0, 17.24], [18.0, 18.79]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.83, 1.14, 0.66, 1.01, 0.8, 1.8, 1.24, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/krqNvqvhvp0_filtered.json b/annotations_filtered/krqNvqvhvp0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/krqNvqvhvp0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/kswPGoPPdwE_filtered.json b/annotations_filtered/kswPGoPPdwE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4df6baa2d2db30ce9a73cdc8f138801c2cc3bbaf --- /dev/null +++ b/annotations_filtered/kswPGoPPdwE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.92], [6.0, 8.5], [9.0, 14.82], [16.0, 17.09], [18.0, 19.2], [20.0, 20.63], [23.0, 23.4], [25.0, 25.83], [31.0, 35.11], [37.0, 37.29], [39.0, 40.1], [41.0, 42.33], [44.0, 44.42], [48.0, 48.61], [52.0, 52.34], [59.0, 67.47], [70.0, 70.92], [73.0, 83.15], [88.0, 91.22], [92.0, 93.58], [95.0, 96.21], [97.0, 97.85], [99.0, 100.06], [101.0, 101.71], [103.0, 103.03], [104.0, 106.57], [108.0, 110.17], [112.0, 112.85], [114.0, 114.89], [119.0, 124.36], [127.0, 129.49], [130.0, 131.06], [131.0, 132.33], [137.0, 137.08]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 54.3, 62.47, 0.0, 0.0, 0.0, 0.0, 0.0, 48.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.53, 0.0, 54.23, 78.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.61, 85.17, 0.0, 0.0, 50.76, 89.19, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 46.44], ["sidetone", 11.71], ["bee, wasp, etc.", 5.12]], null, null, null, null, null, null, [["mains hum", 48.07], ["hum", 42.88], ["speech", 3.77]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.92, 2.5, 5.82, 1.09, 1.2, 0.63, 0.4, 0.83, 4.11, 0.29, 1.1, 1.33, 0.42, 0.61, 0.34, 8.47, 0.92, 10.15, 3.22, 1.58, 1.21, 0.85, 1.06, 0.71, 0.03, 2.57, 2.17, 0.85, 0.89, 5.36, 2.49, 1.06, 1.33, 0.08]} \ No newline at end of file diff --git a/annotations_filtered/kt1aHAlXi4g_filtered.json b/annotations_filtered/kt1aHAlXi4g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aeb139386f3ba738b30a743a901886694ab5ebc1 --- /dev/null +++ b/annotations_filtered/kt1aHAlXi4g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.08], [3.0, 3.27], [3.0, 12.26], [19.0, 30.33], [34.0, 35.04], [39.0, 53.38], [56.0, 56.29], [57.0, 57.79], [63.0, 67.22], [73.0, 77.97], [79.0, 79.15], [80.0, 86.53], [88.0, 89.99], [92.0, 98.15]], "keep_status": [false, false, true, true, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 35.65, 33.12, 0.0, 31.11, 0.0, 0.0, 36.66, 39.57, 0.0, 45.02, 0.0, 50.81], "audiomae_on_audioset": [null, null, [["hum", 26.37], ["whale vocalization", 15.65], ["music", 10.85]], [["music", 46.43], ["sidetone", 9.2], ["throbbing", 8.35]], null, [["cattle, bovinae", 49.94], ["moo", 26.0], ["livestock, farm animals, working animals", 19.67]], null, null, [["music", 31.23], ["speech", 28.74], ["hum", 4.2]], [["music", 40.02], ["speech", 23.75], ["hum", 6.4]], null, [["fly, housefly", 15.35], ["music", 14.95], ["bee, wasp, etc.", 13.07]], null, null], "duration": [1.08, 0.27, 9.26, 11.33, 1.04, 14.38, 0.29, 0.79, 4.22, 4.97, 0.15, 6.53, 1.99, 6.15]} \ No newline at end of file diff --git a/annotations_filtered/ktCIr_DMGOI_filtered.json b/annotations_filtered/ktCIr_DMGOI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa51a9f89a51a5c324322b16bb23af96b2b2b339 --- /dev/null +++ b/annotations_filtered/ktCIr_DMGOI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 33.39], [51.0, 51.53], [78.0, 78.8], [80.0, 86.85], [89.0, 90.69], [92.0, 103.57], [104.0, 103.71], [104.0, 104.95], [112.0, 113.49], [124.0, 125.17], [127.0, 127.21], [129.0, 129.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.22, 0.0, 30.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 49.89], ["applause", 20.43], ["music", 6.52]], null, [["explosion", 39.29], ["speech", 29.7], ["burst, pop", 10.21]], null, null, null, null, null, null], "duration": [0.39, 0.53, 0.8, 6.85, 1.69, 11.57, -0.29, 0.95, 1.49, 1.17, 0.21, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/ktEW65QQFgQ_filtered.json b/annotations_filtered/ktEW65QQFgQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65e2f1ced66b727a3b0ad316d9d169ecaca1786a --- /dev/null +++ b/annotations_filtered/ktEW65QQFgQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.44], [11.0, 11.75], [15.0, 49.49], [50.0, 49.54], [50.0, 78.75]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 43.96], "audiomae_on_audioset": [null, null, null, null, [["music", 75.5], ["didgeridoo", 5.07], ["synthesizer", 5.02]]], "duration": [1.44, 0.75, 34.49, -0.46, 28.75]} \ No newline at end of file diff --git a/annotations_filtered/ktFZq_8XXOg_filtered.json b/annotations_filtered/ktFZq_8XXOg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5841d01bd847395e3a4904dee121430bb4bd0812 --- /dev/null +++ b/annotations_filtered/ktFZq_8XXOg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.5], [16.0, 17.34], [21.0, 22.13]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.5, 1.34, 1.13]} \ No newline at end of file diff --git a/annotations_filtered/ktGwZKWClZg_filtered.json b/annotations_filtered/ktGwZKWClZg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b05b7404d9032d64510cb05dbb279f9070c1edc1 --- /dev/null +++ b/annotations_filtered/ktGwZKWClZg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.81], [27.0, 32.56], [34.0, 43.68], [48.0, 50.36], [57.0, 64.4], [69.0, 70.43]], "keep_status": [false, false, true, false, true, false], "silence_prob": [0.0, 42.28, 42.42, 52.74, 40.36, 0.0], "audiomae_on_audioset": [null, [["music", 68.6], ["synthesizer", 4.93], ["musical instrument", 2.98]], [["music", 37.38], ["hum", 13.21], ["mains hum", 8.44]], null, [["music", 33.94], ["hum", 21.04], ["mains hum", 12.3]], null], "duration": [0.81, 5.56, 9.68, 2.36, 7.4, 1.43]} \ No newline at end of file diff --git a/annotations_filtered/ktXm7CRXbsE_filtered.json b/annotations_filtered/ktXm7CRXbsE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3df9a7ad4603c2e136e32b148f258fbafdac240 --- /dev/null +++ b/annotations_filtered/ktXm7CRXbsE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.62], [7.0, 7.53], [10.0, 10.49], [11.0, 11.6], [16.0, 17.42], [18.0, 18.87], [20.0, 21.2], [23.0, 23.55], [26.0, 26.23], [33.0, 33.34], [35.0, 35.67], [49.0, 49.96], [53.0, 53.55], [57.0, 57.01], [59.0, 59.51], [63.0, 63.1], [66.0, 66.12], [70.0, 70.09], [76.0, 76.65], [80.0, 80.27], [81.0, 82.24], [84.0, 84.33], [99.0, 101.61], [106.0, 106.0], [110.0, 109.97], [114.0, 132.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.27, 0.0, 0.0, 87.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 0.53, 0.49, 0.6, 1.42, 0.87, 1.2, 0.55, 0.23, 0.34, 0.67, 0.96, 0.55, 0.01, 0.51, 0.1, 0.12, 0.09, 0.65, 0.27, 1.24, 0.33, 2.61, 0.0, -0.03, 18.83]} \ No newline at end of file diff --git a/annotations_filtered/kthFUFBwbZg_filtered.json b/annotations_filtered/kthFUFBwbZg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bb049500195ff1ce8879422bf339d6a68a28825 --- /dev/null +++ b/annotations_filtered/kthFUFBwbZg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.33], [12.0, 15.94], [19.0, 23.18], [25.0, 30.03], [31.0, 31.36], [33.0, 32.93], [35.0, 35.56], [37.0, 37.17], [39.0, 41.82], [47.0, 48.81], [52.0, 53.03], [57.0, 58.97], [60.0, 59.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 73.36, 99.68, 93.13, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.33, 3.94, 4.18, 5.03, 0.36, -0.07, 0.56, 0.17, 2.82, 1.81, 1.03, 1.97, -0.46]} \ No newline at end of file diff --git a/annotations_filtered/ktrGDczwkec_filtered.json b/annotations_filtered/ktrGDczwkec_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba2cdb6bd39e3258b9a0234e2b89630d73b039b0 --- /dev/null +++ b/annotations_filtered/ktrGDczwkec_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 12.06], [13.0, 14.17], [15.0, 15.87], [20.0, 21.47], [23.0, 24.92], [27.0, 27.62], [49.0, 51.75], [53.0, 53.2], [54.0, 55.49], [56.0, 57.84], [68.0, 68.0], [73.0, 74.44], [82.0, 82.46], [85.0, 88.86]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [47.78, 0.0, 0.0, 0.0, 0.0, 0.0, 64.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.26], "audiomae_on_audioset": [[["music", 57.79], ["speech", 6.23], ["fart", 3.23]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.54], ["thunk", 27.55], ["crushing", 4.83]]], "duration": [6.06, 1.17, 0.87, 1.47, 1.92, 0.62, 2.75, 0.2, 1.49, 1.84, 0.0, 1.44, 0.46, 3.86]} \ No newline at end of file diff --git a/annotations_filtered/ktrHO9uETjk_filtered.json b/annotations_filtered/ktrHO9uETjk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..355f6cedd5ef8626b344b1010a56b3ff936536c9 --- /dev/null +++ b/annotations_filtered/ktrHO9uETjk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.95], [9.0, 9.49], [13.0, 13.51], [16.0, 17.64], [20.0, 20.02], [21.0, 21.86], [28.0, 29.02], [30.0, 30.72], [32.0, 32.8], [34.0, 34.08], [45.0, 45.86], [46.0, 46.85], [48.0, 50.43], [51.0, 52.12], [56.0, 57.48], [60.0, 66.07], [67.0, 68.07], [70.0, 69.84], [72.0, 73.63], [83.0, 89.23], [92.0, 97.39], [100.0, 101.66], [106.0, 106.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 99.56, 99.95, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.05, 0.49, 0.51, 1.64, 0.02, 0.86, 1.02, 0.72, 0.8, 0.08, 0.86, 0.85, 2.43, 1.12, 1.48, 6.07, 1.07, -0.16, 1.63, 6.23, 5.39, 1.66, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/ktt64clTkj4_filtered.json b/annotations_filtered/ktt64clTkj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32aa6a13da30c85a0ac088ee74db1e5e9ec57262 --- /dev/null +++ b/annotations_filtered/ktt64clTkj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.69], [6.0, 6.49], [8.0, 9.56], [15.0, 15.31], [20.0, 21.71], [24.0, 24.38], [25.0, 25.89], [26.0, 27.35], [29.0, 29.61], [31.0, 32.97], [35.0, 35.83], [41.0, 41.22], [66.0, 65.96], [71.0, 70.88], [72.0, 73.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.69, 0.49, 1.56, 0.31, 1.71, 0.38, 0.89, 1.35, 0.61, 1.97, 0.83, 0.22, -0.04, -0.12, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/kuQQoH9skXc_filtered.json b/annotations_filtered/kuQQoH9skXc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36f239efa0094b68773bc05d0a33cca601516697 --- /dev/null +++ b/annotations_filtered/kuQQoH9skXc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.07], [12.0, 12.01], [41.0, 41.71], [62.0, 74.44], [79.0, 79.0]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 32.76, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 19.08], ["hum", 15.68], ["whack, thwack", 7.76]], null], "duration": [1.07, 0.01, 0.71, 12.44, 0.0]} \ No newline at end of file diff --git a/annotations_filtered/kuVLtcqiPrY_filtered.json b/annotations_filtered/kuVLtcqiPrY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b906146d20a0acd2674446783f8de79f2b5ec23 --- /dev/null +++ b/annotations_filtered/kuVLtcqiPrY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.39], [14.0, 15.65], [16.0, 16.33], [18.0, 18.15], [25.0, 25.95], [26.0, 28.48], [30.0, 31.43], [33.0, 33.4], [34.0, 35.55], [37.0, 37.4], [38.0, 39.26], [40.0, 46.26], [47.0, 50.03], [51.0, 52.79], [54.0, 60.1], [62.0, 62.18], [63.0, 78.09], [81.0, 82.39], [85.0, 85.31], [87.0, 91.34], [93.0, 93.65], [96.0, 96.8], [100.0, 101.66], [102.0, 103.4], [104.0, 104.7], [106.0, 113.43], [114.0, 115.72], [116.0, 121.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0, 84.43, 67.76, 0.0, 90.08, 0.0, 52.56, 0.0, 0.0, 99.82, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 69.2], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.39, 1.65, 0.33, 0.15, 0.95, 2.48, 1.43, 0.4, 1.55, 0.4, 1.26, 6.26, 3.03, 1.79, 6.1, 0.18, 15.09, 1.39, 0.31, 4.34, 0.65, 0.8, 1.66, 1.4, 0.7, 7.43, 1.72, 5.85]} \ No newline at end of file diff --git a/annotations_filtered/kuXEfuC92Ag_filtered.json b/annotations_filtered/kuXEfuC92Ag_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbf353388d8a3612ed2d92d1ec27b541d2c5c8ea --- /dev/null +++ b/annotations_filtered/kuXEfuC92Ag_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 20.36], [22.0, 29.29], [31.0, 34.69], [35.0, 49.94], [51.0, 51.58], [54.0, 61.87], [63.0, 76.11], [78.0, 81.38], [84.0, 89.07], [93.0, 100.87], [103.0, 107.79], [109.0, 111.32], [113.0, 115.11], [117.0, 120.28], [122.0, 124.63], [125.0, 132.16]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [68.8, 81.89, 63.31, 95.78, 0.0, 47.9, 35.74, 52.92, 89.9, 97.43, 99.52, 99.85, 97.92, 98.19, 64.41, 48.31], "audiomae_on_audioset": [null, null, null, null, null, [["noise", 55.26], ["hum", 8.19], ["burping, eructation", 4.71]], [["animal", 28.46], ["hum", 21.33], ["mains hum", 11.84]], null, null, null, null, null, null, null, null, [["speech", 75.53], ["burping, eructation", 11.72], ["hum", 3.28]]], "duration": [2.36, 7.29, 3.69, 14.94, 0.58, 7.87, 13.11, 3.38, 5.07, 7.87, 4.79, 2.32, 2.11, 3.28, 2.63, 7.16]} \ No newline at end of file diff --git a/annotations_filtered/kui9LWtON_k_filtered.json b/annotations_filtered/kui9LWtON_k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb71ae9fde7976e094a3e041b0162782c2d2472c --- /dev/null +++ b/annotations_filtered/kui9LWtON_k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.88], [6.0, 6.3], [7.0, 11.96], [12.0, 13.24], [14.0, 14.4], [15.0, 15.67], [18.0, 18.17], [19.0, 18.98], [19.0, 19.99], [23.0, 23.48], [26.0, 26.79], [31.0, 31.67], [35.0, 37.42], [38.0, 41.3], [44.0, 44.76], [50.0, 50.5], [56.0, 56.39], [57.0, 57.45], [65.0, 65.28], [68.0, 67.64], [81.0, 81.24], [90.0, 92.26], [97.0, 105.81], [118.0, 119.38], [122.0, 122.81], [132.0, 135.57], [141.0, 141.0], [144.0, 144.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 55.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.2, 49.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.3, 69.47, 0.0, 0.0, 87.74, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.72], ["speech", 24.95], ["didgeridoo", 6.01]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.88, 0.3, 4.96, 1.24, 0.4, 0.67, 0.17, -0.02, 0.99, 0.48, 0.79, 0.67, 2.42, 3.3, 0.76, 0.5, 0.39, 0.45, 0.28, -0.36, 0.24, 2.26, 8.81, 1.38, 0.81, 3.57, 0.0, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/kv-hhf-kPkw_filtered.json b/annotations_filtered/kv-hhf-kPkw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e905753656de65f0b4fb2d341928942d2ce34f02 --- /dev/null +++ b/annotations_filtered/kv-hhf-kPkw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.14], [18.0, 19.25], [22.0, 23.94], [27.0, 27.06], [29.0, 30.35], [40.0, 44.86], [50.0, 50.08], [56.0, 57.28], [58.0, 59.93], [64.0, 64.02], [71.0, 75.9], [79.0, 81.13], [90.0, 97.53], [98.0, 103.6], [105.0, 105.68], [108.0, 108.55], [110.0, 113.27], [116.0, 120.41], [121.0, 122.39], [125.0, 133.96], [135.0, 136.59], [137.0, 137.49], [141.0, 143.23], [144.0, 145.25], [146.0, 153.77], [155.0, 156.1], [157.0, 157.69], [159.0, 161.91]], "keep_status": [true, false, false, false, false, true, false, false, false, false, true, false, true, false, false, false, true, true, false, false, false, false, true, false, true, false, false, true], "silence_prob": [32.6, 0.0, 0.0, 0.0, 0.0, 30.49, 0.0, 0.0, 0.0, 0.0, 29.95, 29.74, 29.36, 29.47, 0.0, 0.0, 29.11, 28.95, 0.0, 31.01, 0.0, 0.0, 41.81, 0.0, 35.73, 0.0, 0.0, 34.97], "audiomae_on_audioset": [[["music", 43.76], ["musical instrument", 4.15], ["speech", 3.57]], null, null, null, null, [["music", 36.57], ["speech", 14.84], ["explosion", 7.8]], null, null, null, null, [["frog", 31.6], ["fly, housefly", 16.59], ["mosquito", 15.0]], [["speech", 67.41], ["music", 6.91], ["groan", 2.77]], [["buzz", 23.22], ["speech", 19.46], ["music", 6.82]], [["speech", 37.63], ["music", 27.16], ["sidetone", 14.31]], null, null, [["music", 39.04], ["boing", 8.27], ["sound effect", 7.45]], [["music", 44.12], ["carnatic music", 8.73], ["speech", 4.93]], null, [["speech", 68.07], ["boing", 7.82], ["music", 7.44]], null, null, [["music", 34.28], ["didgeridoo", 11.77], ["hum", 6.64]], null, [["speech", 43.11], ["hum", 14.39], ["music", 7.97]], null, null, [["music", 28.93], ["didgeridoo", 11.33], ["insect", 6.07]]], "duration": [2.14, 1.25, 1.94, 0.06, 1.35, 4.86, 0.08, 1.28, 1.93, 0.02, 4.9, 2.13, 7.53, 5.6, 0.68, 0.55, 3.27, 4.41, 1.39, 8.96, 1.59, 0.49, 2.23, 1.25, 7.77, 1.1, 0.69, 2.91]} \ No newline at end of file diff --git a/annotations_filtered/kvAByCIqoOM_filtered.json b/annotations_filtered/kvAByCIqoOM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/kvAByCIqoOM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/kvHcswMy05A_filtered.json b/annotations_filtered/kvHcswMy05A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc13d9a269d8f6fc01160a8724cf3c96bf6250da --- /dev/null +++ b/annotations_filtered/kvHcswMy05A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 12.75], [14.0, 18.79], [21.0, 22.52], [26.0, 29.44], [30.0, 35.38], [36.0, 38.43], [39.0, 53.28], [55.0, 63.93], [64.0, 67.17], [69.0, 78.36], [79.0, 81.65], [83.0, 85.28], [87.0, 89.16], [93.0, 98.63], [100.0, 108.57], [109.0, 117.29], [118.0, 121.69]], "keep_status": [false, true, false, false, false, true, true, false, true, false, true, false, true, false, false, false, true], "silence_prob": [49.45, 47.2, 0.0, 48.87, 36.99, 44.78, 40.38, 42.67, 37.59, 40.21, 47.27, 51.23, 42.86, 43.82, 43.38, 43.53, 47.82], "audiomae_on_audioset": [[["music", 51.19], ["hum", 14.02], ["mains hum", 5.25]], [["hum", 35.17], ["mains hum", 19.11], ["speech", 13.02]], null, [["speech", 33.18], ["music", 33.07], ["hum", 4.5]], [["hum", 35.33], ["mains hum", 25.15], ["speech", 15.67]], [["music", 35.87], ["ambient music", 9.82], ["electronic music", 7.02]], [["speech", 41.83], ["music", 19.38], ["hum", 7.21]], [["music", 40.52], ["speech", 20.38], ["hum", 10.69]], [["music", 27.59], ["speech", 25.73], ["whale vocalization", 14.3]], [["music", 32.09], ["speech", 26.59], ["hum", 17.37]], [["hum", 31.3], ["mains hum", 21.46], ["music", 12.7]], null, [["music", 51.01], ["ambient music", 9.49], ["hum", 7.36]], [["music", 57.54], ["hum", 10.84], ["ambient music", 6.29]], [["speech", 37.66], ["music", 27.82], ["hum", 14.66]], [["hum", 46.08], ["mains hum", 43.65], ["speech", 3.82]], [["hum", 20.9], ["didgeridoo", 19.95], ["mains hum", 14.05]]], "duration": [7.75, 4.79, 1.52, 3.44, 5.38, 2.43, 14.28, 8.93, 3.17, 9.36, 2.65, 2.28, 2.16, 5.63, 8.57, 8.29, 3.69]} \ No newline at end of file diff --git a/annotations_filtered/kvVlP50LSq8_filtered.json b/annotations_filtered/kvVlP50LSq8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/kvVlP50LSq8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/kvbYXGOZHnQ_filtered.json b/annotations_filtered/kvbYXGOZHnQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c448c721f8f0461265980833b90e0c7b6d1cbb8e --- /dev/null +++ b/annotations_filtered/kvbYXGOZHnQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.17], [8.0, 8.45], [9.0, 9.49], [12.0, 14.0], [16.0, 17.9], [21.0, 22.79], [28.0, 33.72], [34.0, 34.99], [36.0, 38.08], [39.0, 41.25], [47.0, 49.47], [52.0, 53.52], [54.0, 55.27], [58.0, 58.21], [72.0, 76.35], [78.0, 80.3]], "keep_status": [true, false, false, false, false, false, true, false, true, true, true, false, false, false, true, true], "silence_prob": [41.48, 0.0, 0.0, 50.66, 0.0, 0.0, 43.43, 0.0, 30.72, 34.16, 36.69, 0.0, 0.0, 0.0, 43.96, 45.69], "audiomae_on_audioset": [[["hum", 11.9], ["throbbing", 7.63], ["music", 6.86]], null, null, null, null, null, [["noise", 29.07], ["hum", 15.95], ["mains hum", 11.34]], null, [["buzzer", 24.4], ["music", 15.32], ["hum", 9.6]], [["hum", 28.55], ["throbbing", 22.98], ["music", 9.81]], [["speech", 50.61], ["music", 11.57], ["hum", 3.92]], null, null, null, [["speech", 39.94], ["noise", 19.91], ["hum", 5.86]], [["radio", 12.34], ["raindrop", 7.75], ["speech", 7.43]]], "duration": [4.17, 0.45, 0.49, 2.0, 1.9, 1.79, 5.72, 0.99, 2.08, 2.25, 2.47, 1.52, 1.27, 0.21, 4.35, 2.3]} \ No newline at end of file diff --git a/annotations_filtered/kvtsZ1Edkk4_filtered.json b/annotations_filtered/kvtsZ1Edkk4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cee472719f1467e678b62fb3b6f8196b74a58a77 --- /dev/null +++ b/annotations_filtered/kvtsZ1Edkk4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.6], [10.0, 10.08], [15.0, 15.72], [19.0, 19.06], [21.0, 21.36], [35.0, 35.02], [42.0, 42.36], [58.0, 57.96], [60.0, 61.21], [69.0, 70.28], [91.0, 94.22], [97.0, 98.34], [101.0, 101.38], [105.0, 106.15], [110.0, 110.81], [113.0, 114.08], [117.0, 118.56], [122.0, 122.59], [126.0, 128.12], [128.0, 128.19], [128.0, 128.22], [128.0, 128.26], [128.0, 128.29], [128.0, 128.33], [128.0, 128.36], [130.0, 130.72], [148.0, 160.22], [168.0, 168.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.02, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 63.87], ["musical instrument", 10.09], ["guitar", 9.6]], null, null, null, null, null, null, null, [["music", 76.08], ["musical instrument", 2.41], ["guitar", 2.3]], null, null, null, null, null, null, null, [["music", 80.52], ["musical instrument", 4.51], ["guitar", 2.56]], null], "duration": [0.6, 0.08, 0.72, 0.06, 0.36, 0.02, 0.36, -0.04, 1.21, 1.28, 3.22, 1.34, 0.38, 1.15, 0.81, 1.08, 1.56, 0.59, 2.12, 0.19, 0.22, 0.26, 0.29, 0.33, 0.36, 0.72, 12.22, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/kvzIRuIg288_filtered.json b/annotations_filtered/kvzIRuIg288_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1eb52bc7042d9b74e218c7a863ce2a17d3a2a39e --- /dev/null +++ b/annotations_filtered/kvzIRuIg288_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.42], [14.0, 17.31], [18.0, 18.72], [21.0, 21.14], [22.0, 22.11], [24.0, 27.33], [28.0, 30.21], [32.0, 32.21], [33.0, 34.35], [38.0, 41.76], [48.0, 51.7], [53.0, 53.2], [56.0, 56.62], [58.0, 59.24], [61.0, 62.34], [66.0, 71.9], [73.0, 73.82], [79.0, 79.59], [82.0, 82.46], [83.0, 84.37], [86.0, 87.27], [89.0, 89.83], [92.0, 92.11], [96.0, 96.2], [102.0, 102.09], [104.0, 108.24], [109.0, 110.32], [112.0, 112.82], [115.0, 115.38], [116.0, 121.17], [123.0, 123.72], [125.0, 131.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [80.29, 98.36, 0.0, 0.0, 0.0, 99.99, 77.7, 0.0, 0.0, 100.0, 90.43, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.42, 3.31, 0.72, 0.14, 0.11, 3.33, 2.21, 0.21, 1.35, 3.76, 3.7, 0.2, 0.62, 1.24, 1.34, 5.9, 0.82, 0.59, 0.46, 1.37, 1.27, 0.83, 0.11, 0.2, 0.09, 4.24, 1.32, 0.82, 0.38, 5.17, 0.72, 6.08]} \ No newline at end of file diff --git a/annotations_filtered/kvzzBebEAHQ_filtered.json b/annotations_filtered/kvzzBebEAHQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..919de983e9ee276fbbee646decd75bcf3bfc684e --- /dev/null +++ b/annotations_filtered/kvzzBebEAHQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 63.59], [64.0, 91.47], [94.0, 96.48], [96.0, 96.53]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 31.81, 34.12, 0.0], "audiomae_on_audioset": [null, [["music", 37.13], ["hum", 7.74], ["throbbing", 5.76]], [["throbbing", 41.19], ["hum", 25.07], ["music", 15.93]], null], "duration": [35.59, 27.47, 2.48, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/kwdRauyX_Sc_filtered.json b/annotations_filtered/kwdRauyX_Sc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..69b616e25e54080fffc053864a20413867328071 --- /dev/null +++ b/annotations_filtered/kwdRauyX_Sc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.09], [19.0, 19.41], [26.0, 26.33], [30.0, 31.09], [39.0, 39.78], [41.0, 41.01], [43.0, 43.43]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [1.09, 0.41, 0.33, 1.09, 0.78, 0.01, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/kwvSRZG285g_filtered.json b/annotations_filtered/kwvSRZG285g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e60cf8f982c0eb1cbab22e4fc004d2ce2a2e373 --- /dev/null +++ b/annotations_filtered/kwvSRZG285g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.74], [8.0, 8.24], [12.0, 13.69], [20.0, 21.83], [25.0, 25.44], [27.0, 28.92], [34.0, 36.12], [38.0, 40.93], [45.0, 45.2], [46.0, 46.43], [49.0, 52.0], [56.0, 56.35], [59.0, 60.17], [66.0, 66.85], [69.0, 70.58], [76.0, 76.01], [81.0, 82.02], [83.0, 84.92], [89.0, 96.09], [102.0, 104.43], [105.0, 105.92], [112.0, 115.94], [121.0, 121.49], [124.0, 129.29], [133.0, 132.95], [139.0, 139.92], [147.0, 148.15], [157.0, 158.04], [158.0, 159.21], [164.0, 165.3], [166.0, 166.7], [168.0, 170.63], [173.0, 175.54], [179.0, 181.97], [184.0, 186.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.64, 0.0, 0.0, 0.0, 0.0, 0.0, 99.16, 100.0, 0.0, 0.0, 87.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.83, 99.31, 0.0, 100.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.74, 98.01, 100.0, 92.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.74, 0.24, 1.69, 1.83, 0.44, 1.92, 2.12, 2.93, 0.2, 0.43, 3.0, 0.35, 1.17, 0.85, 1.58, 0.01, 1.02, 1.92, 7.09, 2.43, 0.92, 3.94, 0.49, 5.29, -0.05, 0.92, 1.15, 1.04, 1.21, 1.3, 0.7, 2.63, 2.54, 2.97, 2.17]} \ No newline at end of file diff --git a/annotations_filtered/kx2FhY_akDY_filtered.json b/annotations_filtered/kx2FhY_akDY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99d70f9d169a123a6decb334b6197ab6ecbdde30 --- /dev/null +++ b/annotations_filtered/kx2FhY_akDY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.22], [7.0, 7.05], [12.0, 12.63], [13.0, 14.34], [15.0, 25.1], [27.0, 33.35], [35.0, 40.54], [42.0, 47.01], [50.0, 52.95]], "keep_status": [false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.47, 34.47, 32.96, 31.02, 31.83], "audiomae_on_audioset": [null, null, null, null, [["music", 74.15], ["theremin", 2.99], ["didgeridoo", 2.79]], [["music", 77.77], ["crowd", 3.41], ["musical instrument", 2.49]], [["music", 61.9], ["musical instrument", 4.63], ["crowd", 2.03]], [["music", 75.24], ["theremin", 4.11], ["musical instrument", 2.29]], [["music", 63.82], ["speech", 5.64], ["electronic music", 2.59]]], "duration": [1.22, 0.05, 0.63, 1.34, 10.1, 6.35, 5.54, 5.01, 2.95]} \ No newline at end of file diff --git a/annotations_filtered/kxBu82Dte10_filtered.json b/annotations_filtered/kxBu82Dte10_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5da43d4358e5a7aa0fc474c39446db38be303c9a --- /dev/null +++ b/annotations_filtered/kxBu82Dte10_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.14], [8.0, 10.44], [11.0, 15.74], [29.0, 29.25], [41.0, 43.8], [45.0, 45.66], [48.0, 49.23], [49.0, 49.4], [50.0, 49.86]], "keep_status": [false, true, true, false, true, false, false, false, false], "silence_prob": [0.0, 30.69, 31.39, 0.0, 38.56, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 48.56], ["musical instrument", 5.76], ["double bass", 4.48]], [["music", 35.62], ["guitar", 18.55], ["plucked string instrument", 10.32]], null, [["speech", 36.3], ["fly, housefly", 14.97], ["insect", 9.7]], null, null, null, null], "duration": [1.14, 2.44, 4.74, 0.25, 2.8, 0.66, 1.23, 0.4, -0.14]} \ No newline at end of file diff --git a/annotations_filtered/kxjwb5cXTI0_filtered.json b/annotations_filtered/kxjwb5cXTI0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2c7d270b9da426e61789abfa2c24bfa73dcee66 --- /dev/null +++ b/annotations_filtered/kxjwb5cXTI0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.78], [15.0, 15.53], [20.0, 20.49], [23.0, 24.0], [24.0, 30.55], [39.0, 39.78], [40.0, 40.68], [43.0, 45.59], [54.0, 54.46], [61.0, 60.72], [68.0, 68.84], [70.0, 70.55], [74.0, 88.1], [92.0, 94.02], [99.0, 99.28], [105.0, 105.14], [109.0, 109.85], [110.0, 110.69], [116.0, 116.85]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [38.41, 0.0, 0.0, 0.0, 39.63, 0.0, 0.0, 44.63, 0.0, 0.0, 0.0, 0.0, 39.4, 41.7, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 55.24], ["wind instrument, woodwind instrument", 7.06], ["theremin", 5.27]], null, null, null, [["music", 56.34], ["brass instrument", 7.93], ["wind instrument, woodwind instrument", 4.66]], null, null, [["music", 61.39], ["throbbing", 4.77], ["didgeridoo", 4.53]], null, null, null, null, [["music", 42.65], ["foghorn", 9.15], ["double bass", 6.45]], [["music", 62.56], ["mantra", 9.61], ["carnatic music", 3.42]], null, null, null, null, null], "duration": [4.78, 0.53, 0.49, 1.0, 6.55, 0.78, 0.68, 2.59, 0.46, -0.28, 0.84, 0.55, 14.1, 2.02, 0.28, 0.14, 0.85, 0.69, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/kxtAmNDjfj4_filtered.json b/annotations_filtered/kxtAmNDjfj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47cbe70192601b16129554f73612c70fd7dc2c44 --- /dev/null +++ b/annotations_filtered/kxtAmNDjfj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.03], [14.0, 14.67], [16.0, 16.75], [17.0, 17.27], [20.0, 20.85], [25.0, 27.11], [30.0, 31.14], [33.0, 32.93], [36.0, 42.9], [43.0, 43.51], [46.0, 46.97], [49.0, 55.49], [57.0, 57.11], [58.0, 65.13], [66.0, 65.85], [69.0, 69.85], [70.0, 70.95], [71.0, 85.68], [86.0, 87.03], [87.0, 88.69], [89.0, 89.51], [90.0, 90.59], [92.0, 92.3], [93.0, 99.05], [99.0, 104.45], [104.0, 104.5], [105.0, 107.23], [108.0, 108.58], [112.0, 112.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 52.16, 0.0, 0.0, 35.74, 0.0, 0.0, 33.91, 0.0, 35.37, 0.0, 0.0, 0.0, 37.97, 0.0, 0.0, 0.0, 0.0, 0.0, 43.61, 35.89, 0.0, 32.98, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 71.24], ["domestic animals, pets", 5.16], ["animal", 4.22]], null, null, [["speech", 28.67], ["mosquito", 15.03], ["fly, housefly", 14.44]], null, [["fly, housefly", 66.39], ["insect", 20.08], ["mosquito", 11.57]], null, null, null, [["fly, housefly", 40.9], ["insect", 20.61], ["speech", 8.1]], null, null, null, null, null, [["sidetone", 42.05], ["radio", 13.63], ["speech", 10.08]], [["fly, housefly", 50.4], ["insect", 23.01], ["radio", 6.71]], null, [["speech", 13.66], ["radio", 12.44], ["moo", 4.9]], null, null], "duration": [0.03, 0.67, 0.75, 0.27, 0.85, 2.11, 1.14, -0.07, 6.9, 0.51, 0.97, 6.49, 0.11, 7.13, -0.15, 0.85, 0.95, 14.68, 1.03, 1.69, 0.51, 0.59, 0.3, 6.05, 5.45, 0.5, 2.23, 0.58, 0.8]} \ No newline at end of file diff --git a/annotations_filtered/kxu97nWDapM_filtered.json b/annotations_filtered/kxu97nWDapM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f68de540d74aa90d1e8fdfd471534032b1900acf --- /dev/null +++ b/annotations_filtered/kxu97nWDapM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.31], [12.0, 11.97], [14.0, 15.26], [16.0, 17.25], [21.0, 22.35], [25.0, 47.21], [52.0, 55.26], [56.0, 57.27], [58.0, 63.26], [64.0, 64.25], [65.0, 68.28], [69.0, 70.46], [72.0, 72.91], [74.0, 75.14], [76.0, 76.3], [79.0, 80.32], [83.0, 93.29], [99.0, 131.19]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [51.82, 0.0, 0.0, 0.0, 0.0, 49.64, 72.6, 0.0, 87.74, 0.0, 81.71, 0.0, 0.0, 0.0, 0.0, 0.0, 33.25, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 41.64], ["hum", 9.29], ["throbbing", 5.19]], null, null, null, null, null, null, null, null, null, null, [["speech", 69.23], ["music", 9.4], ["whack, thwack", 4.42]], null], "duration": [2.31, -0.03, 1.26, 1.25, 1.35, 22.21, 3.26, 1.27, 5.26, 0.25, 3.28, 1.46, 0.91, 1.14, 0.3, 1.32, 10.29, 32.19]} \ No newline at end of file diff --git a/annotations_filtered/kxvkI8K7fTo_filtered.json b/annotations_filtered/kxvkI8K7fTo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7d7fd1e934b4afe29d3f66a39a02ea264daf912 --- /dev/null +++ b/annotations_filtered/kxvkI8K7fTo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.21], [13.0, 15.4], [26.0, 26.13], [27.0, 30.57], [32.0, 32.07], [33.0, 34.45], [38.0, 38.85], [42.0, 44.12], [47.0, 48.3], [50.0, 50.67], [56.0, 56.61], [57.0, 57.7], [58.0, 59.53], [76.0, 77.36], [91.0, 91.88], [105.0, 106.71], [113.0, 113.34], [113.0, 114.12], [118.0, 123.69], [126.0, 127.06], [135.0, 136.31], [140.0, 140.9], [143.0, 143.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 79.59, 0.0, 63.42, 0.0, 0.0, 0.0, 61.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.66, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 14.65], ["moo", 12.4], ["mosquito", 11.65]], null, null, null, null], "duration": [0.21, 2.4, 0.13, 3.57, 0.07, 1.45, 0.85, 2.12, 1.3, 0.67, 0.61, 0.7, 1.53, 1.36, 0.88, 1.71, 0.34, 1.12, 5.69, 1.06, 1.31, 0.9, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/ky1W2n5RilM_filtered.json b/annotations_filtered/ky1W2n5RilM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff62a0d2b78f3e27e311908eb190566ed9585bd8 --- /dev/null +++ b/annotations_filtered/ky1W2n5RilM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 28.97], [30.0, 98.68], [100.0, 101.02], [102.0, 105.14], [107.0, 107.65], [109.0, 110.2], [111.0, 112.21], [115.0, 115.62], [119.0, 120.66], [122.0, 123.5], [128.0, 129.44]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.15, 0.0, 0.0, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 24.63], ["speech", 21.84], ["carnatic music", 7.75]], null, null, null, null, null, null, null, null, null, null], "duration": [15.97, 68.68, 1.02, 3.14, 0.65, 1.2, 1.21, 0.62, 1.66, 1.5, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/ky1semsHhAY_filtered.json b/annotations_filtered/ky1semsHhAY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f291aeb2f1ffb8accf0dc754f8228a8a6172ca3 --- /dev/null +++ b/annotations_filtered/ky1semsHhAY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.82], [13.0, 14.01], [16.0, 16.61], [19.0, 25.1], [27.0, 29.35], [31.0, 31.82], [33.0, 37.37], [38.0, 41.12], [42.0, 45.72], [47.0, 48.83], [50.0, 55.22], [56.0, 56.44], [57.0, 60.88], [63.0, 88.33], [90.0, 96.84], [99.0, 98.9], [104.0, 105.6], [110.0, 111.48], [116.0, 116.75], [118.0, 118.3], [120.0, 122.25], [123.0, 123.36], [125.0, 126.0], [127.0, 128.49]], "keep_status": [false, false, false, true, true, false, false, true, true, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 45.52, 37.89, 0.0, 51.71, 41.83, 39.25, 0.0, 49.97, 0.0, 32.83, 80.11, 45.05, 0.0, 0.0, 0.0, 0.0, 0.0, 31.02, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["whale vocalization", 20.95], ["howl", 16.04], ["animal", 14.99]], [["singing bowl", 18.35], ["music", 14.72], ["wind instrument, woodwind instrument", 8.27]], null, null, [["mains hum", 21.56], ["speech", 18.76], ["music", 12.4]], [["music", 30.21], ["theremin", 19.26], ["foghorn", 15.66]], null, [["mains hum", 20.34], ["music", 17.71], ["hum", 14.07]], null, [["speech", 74.31], ["sidetone", 9.6], ["busy signal", 3.58]], null, [["hum", 31.12], ["whale vocalization", 6.66], ["throbbing", 6.37]], null, null, null, null, null, [["speech", 83.98], ["telephone", 8.74], ["dial tone", 1.83]], null, null, null], "duration": [1.82, 1.01, 0.61, 6.1, 2.35, 0.82, 4.37, 3.12, 3.72, 1.83, 5.22, 0.44, 3.88, 25.33, 6.84, -0.1, 1.6, 1.48, 0.75, 0.3, 2.25, 0.36, 1.0, 1.49]} \ No newline at end of file diff --git a/annotations_filtered/kyGcsRDBJLM_filtered.json b/annotations_filtered/kyGcsRDBJLM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7dcda4181f642371d986f6f9727d7fdf7075fb11 --- /dev/null +++ b/annotations_filtered/kyGcsRDBJLM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 47.34], [48.0, 52.78], [56.0, 55.78], [57.0, 74.98], [76.0, 75.95]], "keep_status": [true, true, false, true, false], "silence_prob": [31.16, 44.6, 0.0, 32.58, 0.0], "audiomae_on_audioset": [[["music", 54.72], ["hum", 7.0], ["noise", 6.97]], [["hum", 39.2], ["music", 17.04], ["mains hum", 9.98]], null, [["music", 51.27], ["noise", 12.0], ["synthesizer", 6.36]], null], "duration": [14.34, 4.78, -0.22, 17.98, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/kyY50rBet2U_filtered.json b/annotations_filtered/kyY50rBet2U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00b1f777ae6e1d9bd92824cfcb59eb2a5657d9e2 --- /dev/null +++ b/annotations_filtered/kyY50rBet2U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 24.27], [32.0, 37.71], [38.0, 40.73], [43.0, 50.16], [51.0, 53.87], [54.0, 58.95], [65.0, 67.66]], "keep_status": [true, true, false, false, false, true, true], "silence_prob": [30.05, 30.65, 34.96, 29.27, 30.33, 30.55, 33.06], "audiomae_on_audioset": [[["music", 33.57], ["throbbing", 15.47], ["hum", 11.87]], [["cattle, bovinae", 19.05], ["throbbing", 15.33], ["music", 14.57]], [["music", 31.36], ["hum", 23.89], ["throbbing", 19.38]], [["speech", 69.64], ["explosion", 3.67], ["music", 3.58]], [["speech", 39.2], ["music", 37.44], ["sidetone", 4.54]], [["speech", 59.49], ["vehicle", 5.25], ["mains hum", 4.06]], [["music", 26.83], ["speech", 23.91], ["hum", 9.02]]], "duration": [2.27, 5.71, 2.73, 7.16, 2.87, 4.95, 2.66]} \ No newline at end of file diff --git a/annotations_filtered/kye191FZmeU_filtered.json b/annotations_filtered/kye191FZmeU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de8944f173c642a1efbdf9a075c93d9c8a64712d --- /dev/null +++ b/annotations_filtered/kye191FZmeU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.43], [8.0, 11.91], [15.0, 19.01], [19.0, 22.3], [34.0, 37.61], [39.0, 40.07], [41.0, 41.18], [43.0, 43.48], [44.0, 45.03], [46.0, 46.55], [51.0, 50.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.97, 91.64, 99.48, 98.99, 75.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [3.43, 3.91, 4.01, 3.3, 3.61, 1.07, 0.18, 0.48, 1.03, 0.55, -0.11]} \ No newline at end of file diff --git a/annotations_filtered/kyfMjDlcisQ_filtered.json b/annotations_filtered/kyfMjDlcisQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee7e7bc4451f91a3089d3682dfd10f961e647bb8 --- /dev/null +++ b/annotations_filtered/kyfMjDlcisQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.99], [16.0, 18.12], [19.0, 41.74], [45.0, 46.41], [48.0, 55.88], [58.0, 68.22], [75.0, 82.39]], "keep_status": [true, false, false, false, false, false, false], "silence_prob": [30.41, 29.3, 29.64, 0.0, 29.55, 29.76, 29.34], "audiomae_on_audioset": [[["music", 58.27], ["guitar", 4.39], ["musical instrument", 3.92]], [["music", 69.32], ["guitar", 5.87], ["plucked string instrument", 4.08]], [["music", 63.3], ["hum", 5.12], ["synthesizer", 4.78]], null, [["music", 67.39], ["sitar", 13.35], ["carnatic music", 7.55]], [["music", 53.99], ["hum", 13.91], ["throbbing", 11.6]], [["music", 59.75], ["sitar", 9.18], ["carnatic music", 7.96]]], "duration": [4.99, 2.12, 22.74, 1.41, 7.88, 10.22, 7.39]} \ No newline at end of file diff --git a/annotations_filtered/kytDzjuBGJI_filtered.json b/annotations_filtered/kytDzjuBGJI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/kytDzjuBGJI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/kzVO5JrnEJ8_filtered.json b/annotations_filtered/kzVO5JrnEJ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3caefeaa8657d212ab40c762e8d3f70ef5e69381 --- /dev/null +++ b/annotations_filtered/kzVO5JrnEJ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.38], [10.0, 10.29], [11.0, 11.82], [20.0, 20.01], [22.0, 23.08], [24.0, 24.8], [27.0, 27.33], [28.0, 32.56], [34.0, 33.86], [38.0, 40.98], [49.0, 51.26], [56.0, 57.0], [64.0, 64.57], [69.0, 71.68], [75.0, 75.22], [77.0, 79.79], [84.0, 85.26], [96.0, 98.56], [100.0, 104.41], [107.0, 108.41], [110.0, 110.66], [112.0, 116.94], [122.0, 123.03], [124.0, 124.56], [125.0, 124.6], [125.0, 126.17], [134.0, 135.92], [137.0, 143.29], [144.0, 144.49], [152.0, 153.0]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [85.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.07, 0.0, 42.84, 50.41, 0.0, 0.0, 60.6, 0.0, 35.73, 0.0, 70.44, 99.1, 0.0, 0.0, 84.62, 0.0, 0.0, 0.0, 0.0, 0.0, 66.76, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 35.95], ["music", 23.96], ["hum", 9.06]], null, null, null, null, null, [["music", 42.56], ["applause", 24.52], ["crowd", 3.86]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.38, 0.29, 0.82, 0.01, 1.08, 0.8, 0.33, 4.56, -0.14, 2.98, 2.26, 1.0, 0.57, 2.68, 0.22, 2.79, 1.26, 2.56, 4.41, 1.41, 0.66, 4.94, 1.03, 0.56, -0.4, 1.17, 1.92, 6.29, 0.49, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/kzZQYnvw-6E_filtered.json b/annotations_filtered/kzZQYnvw-6E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e250924417f5bd5e6271b8f793e8e8ac862bf49 --- /dev/null +++ b/annotations_filtered/kzZQYnvw-6E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 27.04], [28.0, 30.62], [35.0, 36.56], [38.0, 40.59], [42.0, 42.74], [44.0, 51.06], [55.0, 58.97], [62.0, 65.37], [79.0, 79.02], [83.0, 82.63], [92.0, 92.62], [103.0, 103.96], [106.0, 106.0], [108.0, 108.24], [113.0, 117.14], [119.0, 127.31], [132.0, 132.63], [134.0, 137.71], [151.0, 151.88], [153.0, 162.89], [164.0, 166.18], [171.0, 171.69]], "keep_status": [true, true, false, true, false, false, true, false, false, false, false, false, false, false, true, true, false, true, false, false, true, false], "silence_prob": [31.87, 33.45, 0.0, 30.33, 0.0, 31.69, 34.35, 42.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.65, 30.95, 0.0, 32.0, 0.0, 30.54, 29.93, 0.0], "audiomae_on_audioset": [[["speech", 26.01], ["thunk", 11.18], ["explosion", 8.42]], [["roaring cats (lions, tigers)", 17.26], ["animal", 15.75], ["roar", 13.9]], null, [["speech", 46.09], ["grunt", 14.66], ["fart", 8.91]], null, [["cattle, bovinae", 46.48], ["moo", 25.63], ["livestock, farm animals, working animals", 16.75]], [["groan", 50.44], ["grunt", 11.14], ["roar", 4.96]], [["speech", 79.75], ["sine wave", 2.76], ["sidetone", 1.68]], null, null, null, null, null, null, [["whack, thwack", 27.44], ["speech", 18.8], ["music", 9.42]], [["music", 33.3], ["speech", 17.03], ["groan", 17.0]], null, [["speech", 16.28], ["music", 6.88], ["hum", 6.78]], null, [["speech", 36.5], ["music", 36.33], ["didgeridoo", 10.63]], [["speech", 28.85], ["groan", 13.62], ["cattle, bovinae", 5.8]], null], "duration": [4.04, 2.62, 1.56, 2.59, 0.74, 7.06, 3.97, 3.37, 0.02, -0.37, 0.62, 0.96, 0.0, 0.24, 4.14, 8.31, 0.63, 3.71, 0.88, 9.89, 2.18, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/kzf7hr9O00k_filtered.json b/annotations_filtered/kzf7hr9O00k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f9866c94894100de6a12ce50c0e343154abc4ba --- /dev/null +++ b/annotations_filtered/kzf7hr9O00k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.38], [14.0, 14.34], [16.0, 17.12], [25.0, 26.16], [40.0, 43.5], [44.0, 43.63], [52.0, 53.67], [56.0, 60.2], [63.0, 67.26], [68.0, 75.68], [81.0, 81.53], [87.0, 88.64], [94.0, 94.56], [105.0, 105.6], [111.0, 112.04], [113.0, 113.39], [122.0, 122.59], [126.0, 126.05], [133.0, 133.22], [141.0, 141.47]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.77, 0.0, 0.0, 34.41, 33.93, 35.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 53.46], ["speech", 6.61], ["electronic music", 4.32]], null, null, [["music", 67.92], ["musical instrument", 6.36], ["didgeridoo", 3.8]], [["speech", 48.82], ["music", 35.76], ["throbbing", 3.53]], [["music", 34.12], ["speech", 16.33], ["didgeridoo", 15.29]], null, null, null, null, null, null, null, null, null, null], "duration": [0.38, 0.34, 1.12, 1.16, 3.5, -0.37, 1.67, 4.2, 4.26, 7.68, 0.53, 1.64, 0.56, 0.6, 1.04, 0.39, 0.59, 0.05, 0.22, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/kzu2Gwn-sPA_filtered.json b/annotations_filtered/kzu2Gwn-sPA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59b5bba0e2d52b8c139ee7ef8da66bf2bc845ead --- /dev/null +++ b/annotations_filtered/kzu2Gwn-sPA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.54], [7.0, 8.5], [13.0, 12.8], [17.0, 17.1], [19.0, 19.52], [28.0, 28.38], [32.0, 31.7], [40.0, 40.9], [49.0, 49.3], [52.0, 52.3], [53.0, 57.84], [58.0, 59.26], [62.0, 62.45], [64.0, 64.45], [68.0, 68.93], [72.0, 72.25], [74.0, 75.2], [77.0, 77.87], [79.0, 79.17], [82.0, 82.66], [83.0, 84.35], [85.0, 87.27], [90.0, 90.63], [96.0, 96.25], [98.0, 98.76], [104.0, 104.97], [107.0, 107.81], [109.0, 112.68], [113.0, 114.42], [117.0, 117.96], [119.0, 120.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 83.88, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 79.84], ["noise", 2.63], ["boing", 1.79]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.46, 1.5, -0.2, 0.1, 0.52, 0.38, -0.3, 0.9, 0.3, 0.3, 4.84, 1.26, 0.45, 0.45, 0.93, 0.25, 1.2, 0.87, 0.17, 0.66, 1.35, 2.27, 0.63, 0.25, 0.76, 0.97, 0.81, 3.68, 1.42, 0.96, 1.97]} \ No newline at end of file diff --git a/annotations_filtered/kzueHOeJk40_filtered.json b/annotations_filtered/kzueHOeJk40_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83016d7fe1f2555ac595d42a05a59bc2f7415dc6 --- /dev/null +++ b/annotations_filtered/kzueHOeJk40_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 32.63], [34.0, 35.95], [51.0, 52.51], [58.0, 58.09], [74.0, 78.22], [79.0, 83.17], [85.0, 85.67], [88.0, 89.16], [95.0, 96.25], [99.0, 99.76], [103.0, 103.17], [109.0, 110.1], [127.0, 127.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.75, 40.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 69.97], ["singing", 5.48], ["a capella", 4.13]], [["music", 80.0], ["musical instrument", 2.75], ["guitar", 2.69]], null, null, null, null, null, null, null], "duration": [1.63, 1.95, 1.51, 0.09, 4.22, 4.17, 0.67, 1.16, 1.25, 0.76, 0.17, 1.1, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/kzxSZ5zCfXs_filtered.json b/annotations_filtered/kzxSZ5zCfXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5aa9b16a9f60d67a6bcaf1f387f8699d78656a68 --- /dev/null +++ b/annotations_filtered/kzxSZ5zCfXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 29.1], [30.0, 34.7], [36.0, 40.37], [41.0, 53.47], [56.0, 58.72], [60.0, 61.2], [64.0, 65.35]], "keep_status": [false, true, true, true, false, false, false], "silence_prob": [28.96, 28.76, 28.91, 29.13, 29.6, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 45.01], ["buzz", 17.46], ["vehicle", 11.94]], [["speech", 44.77], ["vehicle", 20.06], ["hum", 4.91]], [["hum", 27.95], ["mains hum", 18.24], ["breaking", 9.42]], [["speech", 23.24], ["electric shaver, electric razor", 18.65], ["buzz", 15.01]], [["mains hum", 46.39], ["hum", 28.84], ["speech", 7.44]], null, null], "duration": [4.1, 4.7, 4.37, 12.47, 2.72, 1.2, 1.35]} \ No newline at end of file diff --git a/annotations_filtered/kzxz5xezOAI_filtered.json b/annotations_filtered/kzxz5xezOAI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b896f7ae2c3e50c308d40585c38ed0c20fe00bab --- /dev/null +++ b/annotations_filtered/kzxz5xezOAI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 13.15], [15.0, 15.85], [23.0, 24.14], [29.0, 30.5], [32.0, 32.95], [34.0, 34.42], [37.0, 38.25], [46.0, 47.53], [54.0, 54.19], [56.0, 57.99], [59.0, 60.03], [62.0, 66.97], [69.0, 70.02], [71.0, 72.03], [73.0, 81.43], [84.0, 84.08]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [44.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.05, 0.0, 0.0, 32.04, 0.0], "audiomae_on_audioset": [[["noise", 26.46], ["hum", 15.62], ["music", 10.78]], null, null, null, null, null, null, null, null, null, null, [["speech", 26.45], ["whale vocalization", 24.88], ["hum", 8.82]], null, null, [["speech", 44.02], ["animal", 7.14], ["electric shaver, electric razor", 6.3]], null], "duration": [7.15, 0.85, 1.14, 1.5, 0.95, 0.42, 1.25, 1.53, 0.19, 1.99, 1.03, 4.97, 1.02, 1.03, 8.43, 0.08]} \ No newline at end of file