diff --git a/annotations_filtered/f-3Bldu8BJ4_filtered.json b/annotations_filtered/f-3Bldu8BJ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9848ec3a303b5eee661e37f01b35ed22aef2be6 --- /dev/null +++ b/annotations_filtered/f-3Bldu8BJ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.09], [8.0, 10.2], [12.0, 15.55], [17.0, 19.48], [21.0, 26.1], [27.0, 31.06], [33.0, 36.26], [37.0, 43.83], [44.0, 46.18], [46.0, 46.21], [64.0, 64.45], [66.0, 70.31], [75.0, 77.09], [82.0, 81.92], [85.0, 89.72], [93.0, 98.47], [100.0, 99.94], [103.0, 109.32], [110.0, 111.86], [113.0, 115.91], [117.0, 127.53], [128.0, 130.23], [132.0, 133.1], [137.0, 137.61], [138.0, 141.12], [144.0, 150.92], [153.0, 156.61], [157.0, 158.53], [159.0, 160.78], [162.0, 162.58], [164.0, 163.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [73.51, 87.92, 82.07, 81.35, 79.41, 78.38, 82.07, 94.81, 73.97, 0.0, 0.0, 62.68, 80.82, 0.0, 68.67, 74.44, 0.0, 57.64, 0.0, 99.59, 64.63, 84.98, 0.0, 0.0, 81.35, 68.8, 75.88, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.09, 2.2, 3.55, 2.48, 5.1, 4.06, 3.26, 6.83, 2.18, 0.21, 0.45, 4.31, 2.09, -0.08, 4.72, 5.47, -0.06, 6.32, 1.86, 2.91, 10.53, 2.23, 1.1, 0.61, 3.12, 6.92, 3.61, 1.53, 1.78, 0.58, -0.14]} \ No newline at end of file diff --git a/annotations_filtered/f-77xulkB_U_filtered.json b/annotations_filtered/f-77xulkB_U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d570e95f68f75880a73741990e07a3004638e815 --- /dev/null +++ b/annotations_filtered/f-77xulkB_U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.71], [11.0, 13.29], [15.0, 15.42], [17.0, 17.42], [21.0, 21.61], [25.0, 26.1], [27.0, 27.84], [29.0, 29.1], [31.0, 32.07], [35.0, 35.8], [38.0, 39.34], [40.0, 40.44], [41.0, 43.6], [45.0, 50.36], [54.0, 65.74], [67.0, 68.81], [91.0, 92.01], [101.0, 102.76], [107.0, 107.16], [108.0, 109.71], [110.0, 111.23], [112.0, 113.05], [119.0, 121.02], [123.0, 123.36], [126.0, 129.09], [130.0, 135.67], [136.0, 137.47], [139.0, 140.0], [147.0, 150.38], [151.0, 152.25], [154.0, 154.92], [159.0, 159.46], [161.0, 161.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [42.48, 38.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.4, 64.86, 31.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.74, 0.0, 47.23, 46.61, 0.0, 0.0, 45.21, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["sidetone", 60.55], ["speech", 22.86], ["radio", 4.85]], [["speech", 70.08], ["sidetone", 14.6], ["radio", 4.19]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 88.4], ["boing", 2.93], ["sidetone", 0.99]], null, null, null, null, null, null, null, [["speech", 64.18], ["telephone", 9.45], ["dial tone", 8.38]], null, [["music", 38.45], ["crushing", 28.34], ["musical instrument", 4.74]], [["music", 44.91], ["crushing", 11.43], ["effects unit", 10.28]], null, null, [["music", 49.38], ["didgeridoo", 8.44], ["theremin", 4.49]], null, null, null, null], "duration": [3.71, 2.29, 0.42, 0.42, 0.61, 1.1, 0.84, 0.1, 1.07, 0.8, 1.34, 0.44, 2.6, 5.36, 11.74, 1.81, 1.01, 1.76, 0.16, 1.71, 1.23, 1.05, 2.02, 0.36, 3.09, 5.67, 1.47, 1.0, 3.38, 1.25, 0.92, 0.46, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/f-DgdMpSo7c_filtered.json b/annotations_filtered/f-DgdMpSo7c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7636d5df11ca5c208bf03ce5a17e619a9da05b1 --- /dev/null +++ b/annotations_filtered/f-DgdMpSo7c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 17.51], [28.0, 28.81], [29.0, 29.49], [30.0, 30.15], [31.0, 30.75], [32.0, 32.7], [33.0, 33.56], [35.0, 35.73], [37.0, 37.77], [39.0, 39.41], [40.0, 40.41], [41.0, 41.37], [42.0, 43.02], [47.0, 47.33], [49.0, 68.05], [76.0, 77.36], [84.0, 85.35], [92.0, 93.87], [98.0, 98.04], [100.0, 100.48], [110.0, 122.69], [123.0, 122.82], [126.0, 125.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.36, 0.0, 0.0, 0.0, 0.0, 0.0, 41.34, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 30.5], ["mosquito", 13.89], ["cattle, bovinae", 12.98]], null, null, null, null, null, [["music", 48.63], ["groan", 6.31], ["fart", 5.29]], null, null], "duration": [5.51, 0.81, 0.49, 0.15, -0.25, 0.7, 0.56, 0.73, 0.77, 0.41, 0.41, 0.37, 1.02, 0.33, 19.05, 1.36, 1.35, 1.87, 0.04, 0.48, 12.69, -0.18, -0.21]} \ No newline at end of file diff --git a/annotations_filtered/f-DiniX_1mI_filtered.json b/annotations_filtered/f-DiniX_1mI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4bf08c41fc2b79477fdacee974b9fbb27f01d0d0 --- /dev/null +++ b/annotations_filtered/f-DiniX_1mI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.78], [17.0, 17.74], [18.0, 20.87], [28.0, 29.39], [30.0, 30.75], [33.0, 35.83], [37.0, 37.66], [39.0, 39.78], [41.0, 44.93], [48.0, 54.73], [69.0, 72.22]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 64.41, 0.0, 0.0, 31.25, 0.0, 0.0, 32.17, 29.61, 60.42], "audiomae_on_audioset": [null, null, null, null, null, [["explosion", 38.09], ["gunshot, gunfire", 18.54], ["burst, pop", 18.34]], null, null, [["explosion", 36.08], ["burst, pop", 14.05], ["gunshot, gunfire", 9.82]], [["gunshot, gunfire", 29.6], ["explosion", 13.98], ["clang", 9.46]], null], "duration": [0.78, 0.74, 2.87, 1.39, 0.75, 2.83, 0.66, 0.78, 3.93, 6.73, 3.22]} \ No newline at end of file diff --git a/annotations_filtered/f-EjBwpuVFI_filtered.json b/annotations_filtered/f-EjBwpuVFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..327a97dac1267e092dd2c587ff0fac2615669909 --- /dev/null +++ b/annotations_filtered/f-EjBwpuVFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 23.82], [30.0, 43.38], [46.0, 49.06], [51.0, 51.31], [54.0, 56.74], [66.0, 66.99], [74.0, 75.71], [77.0, 76.96], [79.0, 80.43], [84.0, 86.26], [89.0, 99.25], [99.0, 103.98], [104.0, 118.42], [123.0, 134.65], [139.0, 141.72], [149.0, 149.93], [151.0, 152.76], [158.0, 158.43], [171.0, 173.94]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, true, true, false, false, false, false, true], "silence_prob": [34.94, 37.89, 43.56, 0.0, 37.98, 0.0, 0.0, 0.0, 0.0, 40.9, 38.84, 48.31, 37.31, 34.63, 44.55, 0.0, 0.0, 0.0, 39.61], "audiomae_on_audioset": [[["music", 56.38], ["hum", 8.73], ["musical instrument", 5.93]], [["music", 59.06], ["didgeridoo", 17.49], ["insect", 3.35]], [["music", 76.92], ["didgeridoo", 3.25], ["musical instrument", 2.48]], null, [["music", 67.29], ["electronic music", 6.86], ["synthesizer", 3.75]], null, null, null, null, [["speech", 32.91], ["music", 15.78], ["hum", 15.63]], [["music", 70.01], ["hum", 5.02], ["electronic music", 3.41]], [["music", 35.05], ["speech", 24.42], ["whale vocalization", 8.18]], [["music", 35.91], ["speech", 21.4], ["whale vocalization", 5.14]], [["music", 31.24], ["hum", 25.55], ["throbbing", 11.53]], [["music", 49.66], ["pulse", 18.57], ["theremin", 6.33]], null, null, null, [["music", 42.22], ["buzz", 9.42], ["didgeridoo", 4.76]]], "duration": [16.82, 13.38, 3.06, 0.31, 2.74, 0.99, 1.71, -0.04, 1.43, 2.26, 10.25, 4.98, 14.42, 11.65, 2.72, 0.93, 1.76, 0.43, 2.94]} \ No newline at end of file diff --git a/annotations_filtered/f-PnGRaJaSA_filtered.json b/annotations_filtered/f-PnGRaJaSA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e67e0234ff210c5f07e9a0506823bfd536d4a39 --- /dev/null +++ b/annotations_filtered/f-PnGRaJaSA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.1], [6.0, 6.54], [7.0, 7.75], [9.0, 8.92], [13.0, 12.68], [14.0, 14.23], [35.0, 37.99], [49.0, 49.81], [52.0, 53.1], [56.0, 57.27], [66.0, 66.6], [68.0, 68.88], [73.0, 73.58], [75.0, 77.7], [90.0, 90.41], [105.0, 105.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.91, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 52.34], ["theremin", 23.65], ["throbbing", 3.55]], null, null, null, null, null, null, [["theremin", 40.58], ["music", 34.95], ["musical instrument", 4.81]], null, null], "duration": [1.1, 0.54, 0.75, -0.08, -0.32, 0.23, 2.99, 0.81, 1.1, 1.27, 0.6, 0.88, 0.58, 2.7, 0.41, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/f-vA6GMMKgQ_filtered.json b/annotations_filtered/f-vA6GMMKgQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..207a23b535a1a9d7b07d040ee4fcf47fb035c258 --- /dev/null +++ b/annotations_filtered/f-vA6GMMKgQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.1], [6.0, 7.28], [10.0, 10.57], [19.0, 19.94], [22.0, 22.23], [24.0, 24.61], [26.0, 26.62], [34.0, 34.5], [38.0, 37.76], [41.0, 41.54], [42.0, 42.38], [49.0, 53.08], [54.0, 54.65], [56.0, 57.11], [60.0, 60.91], [64.0, 64.66], [67.0, 67.46], [83.0, 83.22], [89.0, 90.04], [95.0, 95.1], [100.0, 99.89], [101.0, 101.73], [103.0, 107.06], [113.0, 114.07], [114.0, 115.5], [116.0, 116.4], [117.0, 117.37], [120.0, 120.16], [122.0, 122.34], [125.0, 124.87], [126.0, 126.37], [127.0, 127.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [84.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.1, 1.28, 0.57, 0.94, 0.23, 0.61, 0.62, 0.5, -0.24, 0.54, 0.38, 4.08, 0.65, 1.11, 0.91, 0.66, 0.46, 0.22, 1.04, 0.1, -0.11, 0.73, 4.06, 1.07, 1.5, 0.4, 0.37, 0.16, 0.34, -0.13, 0.37, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/f0-Ea9Ki7YU_filtered.json b/annotations_filtered/f0-Ea9Ki7YU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3cf71aaa6185c4382b70c3a038ce1aa5a68d25d7 --- /dev/null +++ b/annotations_filtered/f0-Ea9Ki7YU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.48], [15.0, 35.48], [40.0, 96.01], [97.0, 98.04], [100.0, 120.31], [121.0, 121.78], [127.0, 127.33], [129.0, 130.23], [132.0, 132.21], [133.0, 133.93], [138.0, 138.33], [139.0, 140.86], [141.0, 148.05], [149.0, 151.87], [153.0, 154.65], [156.0, 179.29], [180.0, 180.76]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [28.68, 28.37, 0.0, 0.0, 31.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.79, 64.52, 0.0, 29.87, 0.0], "audiomae_on_audioset": [[["music", 43.22], ["buzzer", 10.91], ["theremin", 8.38]], [["music", 71.47], ["didgeridoo", 8.21], ["musical instrument", 3.24]], null, null, [["trombone", 23.01], ["music", 22.49], ["brass instrument", 21.31]], null, null, null, null, null, null, null, null, null, null, [["theremin", 60.98], ["music", 30.85], ["musical instrument", 0.87]], null], "duration": [3.48, 20.48, 56.01, 1.04, 20.31, 0.78, 0.33, 1.23, 0.21, 0.93, 0.33, 1.86, 7.05, 2.87, 1.65, 23.29, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/f06qimixOOI_filtered.json b/annotations_filtered/f06qimixOOI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39bf11a64bc30e5bd67f7fde2bcca26fcb93a4bf --- /dev/null +++ b/annotations_filtered/f06qimixOOI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.31], [5.0, 6.67], [9.0, 18.32], [20.0, 28.16], [31.0, 51.14], [52.0, 51.71], [55.0, 55.05], [56.0, 65.67], [67.0, 69.21], [73.0, 83.49], [86.0, 91.59]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 81.53, 72.31, 33.6, 0.0, 0.0, 30.5, 50.56, 46.47, 29.07], "audiomae_on_audioset": [null, null, null, null, [["music", 61.82], ["musical instrument", 4.5], ["singing bowl", 2.76]], null, null, [["music", 18.4], ["livestock, farm animals, working animals", 17.67], ["cattle, bovinae", 10.12]], null, [["music", 61.56], ["effects unit", 9.36], ["guitar", 6.42]], [["didgeridoo", 33.32], ["speech", 28.02], ["music", 23.54]]], "duration": [1.31, 1.67, 9.32, 8.16, 20.14, -0.29, 0.05, 9.67, 2.21, 10.49, 5.59]} \ No newline at end of file diff --git a/annotations_filtered/f08pzusjWTQ_filtered.json b/annotations_filtered/f08pzusjWTQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..adf7ec0f779b2253ad06fea342c92652bbea6e13 --- /dev/null +++ b/annotations_filtered/f08pzusjWTQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.46], [4.0, 5.04], [9.0, 9.69], [11.0, 12.01], [15.0, 16.85], [18.0, 18.67], [20.0, 20.95], [23.0, 24.12], [25.0, 26.79], [28.0, 30.48], [32.0, 36.49], [38.0, 43.26], [47.0, 57.3], [59.0, 59.63], [63.0, 63.78], [70.0, 77.75], [79.0, 80.65], [82.0, 82.31], [83.0, 84.79], [86.0, 87.02], [88.0, 88.99], [96.0, 96.74], [100.0, 100.87], [107.0, 108.62], [110.0, 110.42], [111.0, 116.38], [118.0, 119.45], [123.0, 127.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.07, 92.97, 98.44, 47.58, 0.0, 0.0, 58.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.66, 0.0, 41.09], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 44.34], ["music", 37.89], ["effects unit", 3.76]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 54.02], ["music", 18.27], ["speech", 9.82]]], "duration": [1.46, 1.04, 0.69, 1.01, 1.85, 0.67, 0.95, 1.12, 1.79, 2.48, 4.49, 5.26, 10.3, 0.63, 0.78, 7.75, 1.65, 0.31, 1.79, 1.02, 0.99, 0.74, 0.87, 1.62, 0.42, 5.38, 1.45, 4.36]} \ No newline at end of file diff --git a/annotations_filtered/f0MBL-DyXaE_filtered.json b/annotations_filtered/f0MBL-DyXaE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7497aff61c67a8323a8d8ee1acf72fc4de0086cb --- /dev/null +++ b/annotations_filtered/f0MBL-DyXaE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.89], [5.0, 13.51], [14.0, 13.61], [16.0, 29.4], [33.0, 33.25], [39.0, 39.24], [49.0, 51.16], [53.0, 54.36], [55.0, 57.1], [58.0, 59.54], [62.0, 63.91], [66.0, 66.53], [75.0, 76.01], [77.0, 79.98], [81.0, 81.16], [82.0, 82.24], [85.0, 85.62]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [65.91, 37.51, 0.0, 36.31, 0.0, 0.0, 67.51, 0.0, 99.82, 0.0, 0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 44.8], ["music", 10.92], ["explosion", 5.67]], null, [["motorboat, speedboat", 29.02], ["boat, water vehicle", 23.89], ["music", 9.57]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.89, 8.51, -0.39, 13.4, 0.25, 0.24, 2.16, 1.36, 2.1, 1.54, 1.91, 0.53, 1.01, 2.98, 0.16, 0.24, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/f0eTISgJ3Io_filtered.json b/annotations_filtered/f0eTISgJ3Io_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f14a314bb9c20b55d4040db8dae7015a926403b --- /dev/null +++ b/annotations_filtered/f0eTISgJ3Io_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[54.0, 54.84], [57.0, 56.84], [61.0, 76.76], [78.0, 79.32], [85.0, 87.05], [88.0, 89.53]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.92, 0.0, 33.01, 0.0], "audiomae_on_audioset": [null, null, [["speech", 78.94], ["fart", 8.14], ["throbbing", 1.8]], null, [["hum", 29.92], ["mains hum", 25.36], ["throbbing", 17.83]], null], "duration": [0.84, -0.16, 15.76, 1.32, 2.05, 1.53]} \ No newline at end of file diff --git a/annotations_filtered/f0sDG0nnftw_filtered.json b/annotations_filtered/f0sDG0nnftw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aab1ab2850bfafa19bcefcfeb0439425c6815270 --- /dev/null +++ b/annotations_filtered/f0sDG0nnftw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 40.37], [51.0, 51.85], [53.0, 53.25], [54.0, 62.99], [79.0, 86.36], [91.0, 91.88], [95.0, 99.27], [101.0, 105.53]], "keep_status": [false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.42, 80.82, 0.0, 78.21, 63.96], "audiomae_on_audioset": [null, null, null, [["music", 43.94], ["didgeridoo", 10.07], ["musical instrument", 9.0]], null, null, null, null], "duration": [33.37, 0.85, 0.25, 8.99, 7.36, 0.88, 4.27, 4.53]} \ No newline at end of file diff --git a/annotations_filtered/f0wEV9jySXg_filtered.json b/annotations_filtered/f0wEV9jySXg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c6e1bb6fb7659f0bc46b57ef5ae3a9e97614828 --- /dev/null +++ b/annotations_filtered/f0wEV9jySXg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.85], [5.0, 5.17], [6.0, 7.75], [9.0, 9.64], [12.0, 11.72], [16.0, 16.88], [20.0, 20.88], [21.0, 22.4], [33.0, 33.84], [34.0, 35.9], [38.0, 39.39], [51.0, 51.6], [60.0, 59.97], [60.0, 60.69], [62.0, 63.1], [69.0, 70.21], [75.0, 75.63], [78.0, 82.0], [83.0, 84.69], [86.0, 89.63], [91.0, 92.31], [93.0, 94.81], [96.0, 96.08], [100.0, 100.52], [103.0, 103.94], [105.0, 105.6], [108.0, 108.21], [110.0, 110.17], [118.0, 123.2], [124.0, 125.25], [127.0, 129.39], [129.0, 130.59], [133.0, 142.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.53, 0.0, 100.0, 0.0, 81.53], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.15, 0.17, 1.75, 0.64, -0.28, 0.88, 0.88, 1.4, 0.84, 1.9, 1.39, 0.6, -0.03, 0.69, 1.1, 1.21, 0.63, 4.0, 1.69, 3.63, 1.31, 1.81, 0.08, 0.52, 0.94, 0.6, 0.21, 0.17, 5.2, 1.25, 2.39, 1.59, 9.01]} \ No newline at end of file diff --git a/annotations_filtered/f187FGFi1AM_filtered.json b/annotations_filtered/f187FGFi1AM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e50006310d145949bd683ddfd2e15c83a0d6ab9 --- /dev/null +++ b/annotations_filtered/f187FGFi1AM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.13], [8.0, 9.85], [11.0, 17.17], [18.0, 24.78], [25.0, 25.1], [25.0, 26.55], [27.0, 32.22], [32.0, 33.0], [34.0, 35.78], [36.0, 64.99], [66.0, 67.51], [69.0, 79.95], [81.0, 83.19], [84.0, 84.67], [86.0, 87.15], [89.0, 90.73], [91.0, 121.1], [122.0, 122.55], [124.0, 124.44], [125.0, 125.64]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [65.09, 0.0, 33.75, 38.6, 0.0, 0.0, 34.58, 0.0, 0.0, 46.79, 0.0, 33.49, 62.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 36.24], ["effects unit", 8.84], ["musical instrument", 8.26]], [["music", 68.13], ["theremin", 19.21], ["musical instrument", 2.65]], null, null, [["music", 42.66], ["theremin", 19.64], ["musical instrument", 9.06]], null, null, [["music", 51.97], ["mains hum", 18.42], ["hum", 13.39]], null, [["mains hum", 23.93], ["hum", 22.3], ["speech", 22.11]], null, null, null, null, null, null, null, null], "duration": [2.13, 1.85, 6.17, 6.78, 0.1, 1.55, 5.22, 1.0, 1.78, 28.99, 1.51, 10.95, 2.19, 0.67, 1.15, 1.73, 30.1, 0.55, 0.44, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/f1N8-L5cuWQ_filtered.json b/annotations_filtered/f1N8-L5cuWQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31f76937bbe8c4d03fa4f5ced498dec1b39dc44f --- /dev/null +++ b/annotations_filtered/f1N8-L5cuWQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 10.77], [13.0, 14.34], [18.0, 18.28], [19.0, 21.34], [25.0, 26.52], [30.0, 30.3], [34.0, 34.23], [35.0, 42.2], [43.0, 51.53], [54.0, 55.31], [58.0, 59.36], [67.0, 74.68], [75.0, 79.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.6, 0.0, 0.0, 43.74, 0.0, 0.0, 0.0, 45.36, 59.24, 0.0, 0.0, 32.9, 35.91], "audiomae_on_audioset": [[["speech", 38.31], ["music", 26.71], ["hum", 10.25]], null, null, [["music", 41.61], ["didgeridoo", 21.74], ["quack", 8.38]], null, null, null, [["music", 59.33], ["speech", 16.9], ["hum", 5.7]], null, null, null, [["music", 51.0], ["didgeridoo", 33.82], ["speech", 5.47]], [["music", 43.02], ["hum", 13.8], ["speech", 13.45]]], "duration": [8.77, 1.34, 0.28, 2.34, 1.52, 0.3, 0.23, 7.2, 8.53, 1.31, 1.36, 7.68, 4.15]} \ No newline at end of file diff --git a/annotations_filtered/f1Nh9DlkZ1w_filtered.json b/annotations_filtered/f1Nh9DlkZ1w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd9a330aa9ffe922b4b182988b001d97b50165c0 --- /dev/null +++ b/annotations_filtered/f1Nh9DlkZ1w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 22.44], [23.0, 23.45], [25.0, 49.44]], "keep_status": [true, false, true], "silence_prob": [32.4, 0.0, 41.42], "audiomae_on_audioset": [[["cattle, bovinae", 17.88], ["livestock, farm animals, working animals", 15.71], ["moo", 15.59]], null, [["clip-clop", 31.47], ["horse", 21.88], ["animal", 7.54]]], "duration": [15.44, 0.45, 24.44]} \ No newline at end of file diff --git a/annotations_filtered/f1bk5a_jaEA_filtered.json b/annotations_filtered/f1bk5a_jaEA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66a26ddd90f09051a41dd89b48c7e148e2a6efdd --- /dev/null +++ b/annotations_filtered/f1bk5a_jaEA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.83], [31.0, 31.97], [34.0, 38.6], [40.0, 40.49], [41.0, 57.16], [58.0, 62.01], [77.0, 76.65], [79.0, 78.93], [83.0, 85.68], [89.0, 101.06], [102.0, 102.93], [103.0, 103.81], [104.0, 150.63], [152.0, 154.8], [157.0, 158.16], [161.0, 172.3], [177.0, 177.15], [177.0, 178.09], [179.0, 179.0], [180.0, 179.86], [188.0, 212.45], [218.0, 225.9]], "keep_status": [false, false, true, false, false, true, false, false, true, true, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 36.86, 0.0, 34.94, 30.54, 0.0, 0.0, 30.66, 31.95, 0.0, 0.0, 0.0, 31.69, 0.0, 29.96, 0.0, 0.0, 0.0, 0.0, 31.57, 30.94], "audiomae_on_audioset": [null, null, [["music", 48.99], ["marimba, xylophone", 6.3], ["glockenspiel", 4.12]], null, [["music", 71.17], ["brass instrument", 4.08], ["echo", 2.93]], [["music", 34.83], ["effects unit", 6.56], ["musical instrument", 5.73]], null, null, [["chant", 28.32], ["choir", 12.67], ["music", 12.61]], [["music", 46.92], ["musical instrument", 13.39], ["brass instrument", 5.44]], null, null, null, [["sidetone", 29.36], ["music", 12.03], ["fly, housefly", 10.36]], null, [["music", 73.8], ["theremin", 4.44], ["singing", 2.16]], null, null, null, null, [["music", 36.68], ["didgeridoo", 33.97], ["theremin", 14.9]], [["music", 42.67], ["animal", 11.55], ["noise", 10.9]]], "duration": [1.83, 0.97, 4.6, 0.49, 16.16, 4.01, -0.35, -0.07, 2.68, 12.06, 0.93, 0.81, 46.63, 2.8, 1.16, 11.3, 0.15, 1.09, 0.0, -0.14, 24.45, 7.9]} \ No newline at end of file diff --git a/annotations_filtered/f1fSmptANOU_filtered.json b/annotations_filtered/f1fSmptANOU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6d5db1a42a457e99f177623a112b35d837a6325 --- /dev/null +++ b/annotations_filtered/f1fSmptANOU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.2], [32.0, 32.56], [33.0, 38.6], [43.0, 52.54], [55.0, 56.22], [58.0, 64.45], [67.0, 72.17], [73.0, 73.09], [73.0, 74.01], [75.0, 75.76], [78.0, 78.97], [95.0, 95.32], [96.0, 96.67], [98.0, 98.39], [99.0, 99.33], [101.0, 100.84], [101.0, 101.76], [103.0, 104.14]], "keep_status": [false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.2, 30.89, 0.0, 30.59, 41.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 48.07], ["musical instrument", 7.22], ["noise", 6.32]], [["music", 85.03], ["cacophony", 2.72], ["didgeridoo", 2.32]], null, [["music", 45.42], ["cacophony", 12.36], ["sound effect", 5.73]], [["music", 36.98], ["didgeridoo", 20.6], ["synthesizer", 5.16]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.2, 0.56, 5.6, 9.54, 1.22, 6.45, 5.17, 0.09, 1.01, 0.76, 0.97, 0.32, 0.67, 0.39, 0.33, -0.16, 0.76, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/f1mbRj3ejAk_filtered.json b/annotations_filtered/f1mbRj3ejAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e74efa0197d77af7ace0001d20a95c3ac937f93a --- /dev/null +++ b/annotations_filtered/f1mbRj3ejAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 19.45], [25.0, 26.62], [28.0, 28.31], [30.0, 31.53], [33.0, 33.08], [35.0, 35.19], [36.0, 36.61], [38.0, 38.37], [45.0, 50.4], [51.0, 51.93], [55.0, 57.77], [58.0, 58.13], [59.0, 61.33], [62.0, 76.59], [80.0, 83.1]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, true, true], "silence_prob": [56.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.31, 0.0, 34.73, 0.0, 32.89, 33.06, 32.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 27.47], ["music", 15.36], ["tick-tock", 5.7]], null, [["music", 30.57], ["throbbing", 29.6], ["hum", 13.84]], null, [["music", 50.36], ["didgeridoo", 12.81], ["speech", 3.37]], [["music", 26.82], ["hum", 19.1], ["throbbing", 14.77]], [["speech", 28.3], ["hum", 12.41], ["music", 11.35]]], "duration": [2.45, 1.62, 0.31, 1.53, 0.08, 0.19, 0.61, 0.37, 5.4, 0.93, 2.77, 0.13, 2.33, 14.59, 3.1]} \ No newline at end of file diff --git a/annotations_filtered/f20aUH5IG9s_filtered.json b/annotations_filtered/f20aUH5IG9s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d15fb3f919d1bef99b03c0c35b878134f0ad39cf --- /dev/null +++ b/annotations_filtered/f20aUH5IG9s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.23], [6.0, 6.32], [7.0, 7.43], [8.0, 11.53], [13.0, 14.08], [15.0, 19.36], [22.0, 23.19], [24.0, 25.44], [26.0, 26.11], [28.0, 28.49], [29.0, 32.49], [35.0, 36.17], [40.0, 40.85], [42.0, 42.35], [43.0, 43.39], [46.0, 47.65], [50.0, 50.6], [51.0, 51.27], [53.0, 54.06], [56.0, 57.75], [59.0, 62.83], [64.0, 65.96], [74.0, 73.97], [76.0, 77.52], [79.0, 80.23], [83.0, 82.83], [84.0, 84.92], [89.0, 91.86], [92.0, 96.28], [103.0, 104.45], [115.0, 115.94], [117.0, 117.93], [124.0, 124.28], [127.0, 127.68], [130.0, 130.38], [132.0, 133.08], [134.0, 136.83], [139.0, 141.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 96.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.51, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.23, 0.32, 0.43, 3.53, 1.08, 4.36, 1.19, 1.44, 0.11, 0.49, 3.49, 1.17, 0.85, 0.35, 0.39, 1.65, 0.6, 0.27, 1.06, 1.75, 3.83, 1.96, -0.03, 1.52, 1.23, -0.17, 0.92, 2.86, 4.28, 1.45, 0.94, 0.93, 0.28, 0.68, 0.38, 1.08, 2.83, 2.07]} \ No newline at end of file diff --git a/annotations_filtered/f2FzrfnfQPY_filtered.json b/annotations_filtered/f2FzrfnfQPY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e5be64a0c96034bab94ed0b1c3fac0b74580cb1 --- /dev/null +++ b/annotations_filtered/f2FzrfnfQPY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.55], [10.0, 11.21], [13.0, 13.8], [16.0, 17.46], [20.0, 21.95], [25.0, 25.14], [26.0, 26.25], [32.0, 31.95], [33.0, 33.54], [36.0, 37.32], [38.0, 38.52], [42.0, 42.74], [44.0, 45.96], [47.0, 48.9], [54.0, 54.8], [64.0, 65.43], [76.0, 79.15], [81.0, 84.2], [86.0, 88.03], [95.0, 106.95], [112.0, 112.24], [114.0, 116.16], [118.0, 121.17], [124.0, 128.17], [133.0, 135.38], [137.0, 139.04], [145.0, 146.4], [149.0, 150.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, true, true, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.31, 31.92, 38.16, 29.65, 0.0, 29.59, 32.8, 46.33, 28.92, 40.75, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 39.92], ["mains hum", 29.22], ["fly, housefly", 7.01]], [["whack, thwack", 14.03], ["vehicle", 10.43], ["car", 8.64]], [["throbbing", 24.06], ["music", 23.79], ["hum", 19.79]], [["music", 35.49], ["hum", 12.77], ["mains hum", 8.48]], null, [["music", 63.44], ["theremin", 4.51], ["sound effect", 3.46]], [["music", 25.91], ["hum", 10.22], ["pulse", 6.58]], [["music", 33.48], ["hum", 16.28], ["throbbing", 7.46]], [["music", 54.86], ["musical instrument", 3.91], ["whale vocalization", 3.62]], [["speech", 32.0], ["hum", 16.13], ["music", 15.54]], null, null], "duration": [1.55, 1.21, 0.8, 1.46, 1.95, 0.14, 0.25, -0.05, 0.54, 1.32, 0.52, 0.74, 1.96, 1.9, 0.8, 1.43, 3.15, 3.2, 2.03, 11.95, 0.24, 2.16, 3.17, 4.17, 2.38, 2.04, 1.4, 1.43]} \ No newline at end of file diff --git a/annotations_filtered/f2Hz2k2PcfI_filtered.json b/annotations_filtered/f2Hz2k2PcfI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27a3e49abaaaa6d267ea25144b61e9f3c77ad14c --- /dev/null +++ b/annotations_filtered/f2Hz2k2PcfI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 29.66], [30.0, 32.16], [35.0, 38.03], [39.0, 40.88], [61.0, 62.55], [64.0, 64.71], [74.0, 75.07], [81.0, 81.84], [84.0, 86.04], [90.0, 90.46], [96.0, 97.34], [99.0, 100.41], [102.0, 102.3], [116.0, 117.86], [119.0, 120.19], [121.0, 122.52], [123.0, 123.57], [125.0, 125.07], [136.0, 136.76], [143.0, 143.45], [145.0, 148.63], [150.0, 151.55], [153.0, 154.75], [159.0, 159.71], [164.0, 167.88], [170.0, 170.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.07, 87.37, 71.72, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.39, 0.0, 0.0, 0.0, 95.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [11.66, 2.16, 3.03, 1.88, 1.55, 0.71, 1.07, 0.84, 2.04, 0.46, 1.34, 1.41, 0.3, 1.86, 1.19, 1.52, 0.57, 0.07, 0.76, 0.45, 3.63, 1.55, 1.75, 0.71, 3.88, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/f2SskRLd4F4_filtered.json b/annotations_filtered/f2SskRLd4F4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f0219a3586ab0d865dd5fe2271b6799c2593b48 --- /dev/null +++ b/annotations_filtered/f2SskRLd4F4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.88], [18.0, 34.16], [35.0, 39.88], [41.0, 59.73], [60.0, 62.36], [64.0, 66.38], [68.0, 76.47], [79.0, 95.45]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 59.51, 99.96, 78.55, 99.99, 99.96, 90.08, 46.68], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 69.23], ["theremin", 7.42], ["musical instrument", 4.28]]], "duration": [0.88, 16.16, 4.88, 18.73, 2.36, 2.38, 8.47, 16.45]} \ No newline at end of file diff --git a/annotations_filtered/f2c-tMZSZtY_filtered.json b/annotations_filtered/f2c-tMZSZtY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..663b90c95be36d34ca807f46f1f79543707d7475 --- /dev/null +++ b/annotations_filtered/f2c-tMZSZtY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 34.05], [34.0, 42.7], [49.0, 50.97], [58.0, 59.04], [60.0, 60.17], [63.0, 64.47], [66.0, 66.77], [73.0, 78.88], [81.0, 83.02], [86.0, 89.48], [97.0, 97.31], [97.0, 97.92], [98.0, 98.91], [99.0, 98.96], [100.0, 102.22], [113.0, 113.8], [119.0, 122.44], [123.0, 154.28]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, true, false], "silence_prob": [58.81, 43.05, 0.0, 0.0, 0.0, 0.0, 0.0, 41.66, 53.22, 45.88, 0.0, 0.0, 0.0, 0.0, 58.47, 0.0, 33.06, 0.0], "audiomae_on_audioset": [null, [["speech", 60.01], ["music", 10.89], ["electric shaver, electric razor", 4.18]], null, null, null, null, null, [["music", 52.11], ["hum", 6.59], ["throbbing", 4.05]], null, [["music", 18.22], ["moo", 16.91], ["cattle, bovinae", 16.21]], null, null, null, null, null, null, [["music", 36.73], ["speech", 22.46], ["animal", 2.85]], null], "duration": [3.05, 8.7, 1.97, 1.04, 0.17, 1.47, 0.77, 5.88, 2.02, 3.48, 0.31, 0.92, 0.91, -0.04, 2.22, 0.8, 3.44, 31.28]} \ No newline at end of file diff --git a/annotations_filtered/f2ugRkVMOuE_filtered.json b/annotations_filtered/f2ugRkVMOuE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..efc1077179f3161a173c2e3dbd089cad589ecdd4 --- /dev/null +++ b/annotations_filtered/f2ugRkVMOuE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.79], [7.0, 7.45], [8.0, 9.81], [13.0, 15.36], [17.0, 17.05], [18.0, 20.19], [22.0, 22.92], [23.0, 24.27], [26.0, 27.08], [30.0, 30.28], [35.0, 35.36], [36.0, 40.31], [44.0, 49.32], [50.0, 59.8], [60.0, 61.28], [64.0, 64.08], [64.0, 66.19], [67.0, 68.66], [73.0, 80.28], [82.0, 82.19], [87.0, 93.36], [104.0, 110.1], [112.0, 115.48], [120.0, 122.96], [126.0, 126.91], [128.0, 128.58]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 40.93, 0.0, 59.96, 0.0, 0.0, 0.0, 0.0, 0.0, 75.55, 60.14, 42.42, 0.0, 0.0, 37.61, 0.0, 34.51, 0.0, 33.7, 34.76, 39.82, 37.89, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 34.65], ["animal", 10.3], ["whimper", 4.86]], null, null, null, null, null, null, null, null, null, [["music", 54.68], ["speech", 14.95], ["wind instrument, woodwind instrument", 7.27]], null, null, [["music", 78.02], ["musical instrument", 3.58], ["guitar", 1.29]], null, [["music", 72.24], ["singing", 2.81], ["musical instrument", 2.21]], null, [["music", 66.72], ["musical instrument", 6.11], ["guitar", 5.36]], [["music", 70.44], ["music of bollywood", 6.5], ["singing", 3.32]], [["music", 75.66], ["speech", 4.04], ["bleat", 1.1]], [["music", 35.62], ["sidetone", 26.31], ["speech", 12.79]], null, null], "duration": [0.79, 0.45, 1.81, 2.36, 0.05, 2.19, 0.92, 1.27, 1.08, 0.28, 0.36, 4.31, 5.32, 9.8, 1.28, 0.08, 2.19, 1.66, 7.28, 0.19, 6.36, 6.1, 3.48, 2.96, 0.91, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/f39I-UCl9Qo_filtered.json b/annotations_filtered/f39I-UCl9Qo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3ee4505b1b03b845d503cadca08a462e03ecb1e --- /dev/null +++ b/annotations_filtered/f39I-UCl9Qo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.74], [4.0, 4.7], [6.0, 6.59], [7.0, 8.99], [10.0, 10.67], [11.0, 11.62], [13.0, 36.9], [38.0, 39.77], [42.0, 47.83], [49.0, 54.65], [56.0, 59.76], [61.0, 62.19], [64.0, 64.71], [65.0, 66.82], [67.0, 70.98], [72.0, 77.11], [78.0, 88.52], [89.0, 90.58], [91.0, 94.46], [96.0, 99.72], [103.0, 119.67], [122.0, 128.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 100.0, 99.84, 94.95, 0.0, 0.0, 0.0, 100.0, 99.98, 100.0, 0.0, 93.91, 94.07, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.74, 0.7, 0.59, 1.99, 0.67, 0.62, 23.9, 1.77, 5.83, 5.65, 3.76, 1.19, 0.71, 1.82, 3.98, 5.11, 10.52, 1.58, 3.46, 3.72, 16.67, 6.43]} \ No newline at end of file diff --git a/annotations_filtered/f3XcExCD3HM_filtered.json b/annotations_filtered/f3XcExCD3HM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b260c07faed965d2ee9e136fc274a6fbcf3b759 --- /dev/null +++ b/annotations_filtered/f3XcExCD3HM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.09], [15.0, 15.69], [17.0, 17.98], [19.0, 20.19], [21.0, 22.25], [30.0, 30.42], [35.0, 36.64], [40.0, 40.04], [43.0, 43.06], [47.0, 48.54], [54.0, 53.97], [55.0, 55.26], [57.0, 57.92], [59.0, 60.56], [62.0, 64.0], [65.0, 66.43], [67.0, 68.44], [71.0, 71.2], [73.0, 73.95], [75.0, 75.41], [79.0, 80.37], [85.0, 86.36], [89.0, 90.83], [98.0, 99.49], [100.0, 100.18], [105.0, 105.93], [107.0, 108.41], [113.0, 114.39], [117.0, 125.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.11], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.09, 0.69, 0.98, 1.19, 1.25, 0.42, 1.64, 0.04, 0.06, 1.54, -0.03, 0.26, 0.92, 1.56, 2.0, 1.43, 1.44, 0.2, 0.95, 0.41, 1.37, 1.36, 1.83, 1.49, 0.18, 0.93, 1.41, 1.39, 8.29]} \ No newline at end of file diff --git a/annotations_filtered/f3tseBsU248_filtered.json b/annotations_filtered/f3tseBsU248_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f85a5cab701b4988fa095d3ec3fca474d30786e5 --- /dev/null +++ b/annotations_filtered/f3tseBsU248_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.48], [29.0, 28.58], [52.0, 52.15], [55.0, 55.19], [55.0, 55.83], [56.0, 56.29], [57.0, 58.24], [61.0, 62.6], [63.0, 63.32], [70.0, 70.04], [75.0, 77.11], [83.0, 84.13], [85.0, 85.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, -0.42, 0.15, 0.19, 0.83, 0.29, 1.24, 1.6, 0.32, 0.04, 2.11, 1.13, 0.02]} \ No newline at end of file diff --git a/annotations_filtered/f3u4j0hVy8c_filtered.json b/annotations_filtered/f3u4j0hVy8c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb745f87ccc08b2ac4f514560848bc5ff721e5fd --- /dev/null +++ b/annotations_filtered/f3u4j0hVy8c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 20.39], [24.0, 42.15], [43.0, 43.73], [44.0, 50.67], [54.0, 54.41], [56.0, 61.38], [64.0, 64.45], [67.0, 67.95], [69.0, 69.33], [71.0, 72.81], [77.0, 78.16], [82.0, 82.68], [84.0, 85.43], [86.0, 86.85], [94.0, 95.86], [98.0, 100.25], [105.0, 106.54], [109.0, 109.86], [112.0, 112.18], [113.0, 113.81], [116.0, 115.79], [116.0, 117.61], [119.0, 120.85], [121.0, 120.93], [121.0, 121.37], [123.0, 123.26], [124.0, 124.48], [127.0, 128.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.72, 45.95, 0.0, 41.07, 0.0, 38.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 65.35], ["didgeridoo", 15.72], ["musical instrument", 3.14]], [["music", 71.26], ["speech", 5.87], ["theremin", 3.15]], null, [["music", 84.93], ["didgeridoo", 7.01], ["musical instrument", 2.44]], null, [["music", 75.91], ["didgeridoo", 6.86], ["theremin", 3.02]], null, null, null, null, null, null, null, null, null, [["whale vocalization", 43.29], ["speech", 18.93], ["music", 11.09]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [15.39, 18.15, 0.73, 6.67, 0.41, 5.38, 0.45, 0.95, 0.33, 1.81, 1.16, 0.68, 1.43, 0.85, 1.86, 2.25, 1.54, 0.86, 0.18, 0.81, -0.21, 1.61, 1.85, -0.07, 0.37, 0.26, 0.48, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/f48wH7l3c5I_filtered.json b/annotations_filtered/f48wH7l3c5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed4203b0a78f9e1ff0a18aa2697a42c95ef8d625 --- /dev/null +++ b/annotations_filtered/f48wH7l3c5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.49], [10.0, 11.08], [13.0, 14.71], [15.0, 18.13], [21.0, 21.63], [29.0, 30.2], [35.0, 35.16], [36.0, 38.18], [39.0, 45.28], [47.0, 57.3], [70.0, 74.75], [78.0, 79.05], [86.0, 90.24], [102.0, 104.18], [106.0, 108.78], [111.0, 116.29]], "keep_status": [false, false, false, false, false, false, false, true, true, false, true, false, true, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 33.39, 0.0, 0.0, 0.0, 30.11, 29.98, 30.67, 31.7, 0.0, 29.76, 32.77, 31.54, 30.76], "audiomae_on_audioset": [null, null, null, [["hum", 27.8], ["mains hum", 23.14], ["speech", 21.49]], null, null, null, [["hum", 19.99], ["mains hum", 10.55], ["sound effect", 9.36]], [["music", 20.18], ["vehicle", 14.5], ["hum", 12.35]], [["music", 60.04], ["synthesizer", 8.21], ["musical instrument", 6.06]], [["music", 45.83], ["hum", 12.53], ["throbbing", 8.43]], null, [["whale vocalization", 19.34], ["sound effect", 11.69], ["echo", 7.1]], [["music", 11.4], ["whale vocalization", 10.92], ["synthesizer", 7.71]], [["buzz", 23.65], ["mains hum", 17.67], ["hum", 11.27]], [["hum", 23.27], ["mains hum", 16.05], ["breaking", 14.76]]], "duration": [1.49, 1.08, 1.71, 3.13, 0.63, 1.2, 0.16, 2.18, 6.28, 10.3, 4.75, 1.05, 4.24, 2.18, 2.78, 5.29]} \ No newline at end of file diff --git a/annotations_filtered/f4LEgmt0roE_filtered.json b/annotations_filtered/f4LEgmt0roE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6971f69435405ce0cbe2dee87e7129b36aeb9d54 --- /dev/null +++ b/annotations_filtered/f4LEgmt0roE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.86], [18.0, 18.15], [22.0, 22.67], [79.0, 79.25], [88.0, 90.15], [95.0, 94.96], [99.0, 99.71], [106.0, 107.76], [108.0, 108.75]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.86, 0.15, 0.67, 0.25, 2.15, -0.04, 0.71, 1.76, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/f4M5MT96FwY_filtered.json b/annotations_filtered/f4M5MT96FwY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63c4129bb95a70029877c4418a0e5c6b8e8a8c3f --- /dev/null +++ b/annotations_filtered/f4M5MT96FwY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.44], [13.0, 13.73], [15.0, 22.2], [34.0, 35.97]], "keep_status": [false, false, true, false], "silence_prob": [0.0, 0.0, 32.51, 0.0], "audiomae_on_audioset": [null, null, [["music", 27.79], ["hum", 23.02], ["mains hum", 10.1]], null], "duration": [0.44, 0.73, 7.2, 1.97]} \ No newline at end of file diff --git a/annotations_filtered/f4gmgTebHog_filtered.json b/annotations_filtered/f4gmgTebHog_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ecc79f3b3a0686f5f2e17d7b3378155362bedf38 --- /dev/null +++ b/annotations_filtered/f4gmgTebHog_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.94], [6.0, 6.96], [9.0, 25.51], [26.0, 64.93], [69.0, 71.09], [72.0, 74.53], [77.0, 78.68], [80.0, 87.57], [88.0, 89.04], [90.0, 94.95], [99.0, 140.54], [141.0, 155.22], [158.0, 158.57], [162.0, 161.99], [163.0, 164.62], [168.0, 169.67], [174.0, 175.41], [179.0, 180.76], [182.0, 182.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.9, 0.0, 75.23, 55.81, 0.0, 40.31, 0.0, 34.39, 0.0, 30.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 57.35], ["hum", 9.54], ["sonar", 6.95]], null, null, null, null, [["music", 65.75], ["hum", 8.59], ["throbbing", 4.94]], null, [["music", 73.53], ["musical instrument", 6.1], ["guitar", 2.16]], null, [["music", 80.6], ["theremin", 5.71], ["scary music", 2.48]], null, null, null, null, null, null, null], "duration": [0.94, 0.96, 16.51, 38.93, 2.09, 2.53, 1.68, 7.57, 1.04, 4.95, 41.54, 14.22, 0.57, -0.01, 1.62, 1.67, 1.41, 1.76, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/f4ojzsvQhh0_filtered.json b/annotations_filtered/f4ojzsvQhh0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2cbbad2a9a42f8548743c04a2b049f5efd1dc824 --- /dev/null +++ b/annotations_filtered/f4ojzsvQhh0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.97], [11.0, 12.18], [13.0, 13.17], [13.0, 21.95], [24.0, 23.72], [28.0, 30.08], [35.0, 36.53], [42.0, 44.14], [46.0, 47.09], [50.0, 51.8], [55.0, 58.35], [59.0, 61.32], [62.0, 63.36], [66.0, 67.85], [70.0, 72.72]], "keep_status": [false, false, false, true, false, true, false, true, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.05, 0.0, 40.71, 0.0, 37.17, 0.0, 0.0, 37.57, 39.96, 0.0, 0.0, 33.1], "audiomae_on_audioset": [null, null, null, [["whale vocalization", 44.11], ["noise", 14.32], ["throbbing", 6.48]], null, [["hum", 28.59], ["mains hum", 21.8], ["music", 8.83]], null, [["hum", 33.3], ["mains hum", 12.71], ["whale vocalization", 5.35]], null, null, [["music", 22.52], ["hum", 16.29], ["rumble", 11.1]], [["hum", 35.51], ["mains hum", 13.57], ["music", 10.6]], null, null, [["speech", 55.74], ["sidetone", 26.44], ["whale vocalization", 5.12]]], "duration": [0.97, 1.18, 0.17, 8.95, -0.28, 2.08, 1.53, 2.14, 1.09, 1.8, 3.35, 2.32, 1.36, 1.85, 2.72]} \ No newline at end of file diff --git a/annotations_filtered/f4wQCy4xIyY_filtered.json b/annotations_filtered/f4wQCy4xIyY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4c2e12101604cda041278959079082225d400b4 --- /dev/null +++ b/annotations_filtered/f4wQCy4xIyY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.24], [13.0, 18.15], [19.0, 19.55], [21.0, 20.93], [22.0, 22.35], [23.0, 35.67], [36.0, 37.5], [39.0, 103.57], [105.0, 113.14], [115.0, 128.44]], "keep_status": [true, false, false, false, false, true, false, false, true, true], "silence_prob": [39.0, 51.55, 0.0, 0.0, 0.0, 32.94, 0.0, 0.0, 30.39, 31.29], "audiomae_on_audioset": [[["hum", 14.98], ["music", 9.65], ["mains hum", 4.86]], null, null, null, null, [["whack, thwack", 45.92], ["quack", 8.91], ["speech", 8.16]], null, null, [["music", 44.07], ["electronic music", 13.89], ["synthesizer", 8.07]], [["music", 39.16], ["synthesizer", 9.99], ["car", 7.34]]], "duration": [2.24, 5.15, 0.55, -0.07, 0.35, 12.67, 1.5, 64.57, 8.14, 13.44]} \ No newline at end of file diff --git a/annotations_filtered/f4wmj-Nq9xA_filtered.json b/annotations_filtered/f4wmj-Nq9xA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba272ed2de4d8fdd257da8624ed29b16d7f2c4f1 --- /dev/null +++ b/annotations_filtered/f4wmj-Nq9xA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.26], [13.0, 13.44], [23.0, 22.79], [51.0, 51.49], [66.0, 66.77], [69.0, 69.72], [73.0, 75.57], [77.0, 78.44]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.3, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.26, 0.44, -0.21, 0.49, 0.77, 0.72, 2.57, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/f4zl3CuJvt8_filtered.json b/annotations_filtered/f4zl3CuJvt8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bffe0baef51abfca66005f3f409a613a9a5e1e0f --- /dev/null +++ b/annotations_filtered/f4zl3CuJvt8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.84], [9.0, 41.89], [43.0, 44.07], [49.0, 53.27], [54.0, 73.11], [75.0, 83.93], [86.0, 89.02], [90.0, 92.04], [93.0, 98.49], [102.0, 108.31], [111.0, 111.05], [112.0, 112.53], [126.0, 137.17], [139.0, 139.29], [140.0, 144.24], [146.0, 147.41], [148.0, 150.18], [152.0, 166.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.6, 30.81, 58.13, 99.36, 89.19, 79.07, 36.88, 0.0, 0.0, 31.9, 0.0, 72.75, 0.0, 90.08, 32.37], "audiomae_on_audioset": [null, null, null, [["music", 30.72], ["throbbing", 21.43], ["hum", 20.26]], [["cattle, bovinae", 34.71], ["livestock, farm animals, working animals", 23.24], ["moo", 20.93]], null, null, null, null, [["music", 70.31], ["hum", 4.57], ["synthesizer", 4.0]], null, null, [["music", 63.22], ["didgeridoo", 6.42], ["synthesizer", 4.16]], null, null, null, null, [["music", 66.84], ["didgeridoo", 4.72], ["musical instrument", 3.75]]], "duration": [-0.16, 32.89, 1.07, 4.27, 19.11, 8.93, 3.02, 2.04, 5.49, 6.31, 0.05, 0.53, 11.17, 0.29, 4.24, 1.41, 2.18, 14.87]} \ No newline at end of file diff --git a/annotations_filtered/f505OHOUHoU_filtered.json b/annotations_filtered/f505OHOUHoU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7c75e1b8ee4008940750668568dd924a12e2790 --- /dev/null +++ b/annotations_filtered/f505OHOUHoU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[97.0, 101.71], [107.0, 113.88], [116.0, 117.27], [119.0, 124.16], [126.0, 127.52]], "keep_status": [true, true, false, true, false], "silence_prob": [43.61, 45.05, 0.0, 38.15, 0.0], "audiomae_on_audioset": [[["music", 29.75], ["didgeridoo", 14.16], ["hum", 10.71]], [["music", 23.03], ["hum", 15.28], ["whale vocalization", 10.38]], null, [["music", 44.99], ["sonar", 7.4], ["electronic music", 6.32]], null], "duration": [4.71, 6.88, 1.27, 5.16, 1.52]} \ No newline at end of file diff --git a/annotations_filtered/f57Vat6YZUI_filtered.json b/annotations_filtered/f57Vat6YZUI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76f33ab3fc0642dad02d20080acd9387a4aca03a --- /dev/null +++ b/annotations_filtered/f57Vat6YZUI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.57], [8.0, 9.15], [12.0, 13.76], [18.0, 18.82], [22.0, 24.71], [26.0, 26.43], [31.0, 31.67], [44.0, 52.08], [54.0, 62.4], [64.0, 87.49], [92.0, 96.55], [99.0, 107.64], [108.0, 120.45], [124.0, 145.62], [147.0, 148.91]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 39.47, 0.0, 0.0, 32.99, 32.11, 32.18, 31.72, 31.8, 31.43, 30.86, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 31.73], ["hum", 20.46], ["mains hum", 17.22]], null, null, [["music", 42.8], ["hum", 25.81], ["throbbing", 16.19]], [["music", 81.6], ["singing", 0.98], ["music of bollywood", 0.9]], [["music", 80.16], ["throbbing", 3.88], ["hum", 2.89]], [["music", 58.77], ["throbbing", 5.17], ["hum", 4.6]], [["music", 46.69], ["hum", 11.18], ["mains hum", 7.27]], [["music", 64.44], ["hum", 9.92], ["throbbing", 8.0]], [["music", 87.48], ["musical instrument", 0.98], ["carnatic music", 0.73]], null], "duration": [1.57, 1.15, 1.76, 0.82, 2.71, 0.43, 0.67, 8.08, 8.4, 23.49, 4.55, 8.64, 12.45, 21.62, 1.91]} \ No newline at end of file diff --git a/annotations_filtered/f58Ba78abHg_filtered.json b/annotations_filtered/f58Ba78abHg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8fdf20f6507bd047e4e48cb80849fcaa09daa573 --- /dev/null +++ b/annotations_filtered/f58Ba78abHg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.98], [6.0, 7.59], [9.0, 9.26], [15.0, 16.97], [19.0, 26.18], [27.0, 28.34], [32.0, 36.71], [38.0, 43.04], [44.0, 45.96], [47.0, 48.9], [50.0, 50.84], [53.0, 54.55], [58.0, 58.72], [59.0, 76.18], [77.0, 78.63]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 50.61, 0.0, 49.0, 58.81, 0.0, 0.0, 0.0, 0.0, 0.0, 32.9, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 24.26], ["gong", 23.41], ["singing bowl", 16.74]], null, null, null, null, null, null, [["music", 49.09], ["synthesizer", 13.45], ["ambient music", 7.68]], null], "duration": [0.98, 1.59, 0.26, 1.97, 7.18, 1.34, 4.71, 5.04, 1.96, 1.9, 0.84, 1.55, 0.72, 17.18, 1.63]} \ No newline at end of file diff --git a/annotations_filtered/f5e73A39TF4_filtered.json b/annotations_filtered/f5e73A39TF4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f963c7575469ce8fd3be51e587364ea73bf4266b --- /dev/null +++ b/annotations_filtered/f5e73A39TF4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.81], [5.0, 5.88], [20.0, 23.33], [26.0, 26.81], [32.0, 33.76], [35.0, 36.12], [40.0, 41.5], [49.0, 50.3], [51.0, 52.41], [57.0, 56.88], [60.0, 60.61], [64.0, 65.92], [74.0, 75.93], [77.0, 79.84], [100.0, 100.97], [106.0, 106.12], [107.0, 107.28], [110.0, 111.42], [115.0, 116.46], [121.0, 123.5], [126.0, 125.91], [129.0, 131.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 0.88, 3.33, 0.81, 1.76, 1.12, 1.5, 1.3, 1.41, -0.12, 0.61, 1.92, 1.93, 2.84, 0.97, 0.12, 0.28, 1.42, 1.46, 2.5, -0.09, 2.41]} \ No newline at end of file diff --git a/annotations_filtered/f5f86alm7jk_filtered.json b/annotations_filtered/f5f86alm7jk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e2f67dbea46d7e26c82beccf6d388c068edbb33 --- /dev/null +++ b/annotations_filtered/f5f86alm7jk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.52], [7.0, 7.25], [9.0, 9.17], [11.0, 11.26], [12.0, 12.77], [15.0, 16.09], [18.0, 18.54], [19.0, 22.23], [26.0, 28.51], [29.0, 33.03], [36.0, 36.54], [39.0, 40.39], [55.0, 56.2], [57.0, 57.94], [59.0, 61.69], [62.0, 63.51], [71.0, 71.52], [80.0, 83.07], [85.0, 85.43], [89.0, 88.7], [104.0, 104.35], [107.0, 107.79], [110.0, 111.03], [114.0, 114.86], [117.0, 117.69], [118.0, 119.75], [122.0, 123.92], [125.0, 126.5], [128.0, 128.78]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.36, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["thunk", 24.79], ["speech", 18.16], ["boing", 16.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.52, 0.25, 0.17, 0.26, 0.77, 1.09, 0.54, 3.23, 2.51, 4.03, 0.54, 1.39, 1.2, 0.94, 2.69, 1.51, 0.52, 3.07, 0.43, -0.3, 0.35, 0.79, 1.03, 0.86, 0.69, 1.75, 1.92, 1.5, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/f5mcMmE3RL8_filtered.json b/annotations_filtered/f5mcMmE3RL8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5bd22f78230817170d9dd52b4c780116dc5cda44 --- /dev/null +++ b/annotations_filtered/f5mcMmE3RL8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 33.71], [35.0, 201.43], [202.0, 210.61], [212.0, 212.75]], "keep_status": [false, false, true, false], "silence_prob": [0.0, 0.0, 41.09, 0.0], "audiomae_on_audioset": [null, null, [["music", 35.85], ["didgeridoo", 20.38], ["mains hum", 6.89]], null], "duration": [30.71, 166.43, 8.61, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/f5umSa_YYX0_filtered.json b/annotations_filtered/f5umSa_YYX0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54808daa7cc950249f83af3b102a0ba21b321b78 --- /dev/null +++ b/annotations_filtered/f5umSa_YYX0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.11], [6.0, 8.01], [12.0, 20.82], [22.0, 27.48], [34.0, 35.38], [46.0, 47.65], [57.0, 57.79], [61.0, 62.34], [82.0, 82.36], [84.0, 90.48], [92.0, 92.75], [93.0, 93.7], [96.0, 97.92], [98.0, 99.54], [100.0, 102.69], [105.0, 106.54], [107.0, 107.6], [108.0, 109.85], [110.0, 110.96], [112.0, 113.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.88, 100.0, 99.93, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.11, 2.01, 8.82, 5.48, 1.38, 1.65, 0.79, 1.34, 0.36, 6.48, 0.75, 0.7, 1.92, 1.54, 2.69, 1.54, 0.6, 1.85, 0.96, 1.8]} \ No newline at end of file diff --git a/annotations_filtered/f6DDYCf80hw_filtered.json b/annotations_filtered/f6DDYCf80hw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5dbd1cc12990ac9a4f1f6e370e662657ea94429 --- /dev/null +++ b/annotations_filtered/f6DDYCf80hw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.23], [14.0, 14.45], [16.0, 17.83], [19.0, 18.84], [21.0, 26.25], [30.0, 30.75], [33.0, 34.3], [36.0, 48.93], [50.0, 54.9], [56.0, 57.97], [59.0, 62.55], [64.0, 65.33], [69.0, 82.44], [84.0, 91.71], [96.0, 114.64], [117.0, 120.07], [124.0, 144.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 70.58, 0.0, 0.0, 78.04, 77.36, 0.0, 74.76, 0.0, 50.76, 42.58, 36.94, 31.15, 38.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 29.71], ["music", 9.21], ["throbbing", 7.89]], [["speech", 49.38], ["music", 18.35], ["beatboxing", 6.0]], [["speech", 30.85], ["music", 11.07], ["didgeridoo", 4.9]], [["speech", 52.62], ["music", 11.98], ["hum", 9.68]]], "duration": [1.23, 0.45, 1.83, -0.16, 5.25, 0.75, 1.3, 12.93, 4.9, 1.97, 3.55, 1.33, 13.44, 7.71, 18.64, 3.07, 20.21]} \ No newline at end of file diff --git a/annotations_filtered/f6Dan7z0p4c_filtered.json b/annotations_filtered/f6Dan7z0p4c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/f6Dan7z0p4c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/f6F6MzMT2g8_filtered.json b/annotations_filtered/f6F6MzMT2g8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00649e2cc13bb03957e77a57ce3d9f145a56c040 --- /dev/null +++ b/annotations_filtered/f6F6MzMT2g8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 12.09], [13.0, 16.93], [18.0, 18.32], [19.0, 21.0], [24.0, 27.57], [28.0, 31.51], [35.0, 34.82], [43.0, 44.64], [46.0, 48.1], [57.0, 63.44], [72.0, 72.12], [74.0, 75.52], [78.0, 78.16], [80.0, 79.96], [82.0, 84.06], [92.0, 91.69], [95.0, 94.95], [96.0, 100.28], [113.0, 113.43], [114.0, 118.67], [120.0, 121.12], [122.0, 123.35], [126.0, 126.2], [130.0, 130.15], [144.0, 144.64]], "keep_status": [true, true, false, true, true, true, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [33.03, 32.04, 0.0, 44.72, 37.2, 38.27, 0.0, 0.0, 35.5, 34.92, 0.0, 0.0, 0.0, 0.0, 35.03, 0.0, 0.0, 32.3, 0.0, 35.62, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 29.26], ["speech", 20.99], ["throbbing", 11.58]], [["music", 43.75], ["speech", 15.22], ["hum", 3.44]], null, [["speech", 20.27], ["music", 14.68], ["fly, housefly", 7.36]], [["music", 19.69], ["foghorn", 18.88], ["speech", 10.07]], [["music", 30.89], ["speech", 26.63], ["radio", 7.85]], null, null, [["music", 55.66], ["speech", 10.33], ["musical instrument", 3.42]], [["music", 63.02], ["throbbing", 5.72], ["noise", 5.58]], null, null, null, null, [["music", 74.66], ["synthesizer", 10.35], ["musical instrument", 4.21]], null, null, [["music", 38.66], ["speech", 17.93], ["hum", 11.79]], null, [["speech", 36.69], ["music", 28.19], ["hum", 9.87]], null, null, null, null, null], "duration": [6.09, 3.93, 0.32, 2.0, 3.57, 3.51, -0.18, 1.64, 2.1, 6.44, 0.12, 1.52, 0.16, -0.04, 2.06, -0.31, -0.05, 4.28, 0.43, 4.67, 1.12, 1.35, 0.2, 0.15, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/f6hhVIV_LPs_filtered.json b/annotations_filtered/f6hhVIV_LPs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8bcb34dc625ddea65e898825b2388cd73b2c36e --- /dev/null +++ b/annotations_filtered/f6hhVIV_LPs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.43], [11.0, 12.28], [14.0, 14.74], [16.0, 16.53], [17.0, 17.25], [20.0, 20.09], [22.0, 21.93], [25.0, 25.32], [26.0, 27.31], [29.0, 29.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [78.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [2.43, 1.28, 0.74, 0.53, 0.25, 0.09, -0.07, 0.32, 1.31, 0.29]} \ No newline at end of file diff --git a/annotations_filtered/f6m4J0AfEOo_filtered.json b/annotations_filtered/f6m4J0AfEOo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd046cde040290d099d94831eddca8cd68dccddd --- /dev/null +++ b/annotations_filtered/f6m4J0AfEOo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.38], [26.0, 28.19], [30.0, 31.73], [32.0, 32.48], [32.0, 32.51], [33.0, 32.54], [33.0, 32.58], [33.0, 32.61], [33.0, 32.64], [33.0, 32.68], [33.0, 32.71], [33.0, 32.75], [33.0, 32.78], [33.0, 32.81], [33.0, 33.24], [33.0, 33.27], [35.0, 36.76], [38.0, 38.23], [41.0, 47.22], [48.0, 48.68], [53.0, 58.33], [59.0, 58.72], [66.0, 72.57], [74.0, 74.56], [78.0, 78.49], [83.0, 83.84], [91.0, 91.62], [93.0, 93.6]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.05, 0.0, 50.61, 0.0, 82.79, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 7.73], ["moo", 6.22], ["vehicle", 5.84]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.59], ["buzz", 6.8], ["musical instrument", 5.8]], null, null, null, null, null, null, null, null, null], "duration": [1.38, 2.19, 1.73, 0.48, 0.51, -0.46, -0.42, -0.39, -0.36, -0.32, -0.29, -0.25, -0.22, -0.19, 0.24, 0.27, 1.76, 0.23, 6.22, 0.68, 5.33, -0.28, 6.57, 0.56, 0.49, 0.84, 0.62, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/f7131IkiSCg_filtered.json b/annotations_filtered/f7131IkiSCg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50bc6739cf6e96f68e3a306a2f5e816bef0e7996 --- /dev/null +++ b/annotations_filtered/f7131IkiSCg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.78], [17.0, 16.82], [17.0, 19.36], [21.0, 21.93], [24.0, 23.97], [28.0, 28.83], [30.0, 33.34], [38.0, 43.58], [45.0, 45.0], [47.0, 48.68], [52.0, 52.54], [53.0, 53.86], [58.0, 59.64], [61.0, 61.74], [63.0, 64.96], [66.0, 68.79], [70.0, 71.73], [72.0, 73.79], [75.0, 76.35], [78.0, 80.52], [83.0, 85.02], [86.0, 85.89], [92.0, 92.89], [118.0, 124.53], [125.0, 124.75], [125.0, 135.84], [139.0, 140.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 65.32, 0.0, 0.0, 81.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.78, -0.18, 2.36, 0.93, -0.03, 0.83, 3.34, 5.58, 0.0, 1.68, 0.54, 0.86, 1.64, 0.74, 1.96, 2.79, 1.73, 1.79, 1.35, 2.52, 2.02, -0.11, 0.89, 6.53, -0.25, 10.84, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/f7l5I6ZPt_Y_filtered.json b/annotations_filtered/f7l5I6ZPt_Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25ea6f117d624d49322552c6b42deaef9d8f3cb1 --- /dev/null +++ b/annotations_filtered/f7l5I6ZPt_Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 44.93], [48.0, 56.34], [59.0, 59.91], [61.0, 62.55], [64.0, 73.94], [75.0, 77.11], [78.0, 85.09], [88.0, 89.65], [91.0, 91.29], [92.0, 92.42], [93.0, 94.83], [96.0, 97.75], [100.0, 100.2], [101.0, 101.63], [103.0, 105.58], [107.0, 108.38], [111.0, 114.12], [115.0, 115.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.48, 0.0, 0.0, 97.22, 74.76, 82.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.79, 0.0, 78.55, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.93, 8.34, 0.91, 1.55, 9.94, 2.11, 7.09, 1.65, 0.29, 0.42, 1.83, 1.75, 0.2, 0.63, 2.58, 1.38, 3.12, 0.86]} \ No newline at end of file diff --git a/annotations_filtered/f7q5ce9Jwgw_filtered.json b/annotations_filtered/f7q5ce9Jwgw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/f7q5ce9Jwgw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/f7vRR8-n_Rc_filtered.json b/annotations_filtered/f7vRR8-n_Rc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..654a5a3d8907cfb82a551391f652957d970c378f --- /dev/null +++ b/annotations_filtered/f7vRR8-n_Rc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 16.38], [19.0, 22.62], [23.0, 23.72], [30.0, 32.0], [43.0, 42.92], [44.0, 51.8], [58.0, 59.95], [78.0, 78.68], [81.0, 86.44], [87.0, 86.9], [87.0, 89.94], [96.0, 97.68], [105.0, 105.38], [109.0, 109.17], [117.0, 120.01]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [29.88, 29.3, 0.0, 30.86, 0.0, 29.47, 0.0, 0.0, 29.88, 0.0, 30.11, 0.0, 0.0, 0.0, 29.7], "audiomae_on_audioset": [[["music", 60.41], ["electronic music", 7.9], ["sidetone", 4.01]], [["cattle, bovinae", 42.68], ["moo", 30.86], ["livestock, farm animals, working animals", 17.99]], null, [["music", 26.83], ["hum", 16.44], ["throbbing", 13.51]], null, [["music", 60.69], ["speech", 6.7], ["siren", 3.17]], null, null, [["boing", 46.42], ["music", 36.43], ["speech", 3.07]], null, [["music", 62.3], ["video game music", 5.78], ["clarinet", 2.47]], null, null, null, [["music", 40.47], ["speech", 19.38], ["boom", 8.96]]], "duration": [7.38, 3.62, 0.72, 2.0, -0.08, 7.8, 1.95, 0.68, 5.44, -0.1, 2.94, 1.68, 0.38, 0.17, 3.01]} \ No newline at end of file diff --git a/annotations_filtered/f8-6UgJ6dSo_filtered.json b/annotations_filtered/f8-6UgJ6dSo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de342df75d9ccead19319dbdaff5be0cb87a1734 --- /dev/null +++ b/annotations_filtered/f8-6UgJ6dSo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.28], [1.0, 0.78], [2.0, 3.45], [5.0, 6.64], [10.0, 10.61], [11.0, 11.42], [12.0, 13.88], [14.0, 15.28], [17.0, 17.86], [20.0, 20.48], [25.0, 25.47], [27.0, 27.84], [28.0, 29.07], [30.0, 30.32], [32.0, 34.6], [35.0, 35.6], [38.0, 38.87], [39.0, 40.36], [42.0, 43.16], [44.0, 44.86], [46.0, 47.09], [49.0, 49.2], [52.0, 54.24], [55.0, 58.73], [59.0, 63.19], [64.0, 65.69], [66.0, 69.3], [69.0, 69.33], [70.0, 69.89], [71.0, 72.05], [74.0, 76.84], [78.0, 78.78], [80.0, 80.43], [81.0, 82.59], [83.0, 84.28], [85.0, 85.8], [86.0, 87.39], [92.0, 92.57], [98.0, 99.23], [100.0, 100.89], [101.0, 102.66], [103.0, 103.52], [104.0, 108.45], [110.0, 121.15], [123.0, 124.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.98, 98.1, 0.0, 65.32, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.28, -0.22, 1.45, 1.64, 0.61, 0.42, 1.88, 1.28, 0.86, 0.48, 0.47, 0.84, 1.07, 0.32, 2.6, 0.6, 0.87, 1.36, 1.16, 0.86, 1.09, 0.2, 2.24, 3.73, 4.19, 1.69, 3.3, 0.33, -0.11, 1.05, 2.84, 0.78, 0.43, 1.59, 1.28, 0.8, 1.39, 0.57, 1.23, 0.89, 1.66, 0.52, 4.45, 11.15, 1.68]} \ No newline at end of file diff --git a/annotations_filtered/f86_fLGHu6M_filtered.json b/annotations_filtered/f86_fLGHu6M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..814d31f90c8cb72d23dab44744705340be017312 --- /dev/null +++ b/annotations_filtered/f86_fLGHu6M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.57], [4.0, 5.0], [8.0, 12.46], [13.0, 12.99], [21.0, 21.86], [27.0, 27.97], [36.0, 36.15], [40.0, 40.09], [50.0, 50.8], [53.0, 53.77], [55.0, 55.26], [60.0, 61.16], [62.0, 63.41], [65.0, 66.02], [71.0, 71.91], [73.0, 74.75], [78.0, 79.29], [87.0, 87.37], [89.0, 95.39], [97.0, 100.63], [101.0, 102.12], [110.0, 110.03], [112.0, 116.28], [119.0, 120.29], [130.0, 131.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 52.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 99.98, 0.0, 0.0, 82.43, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.57, 1.0, 4.46, -0.01, 0.86, 0.97, 0.15, 0.09, 0.8, 0.77, 0.26, 1.16, 1.41, 1.02, 0.91, 1.75, 1.29, 0.37, 6.39, 3.63, 1.12, 0.03, 4.28, 1.29, 1.43]} \ No newline at end of file diff --git a/annotations_filtered/f890SC1schE_filtered.json b/annotations_filtered/f890SC1schE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e376faecd8055ccb7a0b61b7e4ff0c87bc5a758c --- /dev/null +++ b/annotations_filtered/f890SC1schE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.97], [7.0, 42.85], [45.0, 46.41], [50.0, 63.17], [65.0, 74.04]], "keep_status": [false, false, false, true, false], "silence_prob": [98.51, 0.0, 0.0, 30.87, 70.58], "audiomae_on_audioset": [null, null, null, [["vehicle", 16.04], ["motorcycle", 11.6], ["speech", 5.72]], null], "duration": [2.97, 35.85, 1.41, 13.17, 9.04]} \ No newline at end of file diff --git a/annotations_filtered/f8Cjlv6nBTg_filtered.json b/annotations_filtered/f8Cjlv6nBTg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07791f4e4b83469b0a8bb0b3545ecc5d68859d6b --- /dev/null +++ b/annotations_filtered/f8Cjlv6nBTg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 26.91], [36.0, 36.05], [46.0, 50.14], [53.0, 56.59], [61.0, 64.37], [69.0, 75.51], [79.0, 86.16], [98.0, 99.01], [103.0, 105.17], [107.0, 107.03], [108.0, 108.82], [110.0, 111.75], [115.0, 116.41], [117.0, 120.01], [121.0, 122.15], [124.0, 125.27]], "keep_status": [true, false, true, true, true, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [37.96, 0.0, 33.0, 45.85, 32.34, 32.77, 34.37, 0.0, 68.02, 0.0, 0.0, 0.0, 0.0, 92.48, 0.0, 0.0], "audiomae_on_audioset": [[["fart", 29.02], ["music", 23.76], ["speech", 12.42]], null, [["speech", 38.77], ["music", 16.92], ["didgeridoo", 10.74]], [["music", 22.75], ["speech", 14.39], ["didgeridoo", 11.51]], [["cattle, bovinae", 32.94], ["moo", 21.2], ["livestock, farm animals, working animals", 14.1]], [["speech", 24.16], ["music", 18.75], ["sidetone", 4.86]], [["speech", 31.96], ["music", 15.6], ["fart", 6.09]], null, null, null, null, null, null, null, null, null], "duration": [4.91, 0.05, 4.14, 3.59, 3.37, 6.51, 7.16, 1.01, 2.17, 0.03, 0.82, 1.75, 1.41, 3.01, 1.15, 1.27]} \ No newline at end of file diff --git a/annotations_filtered/f8P51JbIp9g_filtered.json b/annotations_filtered/f8P51JbIp9g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eda4d559fe70cbc8cde790417ae16f26797ebf1d --- /dev/null +++ b/annotations_filtered/f8P51JbIp9g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.28], [19.0, 75.42], [75.0, 75.96]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.28, 56.42, 0.96]} \ No newline at end of file diff --git a/annotations_filtered/f8_4uckfT8I_filtered.json b/annotations_filtered/f8_4uckfT8I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bbeae33f418850c047bbe1c843a0643b1bc7252b --- /dev/null +++ b/annotations_filtered/f8_4uckfT8I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.0], [4.0, 5.81], [14.0, 15.04], [20.0, 20.82], [29.0, 30.91], [34.0, 35.68], [37.0, 38.8], [40.0, 41.72], [43.0, 43.8], [49.0, 50.4], [51.0, 53.27], [55.0, 55.54], [56.0, 58.92], [63.0, 64.42], [67.0, 70.26], [72.0, 73.9], [77.0, 77.73], [81.0, 82.93], [83.0, 84.48], [86.0, 88.89], [92.0, 94.73], [96.0, 97.61], [99.0, 100.99], [104.0, 105.53], [106.0, 110.47], [111.0, 112.94], [117.0, 118.62], [119.0, 119.74], [122.0, 123.26], [127.0, 127.62], [131.0, 131.33], [133.0, 135.06], [138.0, 138.99], [144.0, 146.08], [147.0, 149.67], [152.0, 154.06], [156.0, 157.86], [162.0, 163.76], [165.0, 165.28], [167.0, 167.64], [169.0, 172.08], [173.0, 173.94], [175.0, 175.9], [177.0, 183.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [63.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.5, 0.0, 75.88, 0.0, 85.72, 0.0, 0.0, 0.0, 0.0, 56.55, 97.54, 0.0, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.56, 0.0, 59.96, 47.94, 99.97, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 0.0, 73.82], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 32.97], ["frog", 27.15], ["croak", 8.06]], null, null, null, null, null, null, null, null, null], "duration": [2.0, 1.81, 1.04, 0.82, 1.91, 1.68, 1.8, 1.72, 0.8, 1.4, 2.27, 0.54, 2.92, 1.42, 3.26, 1.9, 0.73, 1.93, 1.48, 2.89, 2.73, 1.61, 1.99, 1.53, 4.47, 1.94, 1.62, 0.74, 1.26, 0.62, 0.33, 2.06, 0.99, 2.08, 2.67, 2.06, 1.86, 1.76, 0.28, 0.64, 3.08, 0.94, 0.9, 6.24]} \ No newline at end of file diff --git a/annotations_filtered/f8a97iauRtw_filtered.json b/annotations_filtered/f8a97iauRtw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b83a533365787c26ebdda216231682a52a932d19 --- /dev/null +++ b/annotations_filtered/f8a97iauRtw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.88], [7.0, 7.15], [8.0, 11.85], [12.0, 14.99], [16.0, 16.56], [17.0, 18.89], [21.0, 21.93], [24.0, 24.44], [25.0, 26.64], [28.0, 28.53], [30.0, 46.82], [48.0, 48.69], [49.0, 50.43], [52.0, 68.55], [70.0, 70.12], [73.0, 87.78], [89.0, 91.35], [92.0, 92.65], [94.0, 95.35], [97.0, 97.88], [99.0, 99.08], [100.0, 100.82], [104.0, 104.7], [106.0, 106.74], [110.0, 112.41], [113.0, 115.2], [116.0, 116.48], [118.0, 118.72], [120.0, 120.01], [123.0, 124.97], [126.0, 127.77], [129.0, 145.56], [147.0, 146.94], [154.0, 154.11], [155.0, 155.97], [157.0, 157.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [57.17, 0.0, 98.01, 90.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.13, 0.0, 0.0, 60.89, 0.0, 98.51, 96.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.16, 97.33, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.88, 0.15, 3.85, 2.99, 0.56, 1.89, 0.93, 0.44, 1.64, 0.53, 16.82, 0.69, 1.43, 16.55, 0.12, 14.78, 2.35, 0.65, 1.35, 0.88, 0.08, 0.82, 0.7, 0.74, 2.41, 2.2, 0.48, 0.72, 0.01, 1.97, 1.77, 16.56, -0.06, 0.11, 0.97, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/f8dkNziRlHg_filtered.json b/annotations_filtered/f8dkNziRlHg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94b5980eb6d5590cd63b881b7251f71b903910c1 --- /dev/null +++ b/annotations_filtered/f8dkNziRlHg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.49], [11.0, 19.74], [20.0, 42.84], [44.0, 43.97], [48.0, 49.35], [51.0, 51.9], [54.0, 55.85], [59.0, 60.05], [60.0, 65.94], [66.0, 72.01], [72.0, 78.0], [81.0, 83.52], [86.0, 87.78], [88.0, 92.45], [93.0, 98.66], [99.0, 102.41], [111.0, 111.92], [112.0, 116.01], [117.0, 117.44], [117.0, 118.0], [124.0, 129.19]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, true, false, true, true, true, false, true, false, false, true], "silence_prob": [72.16, 55.74, 36.31, 0.0, 0.0, 0.0, 0.0, 0.0, 41.62, 32.91, 30.21, 44.37, 0.0, 38.25, 40.47, 41.56, 0.0, 36.72, 0.0, 0.0, 42.42], "audiomae_on_audioset": [null, null, [["music", 44.71], ["theremin", 22.98], ["hum", 3.82]], null, null, null, null, null, [["speech", 31.85], ["music", 26.14], ["fart", 7.43]], [["music", 48.82], ["speech", 9.1], ["theremin", 8.51]], [["theremin", 65.6], ["music", 21.11], ["musical instrument", 2.52]], [["music", 36.57], ["didgeridoo", 18.87], ["hum", 7.65]], null, [["music", 37.83], ["didgeridoo", 19.62], ["speech", 6.09]], [["music", 43.94], ["didgeridoo", 9.61], ["theremin", 8.22]], [["music", 62.13], ["brass instrument", 3.78], ["musical instrument", 2.54]], null, [["speech", 26.19], ["music", 21.22], ["foghorn", 12.33]], null, null, [["music", 37.39], ["throbbing", 17.2], ["heart sounds, heartbeat", 9.28]]], "duration": [6.49, 8.74, 22.84, -0.03, 1.35, 0.9, 1.85, 1.05, 5.94, 6.01, 6.0, 2.52, 1.78, 4.45, 5.66, 3.41, 0.92, 4.01, 0.44, 1.0, 5.19]} \ No newline at end of file diff --git a/annotations_filtered/f8znwPYsuFE_filtered.json b/annotations_filtered/f8znwPYsuFE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..05d441d71d7d825351c06992c3d31837ede8516a --- /dev/null +++ b/annotations_filtered/f8znwPYsuFE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 9.86], [12.0, 12.41], [23.0, 24.51], [32.0, 32.81], [35.0, 36.15], [39.0, 41.76], [45.0, 52.59], [53.0, 54.45], [56.0, 57.11], [58.0, 58.19], [60.0, 61.25], [63.0, 64.62], [66.0, 67.44], [68.0, 69.13], [74.0, 75.83], [77.0, 78.6], [80.0, 81.21], [85.0, 85.5], [90.0, 90.42], [103.0, 107.22], [110.0, 111.01]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 40.82, 42.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.79, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 47.66], ["throbbing", 18.98], ["music", 10.81]], [["hum", 27.82], ["speech", 20.12], ["throbbing", 19.85]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 57.21], ["sonar", 5.72], ["synthesizer", 5.0]], null], "duration": [-0.14, 0.41, 1.51, 0.81, 1.15, 2.76, 7.59, 1.45, 1.11, 0.19, 1.25, 1.62, 1.44, 1.13, 1.83, 1.6, 1.21, 0.5, 0.42, 4.22, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/f96ppJ3DSGE_filtered.json b/annotations_filtered/f96ppJ3DSGE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa5330686d4ec74b6fc0f55a541db13f25e77096 --- /dev/null +++ b/annotations_filtered/f96ppJ3DSGE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 53.01], [55.0, 67.66], [72.0, 93.39], [94.0, 143.02], [144.0, 148.09], [149.0, 152.05]], "keep_status": [false, false, true, false, false, false], "silence_prob": [0.0, 39.24, 32.66, 0.0, 81.71, 89.36], "audiomae_on_audioset": [null, [["music", 47.56], ["hum", 21.63], ["mains hum", 11.45]], [["hum", 22.04], ["music", 14.05], ["burping, eructation", 6.51]], null, null, null], "duration": [33.01, 12.66, 21.39, 49.02, 4.09, 3.05]} \ No newline at end of file diff --git a/annotations_filtered/f9Od8yx9gmg_filtered.json b/annotations_filtered/f9Od8yx9gmg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95f657ce81ff9dfa9c340c3b213593178bcf0147 --- /dev/null +++ b/annotations_filtered/f9Od8yx9gmg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 41.59], [44.0, 53.03], [54.0, 80.37], [82.0, 85.83], [88.0, 101.9], [104.0, 125.93], [134.0, 151.36], [154.0, 158.45], [161.0, 166.8], [171.0, 170.67], [173.0, 175.74], [179.0, 180.49], [184.0, 194.17]], "keep_status": [true, false, false, true, false, true, false, true, false, false, false, false, true], "silence_prob": [29.05, 29.18, 28.73, 29.13, 28.85, 29.53, 29.13, 32.96, 36.31, 0.0, 30.12, 0.0, 29.62], "audiomae_on_audioset": [[["music", 26.51], ["hum", 23.71], ["speech", 16.45]], [["music", 64.12], ["noise", 7.23], ["speech", 5.76]], [["speech", 44.05], ["music", 32.21], ["buzz", 2.12]], [["explosion", 24.84], ["rumble", 15.01], ["speech", 6.58]], [["music", 40.66], ["mains hum", 19.94], ["hum", 12.82]], [["music", 22.45], ["whack, thwack", 16.52], ["speech", 9.12]], [["throbbing", 53.38], ["hum", 17.23], ["music", 16.41]], [["music", 36.56], ["hum", 14.01], ["mains hum", 7.85]], [["throbbing", 33.58], ["music", 30.02], ["hum", 20.65]], null, [["music", 73.37], ["electronic music", 4.71], ["speech", 2.75]], null, [["music", 57.41], ["hum", 6.96], ["mains hum", 5.59]]], "duration": [27.59, 9.03, 26.37, 3.83, 13.9, 21.93, 17.36, 4.45, 5.8, -0.33, 2.74, 1.49, 10.17]} \ No newline at end of file diff --git a/annotations_filtered/f9Wq05WVXiQ_filtered.json b/annotations_filtered/f9Wq05WVXiQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4eefd62c4ebbfddead142e324adfd8e0d643ae02 --- /dev/null +++ b/annotations_filtered/f9Wq05WVXiQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.97], [7.0, 8.07], [9.0, 8.78], [17.0, 16.95], [18.0, 19.84], [20.0, 20.36], [24.0, 25.83], [27.0, 28.11], [29.0, 40.02], [42.0, 42.03], [43.0, 44.71], [47.0, 48.78], [49.0, 52.62], [54.0, 69.09], [70.0, 158.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.42, 0.0, 0.0, 0.0, 44.46, 59.96, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["fly, housefly", 47.39], ["mosquito", 17.37], ["insect", 16.99]], null, null, null, [["speech", 48.4], ["hum", 19.67], ["mains hum", 7.91]], null, null], "duration": [1.97, 1.07, -0.22, -0.05, 1.84, 0.36, 1.83, 1.11, 11.02, 0.03, 1.71, 1.78, 3.62, 15.09, 88.7]} \ No newline at end of file diff --git a/annotations_filtered/f9_akBxA4mU_filtered.json b/annotations_filtered/f9_akBxA4mU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ebe9ee84677c198d95449f021f9dd03be8ab0c9 --- /dev/null +++ b/annotations_filtered/f9_akBxA4mU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.91], [9.0, 9.29], [13.0, 15.23], [16.0, 16.71], [22.0, 23.82], [26.0, 27.57], [31.0, 31.6], [32.0, 33.08], [37.0, 38.11], [39.0, 39.99], [41.0, 41.44], [43.0, 43.98], [48.0, 48.03], [49.0, 50.3], [66.0, 67.39], [72.0, 81.45], [82.0, 82.17], [84.0, 83.78], [88.0, 91.37], [101.0, 104.68]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 37.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.33, 0.0, 0.0, 39.63, 64.75], "audiomae_on_audioset": [null, null, [["speech", 26.25], ["fly, housefly", 12.16], ["radio", 9.65]], null, null, null, null, null, null, null, null, null, null, null, null, [["frog", 14.58], ["whale vocalization", 10.86], ["livestock, farm animals, working animals", 9.03]], null, null, [["sidetone", 66.71], ["speech", 19.87], ["radio", 5.61]], null], "duration": [0.91, 0.29, 2.23, 0.71, 1.82, 1.57, 0.6, 1.08, 1.11, 0.99, 0.44, 0.98, 0.03, 1.3, 1.39, 9.45, 0.17, -0.22, 3.37, 3.68]} \ No newline at end of file diff --git a/annotations_filtered/f9vhFEweovc_filtered.json b/annotations_filtered/f9vhFEweovc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b832efd67da2a5eb2b55c0b82a2144bfddaf505 --- /dev/null +++ b/annotations_filtered/f9vhFEweovc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.42], [8.0, 8.6], [11.0, 12.04], [18.0, 18.82], [20.0, 20.12], [23.0, 22.77], [27.0, 27.38], [35.0, 35.36], [38.0, 39.7], [41.0, 41.18], [43.0, 43.38], [78.0, 78.39], [80.0, 81.06], [82.0, 82.41], [84.0, 86.71], [88.0, 88.3], [89.0, 90.71], [93.0, 94.22], [101.0, 101.82], [108.0, 108.7], [110.0, 110.1], [111.0, 110.54], [112.0, 112.83], [114.0, 116.43], [118.0, 118.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.31, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 0.6, 1.04, 0.82, 0.12, -0.23, 0.38, 0.36, 1.7, 0.18, 0.38, 0.39, 1.06, 0.41, 2.71, 0.3, 1.71, 1.22, 0.82, 0.7, 0.1, -0.46, 0.83, 2.43, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/f9wFKCfic8Q_filtered.json b/annotations_filtered/f9wFKCfic8Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e0b983a81a38fa950d797f45450901858a4c57e --- /dev/null +++ b/annotations_filtered/f9wFKCfic8Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.59], [11.0, 19.6], [20.0, 25.35], [27.0, 28.39], [29.0, 30.37], [33.0, 59.56], [64.0, 72.47], [76.0, 86.91], [92.0, 95.18]], "keep_status": [false, true, true, false, false, true, false, false, false], "silence_prob": [38.46, 34.2, 32.22, 0.0, 0.0, 31.09, 31.76, 35.24, 35.51], "audiomae_on_audioset": [[["music", 41.56], ["hum", 19.26], ["throbbing", 9.51]], [["livestock, farm animals, working animals", 32.62], ["speech", 14.61], ["cattle, bovinae", 10.16]], [["speech", 33.5], ["music", 32.94], ["electronic music", 3.14]], null, null, [["music", 28.44], ["speech", 16.65], ["livestock, farm animals, working animals", 9.59]], [["music", 41.18], ["speech", 32.05], ["explosion", 6.13]], [["music", 44.23], ["throbbing", 21.7], ["hum", 19.04]], [["speech", 51.17], ["music", 18.92], ["boing", 8.17]]], "duration": [5.59, 8.6, 5.35, 1.39, 1.37, 26.56, 8.47, 10.91, 3.18]} \ No newline at end of file diff --git a/annotations_filtered/fARjlj6q1uU_filtered.json b/annotations_filtered/fARjlj6q1uU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7138b5dee8f53d6b7ed777ccb6d2d664ab45fb7 --- /dev/null +++ b/annotations_filtered/fARjlj6q1uU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 7.03], [11.0, 12.56], [13.0, 13.69], [16.0, 20.36], [23.0, 28.58], [29.0, 30.08], [31.0, 33.71], [35.0, 35.26], [36.0, 37.17], [42.0, 41.79], [42.0, 42.65], [43.0, 43.26], [45.0, 45.64], [66.0, 73.5], [83.0, 82.68], [85.0, 86.21], [94.0, 93.9], [96.0, 98.39], [99.0, 99.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [79.76, 0.0, 0.0, 99.48, 99.26, 0.0, 88.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.26, 0.0, 0.0, 0.0, 99.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 55.16], ["music", 9.52], ["electric shaver, electric razor", 7.22]], null, null, null, null, null], "duration": [6.03, 1.56, 0.69, 4.36, 5.58, 1.08, 2.71, 0.26, 1.17, -0.21, 0.65, 0.26, 0.64, 7.5, -0.32, 1.21, -0.1, 2.39, 0.37]} \ No newline at end of file diff --git a/annotations_filtered/fAaVf_wel0c_filtered.json b/annotations_filtered/fAaVf_wel0c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0eda908f7d469aa0d9fdcef67c1fa07d83dfed7d --- /dev/null +++ b/annotations_filtered/fAaVf_wel0c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.26], [9.0, 8.58], [13.0, 14.32], [25.0, 27.4], [29.0, 29.0], [37.0, 39.92], [41.0, 42.74], [44.0, 44.66], [47.0, 47.83], [49.0, 49.77], [51.0, 51.04], [55.0, 55.41], [57.0, 56.89], [57.0, 56.93], [57.0, 57.0], [57.0, 57.59], [58.0, 57.81], [58.0, 57.94], [59.0, 59.58], [75.0, 75.41], [85.0, 87.24], [90.0, 93.77], [111.0, 110.64], [113.0, 114.57], [117.0, 118.4], [126.0, 126.23], [128.0, 130.05], [131.0, 133.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 94.81, 0.0, 32.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.87, 30.44, 0.0, 0.0, 0.0, 0.0, 29.47, 29.17], "audiomae_on_audioset": [null, null, null, null, null, [["music", 66.24], ["musical instrument", 11.32], ["harp", 6.15]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 63.26], ["musical instrument", 6.99], ["didgeridoo", 6.73]], [["music", 66.87], ["singing", 2.51], ["synthetic singing", 1.97]], null, null, null, null, [["music", 57.47], ["musical instrument", 4.25], ["didgeridoo", 3.49]], [["music", 52.68], ["theremin", 5.64], ["musical instrument", 4.11]]], "duration": [0.26, -0.42, 1.32, 2.4, 0.0, 2.92, 1.74, 0.66, 0.83, 0.77, 0.04, 0.41, -0.11, -0.07, 0.0, 0.59, -0.19, -0.06, 0.58, 0.41, 2.24, 3.77, -0.36, 1.57, 1.4, 0.23, 2.05, 2.83]} \ No newline at end of file diff --git a/annotations_filtered/fAdsL7AXW6A_filtered.json b/annotations_filtered/fAdsL7AXW6A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0eda811c1a6b994e97a7766eac51b33272fce15 --- /dev/null +++ b/annotations_filtered/fAdsL7AXW6A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.83], [5.0, 6.0], [7.0, 7.6], [9.0, 10.17], [30.0, 31.53], [32.0, 32.88], [38.0, 39.34], [42.0, 90.34], [91.0, 119.94]], "keep_status": [false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 16.54], ["buzz", 10.57], ["cattle, bovinae", 10.18]]], "duration": [0.83, 1.0, 0.6, 1.17, 1.53, 0.88, 1.34, 48.34, 28.94]} \ No newline at end of file diff --git a/annotations_filtered/fAiJAcgjWeQ_filtered.json b/annotations_filtered/fAiJAcgjWeQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f5706b119fdebdf9c3356a623b61fe531da9b56 --- /dev/null +++ b/annotations_filtered/fAiJAcgjWeQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.72], [15.0, 15.35], [17.0, 19.03], [19.0, 20.97], [22.0, 23.43], [25.0, 25.76], [27.0, 27.6], [29.0, 31.14], [33.0, 33.35], [35.0, 36.1], [36.0, 38.58], [41.0, 41.17], [52.0, 54.38], [55.0, 57.69], [63.0, 63.27], [65.0, 65.35], [67.0, 66.97], [67.0, 67.31], [68.0, 70.17], [73.0, 73.58], [76.0, 76.18], [78.0, 78.33], [79.0, 79.39], [80.0, 80.55], [81.0, 81.5], [87.0, 87.35], [91.0, 92.31], [94.0, 97.48], [98.0, 99.87], [100.0, 106.25], [113.0, 114.29], [116.0, 119.13], [120.0, 122.18], [123.0, 128.63], [129.0, 129.81], [131.0, 131.4], [132.0, 133.25], [134.0, 134.92], [140.0, 141.96], [143.0, 143.63], [146.0, 145.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 78.89, 0.0, 0.0, 0.0, 0.0, 95.23, 0.0, 0.0, 86.27, 0.0, 88.46, 95.91, 0.0, 0.0, 0.0, 0.0, 89.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 87.55, 0.0, 99.16, 98.99, 60.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, 0.35, 2.03, 1.97, 1.43, 0.76, 0.6, 2.14, 0.35, 1.1, 2.58, 0.17, 2.38, 2.69, 0.27, 0.35, -0.03, 0.31, 2.17, 0.58, 0.18, 0.33, 0.39, 0.55, 0.5, 0.35, 1.31, 3.48, 1.87, 6.25, 1.29, 3.13, 2.18, 5.63, 0.81, 0.4, 1.25, 0.92, 1.96, 0.63, -0.07]} \ No newline at end of file diff --git a/annotations_filtered/fB5HTcFhCso_filtered.json b/annotations_filtered/fB5HTcFhCso_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b8b98e88d942d4c8f8f93c2038d3818b7f31c26 --- /dev/null +++ b/annotations_filtered/fB5HTcFhCso_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.84], [11.0, 11.55], [12.0, 12.56], [18.0, 18.54], [20.0, 20.82], [23.0, 24.24], [31.0, 39.73], [42.0, 43.16], [44.0, 45.6], [50.0, 53.16], [56.0, 59.29], [61.0, 64.91], [66.0, 71.17], [73.0, 88.45], [89.0, 89.73], [90.0, 90.81], [91.0, 92.69], [97.0, 98.95], [102.0, 102.41], [104.0, 107.27], [109.0, 114.66], [115.0, 116.61], [117.0, 118.18], [124.0, 126.0], [128.0, 131.94], [132.0, 133.57], [142.0, 143.61], [148.0, 148.78], [149.0, 150.47], [154.0, 155.46], [156.0, 157.92], [159.0, 160.68], [165.0, 167.34], [168.0, 170.09], [173.0, 175.76], [176.0, 177.2], [178.0, 179.19], [184.0, 185.45]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.49, 0.0, 0.0, 42.3, 56.18, 45.65, 42.3, 31.5, 0.0, 0.0, 0.0, 0.0, 0.0, 42.39, 51.55, 0.0, 0.0, 48.52, 50.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.25, 69.74, 57.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 52.15], ["hum", 7.67], ["throbbing", 6.32]], null, null, [["cattle, bovinae", 42.3], ["moo", 32.14], ["livestock, farm animals, working animals", 12.26]], null, [["music", 16.22], ["mains hum", 14.85], ["hum", 12.14]], [["whale vocalization", 37.9], ["music", 24.06], ["theremin", 7.26]], [["music", 66.47], ["throbbing", 16.9], ["didgeridoo", 2.71]], null, null, null, null, null, [["music", 25.64], ["hum", 9.0], ["speech", 8.1]], null, null, null, [["speech", 32.17], ["hum", 9.95], ["mains hum", 8.55]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.84, 0.55, 0.56, 0.54, 0.82, 1.24, 8.73, 1.16, 1.6, 3.16, 3.29, 3.91, 5.17, 15.45, 0.73, 0.81, 1.69, 1.95, 0.41, 3.27, 5.66, 1.61, 1.18, 2.0, 3.94, 1.57, 1.61, 0.78, 1.47, 1.46, 1.92, 1.68, 2.34, 2.09, 2.76, 1.2, 1.19, 1.45]} \ No newline at end of file diff --git a/annotations_filtered/fB8_lNQJ-JM_filtered.json b/annotations_filtered/fB8_lNQJ-JM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35b7a1cbcd5b5b805884e2530f502a1a58ced305 --- /dev/null +++ b/annotations_filtered/fB8_lNQJ-JM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.86], [18.0, 18.23], [18.0, 28.9], [32.0, 31.97], [32.0, 32.53], [36.0, 36.31], [38.0, 39.24], [40.0, 40.76], [43.0, 43.21], [45.0, 45.81], [48.0, 51.95], [62.0, 62.67], [65.0, 65.52], [66.0, 66.48], [67.0, 68.15], [69.0, 69.92], [71.0, 72.33], [75.0, 76.25], [82.0, 82.97], [84.0, 85.8], [88.0, 89.02], [89.0, 89.97], [92.0, 92.89], [94.0, 95.66], [99.0, 99.15], [101.0, 102.69], [104.0, 107.99], [109.0, 110.66], [111.0, 114.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 44.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.14, 0.0, 47.82], "audiomae_on_audioset": [null, null, [["boat, water vehicle", 33.02], ["speech", 26.9], ["rowboat, canoe, kayak", 20.51]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 10.73], ["music", 8.25], ["speech", 7.61]]], "duration": [1.86, 0.23, 10.9, -0.03, 0.53, 0.31, 1.24, 0.76, 0.21, 0.81, 3.95, 0.67, 0.52, 0.48, 1.15, 0.92, 1.33, 1.25, 0.97, 1.8, 1.02, 0.97, 0.89, 1.66, 0.15, 1.69, 3.99, 1.66, 3.56]} \ No newline at end of file diff --git a/annotations_filtered/fBB_lJ3Axqk_filtered.json b/annotations_filtered/fBB_lJ3Axqk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e60e02f2dca137132b5fecbf4daebf3f7b95466 --- /dev/null +++ b/annotations_filtered/fBB_lJ3Axqk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 22.22], [24.0, 38.21], [41.0, 59.04], [60.0, 67.17], [68.0, 68.4], [69.0, 74.09], [74.0, 74.12], [75.0, 77.04], [78.0, 82.26], [83.0, 84.33], [85.0, 85.58], [88.0, 88.5], [91.0, 93.02], [102.0, 113.91], [115.0, 125.56]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [30.6, 31.06, 34.32, 40.22, 0.0, 31.33, 0.0, 33.16, 33.58, 0.0, 0.0, 0.0, 34.55, 32.29, 31.59], "audiomae_on_audioset": [[["music", 73.96], ["musical instrument", 4.43], ["guitar", 1.63]], [["music", 89.35], ["musical instrument", 2.17], ["guitar", 1.48]], [["music", 68.51], ["speech", 10.9], ["neigh, whinny", 5.75]], [["speech", 23.99], ["radio", 13.2], ["music", 9.49]], null, [["music", 69.55], ["musical instrument", 8.26], ["guitar", 5.94]], null, [["music", 76.11], ["guitar", 6.21], ["musical instrument", 4.5]], [["music", 33.38], ["mosquito", 6.56], ["fly, housefly", 5.5]], null, null, null, [["music", 52.52], ["musical instrument", 8.87], ["guitar", 6.51]], [["music", 64.61], ["speech", 8.31], ["musical instrument", 2.2]], [["music", 56.58], ["musical instrument", 8.93], ["plucked string instrument", 4.6]]], "duration": [14.22, 14.21, 18.04, 7.17, 0.4, 5.09, 0.12, 2.04, 4.26, 1.33, 0.58, 0.5, 2.02, 11.91, 10.56]} \ No newline at end of file diff --git a/annotations_filtered/fBNzgfFkvEo_filtered.json b/annotations_filtered/fBNzgfFkvEo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a34a374e7e6780da9a131313701a93a14f9a31d --- /dev/null +++ b/annotations_filtered/fBNzgfFkvEo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 108.77], [110.0, 147.78]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [58.77, 37.78]} \ No newline at end of file diff --git a/annotations_filtered/fBTODK66ymw_filtered.json b/annotations_filtered/fBTODK66ymw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7f6766c4794f78be559b108f93e6a8734f66c05 --- /dev/null +++ b/annotations_filtered/fBTODK66ymw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.37], [6.0, 7.35], [10.0, 15.65], [17.0, 63.05], [67.0, 73.63], [76.0, 81.55], [83.0, 85.31], [89.0, 106.0], [111.0, 111.91], [113.0, 115.25], [117.0, 118.44], [119.0, 119.79], [120.0, 121.29], [122.0, 134.67], [135.0, 149.55], [153.0, 153.54], [154.0, 153.62], [154.0, 154.74], [157.0, 157.05], [161.0, 160.83], [164.0, 164.81], [170.0, 183.78], [185.0, 186.19]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 28.64, 0.0, 30.09, 30.04, 31.37, 28.78, 0.0, 29.08, 0.0, 0.0, 0.0, 28.64, 29.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.15, 0.0], "audiomae_on_audioset": [null, null, [["buzz", 26.54], ["electric shaver, electric razor", 15.6], ["hum", 13.94]], null, [["throbbing", 54.53], ["music", 20.72], ["hum", 15.67]], [["hum", 42.97], ["throbbing", 26.99], ["mains hum", 18.21]], [["music", 44.37], ["throbbing", 18.72], ["hum", 10.08]], [["music", 71.55], ["buzz", 3.53], ["cacophony", 2.91]], null, [["electric shaver, electric razor", 38.33], ["music", 24.27], ["mains hum", 9.4]], null, null, null, [["music", 26.71], ["buzz", 16.99], ["hum", 15.83]], [["music", 29.35], ["hum", 23.21], ["mains hum", 21.07]], null, null, null, null, null, null, [["mains hum", 33.89], ["hum", 27.65], ["music", 19.9]], null], "duration": [0.37, 1.35, 5.65, 46.05, 6.63, 5.55, 2.31, 17.0, 0.91, 2.25, 1.44, 0.79, 1.29, 12.67, 14.55, 0.54, -0.38, 0.74, 0.05, -0.17, 0.81, 13.78, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/fBXXvn4s-74_filtered.json b/annotations_filtered/fBXXvn4s-74_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2cc97b6e1a1dee6edc0ce0dc4d00b6777510852c --- /dev/null +++ b/annotations_filtered/fBXXvn4s-74_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.49], [34.0, 34.7], [37.0, 37.86], [52.0, 51.97], [86.0, 86.32], [98.0, 98.15], [110.0, 112.35], [120.0, 120.56], [136.0, 136.75], [143.0, 142.86], [145.0, 146.1], [149.0, 148.8], [153.0, 153.91], [175.0, 176.15], [207.0, 209.22], [213.0, 216.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.98, 91.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.49, 0.7, 0.86, -0.03, 0.32, 0.15, 2.35, 0.56, 0.75, -0.14, 1.1, -0.2, 0.91, 1.15, 2.22, 3.57]} \ No newline at end of file diff --git a/annotations_filtered/fB_fwuJOx7I_filtered.json b/annotations_filtered/fB_fwuJOx7I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b82114dcc07741991bf311b69fb2c4680a1a3b60 --- /dev/null +++ b/annotations_filtered/fB_fwuJOx7I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 25.02], [28.0, 40.53], [41.0, 41.88], [43.0, 45.77], [47.0, 48.14], [49.0, 49.42], [53.0, 54.06], [55.0, 56.12], [57.0, 58.72], [60.0, 65.08], [66.0, 68.5], [70.0, 70.43], [71.0, 71.64], [74.0, 79.56], [84.0, 87.86], [88.0, 88.92], [90.0, 94.51], [100.0, 100.35], [102.0, 101.98], [103.0, 105.31], [107.0, 107.08], [109.0, 121.12]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.65, 0.0, 66.27, 0.0, 0.0, 0.0, 0.0, 0.0, 66.51, 99.73, 0.0, 0.0, 88.28, 29.92, 0.0, 52.39, 0.0, 0.0, 95.91, 0.0, 38.84], "audiomae_on_audioset": [null, [["music", 18.16], ["thunk", 11.38], ["speech", 10.65]], null, null, null, null, null, null, null, null, null, null, null, null, [["clang", 45.4], ["music", 17.06], ["ding", 16.73]], null, null, null, null, null, null, [["music", 77.98], ["hip hop music", 2.57], ["dubstep", 2.34]]], "duration": [1.02, 12.53, 0.88, 2.77, 1.14, 0.42, 1.06, 1.12, 1.72, 5.08, 2.5, 0.43, 0.64, 5.56, 3.86, 0.92, 4.51, 0.35, -0.02, 2.31, 0.08, 12.12]} \ No newline at end of file diff --git a/annotations_filtered/fBaXUdPo_2g_filtered.json b/annotations_filtered/fBaXUdPo_2g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4473584b1a5cdcce244f866c978c67047b297218 --- /dev/null +++ b/annotations_filtered/fBaXUdPo_2g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.54], [6.0, 9.63], [13.0, 14.84], [18.0, 19.94], [21.0, 24.27], [25.0, 26.89], [28.0, 29.05], [30.0, 33.34], [34.0, 38.11], [42.0, 42.45], [44.0, 47.98], [50.0, 53.86], [54.0, 57.72], [62.0, 63.09], [65.0, 65.87], [67.0, 68.23], [71.0, 74.82], [77.0, 79.64], [81.0, 86.1], [88.0, 91.74], [93.0, 96.21]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false, false, true, false], "silence_prob": [59.96, 53.97, 0.0, 0.0, 75.07, 0.0, 0.0, 39.75, 68.02, 0.0, 56.03, 48.27, 47.66, 0.0, 0.0, 0.0, 51.18, 55.67, 53.1, 43.28, 48.23], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 23.6], ["glass", 10.21], ["hum", 8.25]], null, null, null, [["hum", 32.59], ["speech", 19.54], ["rumble", 15.34]], [["speech", 24.74], ["hum", 13.61], ["music", 8.57]], null, null, null, null, null, null, [["hum", 30.76], ["music", 26.12], ["throbbing", 10.81]], [["mains hum", 38.25], ["hum", 24.39], ["gong", 9.25]]], "duration": [2.54, 3.63, 1.84, 1.94, 3.27, 1.89, 1.05, 3.34, 4.11, 0.45, 3.98, 3.86, 3.72, 1.09, 0.87, 1.23, 3.82, 2.64, 5.1, 3.74, 3.21]} \ No newline at end of file diff --git a/annotations_filtered/fBlAMqoJ5BA_filtered.json b/annotations_filtered/fBlAMqoJ5BA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4feb0ef30d05a3d1b1bff5b576bc0a030e50081 --- /dev/null +++ b/annotations_filtered/fBlAMqoJ5BA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.86], [12.0, 15.25], [16.0, 16.43], [17.0, 18.74], [20.0, 20.9], [24.0, 24.34], [27.0, 27.55], [29.0, 30.91], [33.0, 34.47], [36.0, 37.08], [42.0, 43.06], [45.0, 45.54], [48.0, 48.15], [55.0, 57.03], [61.0, 62.4], [69.0, 73.9], [76.0, 78.06], [79.0, 87.74], [93.0, 92.87], [99.0, 99.15], [111.0, 111.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false], "silence_prob": [34.53, 54.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.95, 0.0, 31.54, 33.66, 30.82, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 43.62], ["cattle, bovinae", 29.04], ["moo", 26.16]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 20.37], ["busy signal", 14.78], ["music", 8.51]], null, [["sine wave", 47.42], ["chirp tone", 23.51], ["speech", 9.19]], [["wild animals", 34.06], ["roaring cats (lions, tigers)", 22.56], ["animal", 13.25]], [["speech", 53.05], ["livestock, farm animals, working animals", 6.31], ["sheep", 4.53]], null, null, null], "duration": [6.86, 3.25, 0.43, 1.74, 0.9, 0.34, 0.55, 1.91, 1.47, 1.08, 1.06, 0.54, 0.15, 2.03, 1.4, 4.9, 2.06, 8.74, -0.13, 0.15, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/fBpNFLngzT4_filtered.json b/annotations_filtered/fBpNFLngzT4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc3c80b9452615ab118d6bff9d469a6e8bc73231 --- /dev/null +++ b/annotations_filtered/fBpNFLngzT4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.02], [7.0, 8.14], [10.0, 13.98], [18.0, 18.66], [20.0, 20.49], [23.0, 27.94], [29.0, 45.4], [48.0, 64.44], [65.0, 65.52], [68.0, 77.58], [83.0, 82.78], [83.0, 83.39], [84.0, 86.14], [87.0, 87.13], [90.0, 96.23], [105.0, 106.51], [108.0, 108.28], [113.0, 116.88], [117.0, 117.59], [127.0, 129.05], [131.0, 130.94]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [61.97, 0.0, 38.93, 0.0, 0.0, 33.67, 33.36, 33.33, 0.0, 37.53, 0.0, 0.0, 33.92, 0.0, 33.28, 0.0, 0.0, 34.96, 0.0, 34.39, 0.0], "audiomae_on_audioset": [null, null, [["music", 18.0], ["speech", 13.17], ["hum", 7.43]], null, null, [["speech", 63.91], ["throbbing", 3.74], ["fart", 3.45]], [["speech", 62.22], ["music", 9.92], ["hum", 5.29]], [["music", 20.08], ["hum", 15.62], ["throbbing", 11.94]], null, [["music", 72.25], ["musical instrument", 3.86], ["speech", 2.94]], null, null, [["music", 69.12], ["boing", 8.06], ["musical instrument", 2.59]], null, [["boing", 42.29], ["music", 32.03], ["speech", 3.26]], null, null, [["music", 69.28], ["musical instrument", 6.64], ["saxophone", 4.1]], null, [["music", 42.1], ["boing", 12.44], ["musical instrument", 4.41]], null], "duration": [2.02, 1.14, 3.98, 0.66, 0.49, 4.94, 16.4, 16.44, 0.52, 9.58, -0.22, 0.39, 2.14, 0.13, 6.23, 1.51, 0.28, 3.88, 0.59, 2.05, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/fBtPMUJJEg8_filtered.json b/annotations_filtered/fBtPMUJJEg8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dbcbc751e80991ff8bd3c93b98fea32094f2627f --- /dev/null +++ b/annotations_filtered/fBtPMUJJEg8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[68.0, 92.94], [93.0, 108.87], [112.0, 123.75]], "keep_status": [false, false, true], "silence_prob": [68.54, 76.53, 31.73], "audiomae_on_audioset": [null, null, [["music", 21.72], ["vehicle", 6.63], ["sound effect", 5.63]]], "duration": [24.94, 15.87, 11.75]} \ No newline at end of file diff --git a/annotations_filtered/fC1zzL9DjdU_filtered.json b/annotations_filtered/fC1zzL9DjdU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c4c80bf4e9da3e13158ba73fa0711393d226ef9 --- /dev/null +++ b/annotations_filtered/fC1zzL9DjdU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.41], [18.0, 19.68], [24.0, 24.54], [39.0, 39.07], [48.0, 49.23], [50.0, 51.93], [56.0, 57.43], [58.0, 57.97], [58.0, 59.66], [61.0, 61.89], [65.0, 65.69], [68.0, 68.67], [70.0, 73.55], [80.0, 81.58], [83.0, 84.21], [87.0, 87.88], [89.0, 89.02], [89.0, 90.1], [96.0, 100.18], [101.0, 103.3], [105.0, 108.48], [112.0, 117.63], [118.0, 124.8], [135.0, 135.68], [137.0, 138.3], [140.0, 145.1], [154.0, 153.82], [154.0, 155.26], [156.0, 160.56], [165.0, 165.57], [168.0, 168.88], [172.0, 173.77], [176.0, 176.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.09, 81.71, 74.44, 52.1, 87.92, 0.0, 0.0, 83.52, 0.0, 0.0, 85.35, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.41, 1.68, 0.54, 0.07, 1.23, 1.93, 1.43, -0.03, 1.66, 0.89, 0.69, 0.67, 3.55, 1.58, 1.21, 0.88, 0.02, 1.1, 4.18, 2.3, 3.48, 5.63, 6.8, 0.68, 1.3, 5.1, -0.18, 1.26, 4.56, 0.57, 0.88, 1.77, 0.0]} \ No newline at end of file diff --git a/annotations_filtered/fC976fuQm4E_filtered.json b/annotations_filtered/fC976fuQm4E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d1f906a4429e5081c94447b81d15af73c502625 --- /dev/null +++ b/annotations_filtered/fC976fuQm4E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.86], [7.0, 7.15], [12.0, 14.69], [20.0, 23.36], [25.0, 32.46], [36.0, 50.31], [54.0, 61.52], [63.0, 67.29], [69.0, 71.36], [74.0, 79.24], [82.0, 81.78], [87.0, 97.09], [99.0, 99.5], [100.0, 102.0], [103.0, 106.91], [107.0, 109.21], [114.0, 116.99], [121.0, 120.99], [123.0, 125.85], [130.0, 131.14]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 30.69, 30.61, 30.56, 30.65, 30.15, 29.99, 34.09, 31.11, 0.0, 31.27, 0.0, 31.58, 32.3, 30.24, 31.87, 0.0, 38.38, 0.0], "audiomae_on_audioset": [null, null, [["music", 49.5], ["sidetone", 18.64], ["speech", 13.94]], [["music", 55.36], ["throbbing", 19.37], ["hum", 6.2]], [["music", 78.42], ["throbbing", 10.84], ["hum", 4.61]], [["music", 78.81], ["buzz", 2.89], ["musical instrument", 1.92]], [["music", 75.57], ["hum", 7.32], ["throbbing", 5.86]], [["music", 83.02], ["synthesizer", 3.38], ["musical instrument", 3.35]], [["music", 48.96], ["speech", 9.21], ["electronic music", 6.09]], [["music", 39.15], ["throbbing", 33.16], ["hum", 20.31]], null, [["throbbing", 43.42], ["music", 32.69], ["hum", 13.18]], null, [["music", 71.49], ["musical instrument", 3.93], ["speech", 2.48]], [["music", 58.34], ["speech", 6.83], ["sidetone", 6.41]], [["music", 67.4], ["hum", 11.57], ["throbbing", 3.67]], [["music", 40.63], ["domestic animals, pets", 4.96], ["angry music", 4.47]], null, [["music", 39.17], ["hum", 21.37], ["mains hum", 16.45]], null], "duration": [0.86, 0.15, 2.69, 3.36, 7.46, 14.31, 7.52, 4.29, 2.36, 5.24, -0.22, 10.09, 0.5, 2.0, 3.91, 2.21, 2.99, -0.01, 2.85, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/fCNsIYsWjXo_filtered.json b/annotations_filtered/fCNsIYsWjXo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..baf4b2d001cce142a26aa77f6e0c0bcf14047160 --- /dev/null +++ b/annotations_filtered/fCNsIYsWjXo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 19.63], [22.0, 23.03], [24.0, 24.71], [26.0, 26.6], [27.0, 27.46], [30.0, 30.27], [31.0, 31.51], [33.0, 33.84], [35.0, 35.56], [36.0, 37.76], [42.0, 42.99], [45.0, 45.82], [51.0, 51.7], [53.0, 53.38], [56.0, 56.03], [57.0, 56.94], [58.0, 58.77], [67.0, 66.9], [69.0, 69.18], [70.0, 69.97], [71.0, 71.09], [73.0, 73.75], [76.0, 76.54], [82.0, 82.31], [83.0, 83.39], [85.0, 85.94], [86.0, 87.56], [88.0, 89.16], [90.0, 90.96], [97.0, 97.82], [100.0, 99.79], [100.0, 101.66], [106.0, 106.68], [108.0, 109.27], [111.0, 113.04], [114.0, 115.87], [117.0, 118.94], [123.0, 123.48]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [30.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.23, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 41.02], ["speech", 11.08], ["hum", 8.17]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 16.77], ["cattle, bovinae", 9.87], ["moo", 6.28]], null, null, null], "duration": [15.63, 1.03, 0.71, 0.6, 0.46, 0.27, 0.51, 0.84, 0.56, 1.76, 0.99, 0.82, 0.7, 0.38, 0.03, -0.06, 0.77, -0.1, 0.18, -0.03, 0.09, 0.75, 0.54, 0.31, 0.39, 0.94, 1.56, 1.16, 0.96, 0.82, -0.21, 1.66, 0.68, 1.27, 2.04, 1.87, 1.94, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/fCQb93-RrZo_filtered.json b/annotations_filtered/fCQb93-RrZo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..893cc85e2703274478a4b44ff64b557590185ef3 --- /dev/null +++ b/annotations_filtered/fCQb93-RrZo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.41], [10.0, 10.61], [12.0, 15.52], [17.0, 21.83], [23.0, 29.51], [30.0, 48.64], [50.0, 50.04], [50.0, 56.29], [59.0, 64.32], [64.0, 64.39], [64.0, 64.44], [65.0, 64.57], [65.0, 67.02], [69.0, 69.13], [70.0, 70.21], [71.0, 74.11], [76.0, 76.6], [77.0, 81.48], [82.0, 84.55], [88.0, 92.45], [97.0, 101.46], [103.0, 104.65], [106.0, 107.23], [108.0, 108.85], [111.0, 114.37], [115.0, 122.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 94.52, 99.99, 54.5, 100.0, 0.0, 89.01, 56.78, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 78.38, 0.0, 94.52, 84.25, 31.8, 34.73, 0.0, 0.0, 0.0, 99.93, 52.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 35.71], ["music", 35.64], ["speech", 7.11]], [["music", 38.73], ["synthesizer", 15.27], ["musical instrument", 10.59]], null, null, null, null, null], "duration": [0.41, 0.61, 3.52, 4.83, 6.51, 18.64, 0.04, 6.29, 5.32, 0.39, 0.44, -0.43, 2.02, 0.13, 0.21, 3.11, 0.6, 4.48, 2.55, 4.45, 4.46, 1.65, 1.23, 0.85, 3.37, 7.96]} \ No newline at end of file diff --git a/annotations_filtered/fCbf4DjlHuM_filtered.json b/annotations_filtered/fCbf4DjlHuM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b17358b7b8c695be3996d36d8a98d46a6196daa5 --- /dev/null +++ b/annotations_filtered/fCbf4DjlHuM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.1], [10.0, 10.67], [13.0, 13.83], [17.0, 21.07], [28.0, 29.74], [30.0, 31.33], [35.0, 36.32], [40.0, 40.74], [44.0, 49.72], [52.0, 53.77], [55.0, 57.42], [59.0, 59.85], [61.0, 62.46], [64.0, 64.52], [71.0, 71.29], [71.0, 72.93], [75.0, 75.49], [78.0, 79.73], [81.0, 87.25], [93.0, 92.97], [93.0, 94.32], [96.0, 97.23], [98.0, 98.78], [100.0, 100.38], [101.0, 102.79], [105.0, 106.44], [108.0, 107.77], [109.0, 110.73], [111.0, 116.41], [118.0, 118.94], [122.0, 122.88], [124.0, 125.27], [127.0, 128.53], [129.0, 130.22], [131.0, 132.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 49.73, 0.0, 0.0, 0.0, 0.0, 71.0, 0.0, 55.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["frog", 54.23], ["croak", 26.39], ["insect", 10.63]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 34.84], ["insect", 14.25], ["buzz", 9.95]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.1, 0.67, 0.83, 4.07, 1.74, 1.33, 1.32, 0.74, 5.72, 1.77, 2.42, 0.85, 1.46, 0.52, 0.29, 1.93, 0.49, 1.73, 6.25, -0.03, 1.32, 1.23, 0.78, 0.38, 1.79, 1.44, -0.23, 1.73, 5.41, 0.94, 0.88, 1.27, 1.53, 1.22, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/fCjsUxbNmIs_filtered.json b/annotations_filtered/fCjsUxbNmIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58852b82cd454dd1b21be1a278d7bd83b4867efb --- /dev/null +++ b/annotations_filtered/fCjsUxbNmIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.46], [21.0, 23.41], [26.0, 27.13], [28.0, 28.56], [31.0, 32.37], [33.0, 33.47], [34.0, 33.52], [36.0, 41.28], [42.0, 43.65], [45.0, 61.65], [63.0, 64.57], [68.0, 71.19], [73.0, 73.52], [74.0, 76.25], [77.0, 77.62], [79.0, 80.1], [85.0, 85.14], [94.0, 94.49], [100.0, 107.3], [110.0, 110.83], [112.0, 112.38], [115.0, 117.93], [123.0, 127.33], [128.0, 132.85], [135.0, 137.56], [138.0, 141.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, true, true, true, true], "silence_prob": [0.0, 97.83, 0.0, 0.0, 0.0, 0.0, 0.0, 81.89, 0.0, 33.32, 0.0, 45.05, 0.0, 35.06, 0.0, 0.0, 0.0, 0.0, 32.9, 0.0, 0.0, 42.53, 33.29, 30.66, 29.78, 42.33], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["mains hum", 35.28], ["hum", 21.42], ["music", 14.51]], null, [["music", 29.24], ["fart", 7.04], ["musical instrument", 5.37]], null, [["insect", 30.8], ["fly, housefly", 27.04], ["speech", 13.1]], null, null, null, null, [["music", 53.86], ["didgeridoo", 4.49], ["electronic music", 3.45]], null, null, [["speech", 49.25], ["music", 20.47], ["hum", 4.14]], [["music", 54.72], ["synthesizer", 8.41], ["hum", 6.41]], [["music", 40.97], ["hum", 14.35], ["mains hum", 6.05]], [["music", 17.95], ["reverberation", 15.23], ["cacophony", 8.22]], [["music", 26.03], ["synthesizer", 7.61], ["hum", 6.82]]], "duration": [1.46, 2.41, 1.13, 0.56, 1.37, 0.47, -0.48, 5.28, 1.65, 16.65, 1.57, 3.19, 0.52, 2.25, 0.62, 1.1, 0.14, 0.49, 7.3, 0.83, 0.38, 2.93, 4.33, 4.85, 2.56, 3.29]} \ No newline at end of file diff --git a/annotations_filtered/fCuS78YHrOY_filtered.json b/annotations_filtered/fCuS78YHrOY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4db33c63d7de004ff27f50d0f63eff4a28c0400a --- /dev/null +++ b/annotations_filtered/fCuS78YHrOY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.05], [5.0, 5.81], [6.0, 8.65], [11.0, 11.67], [15.0, 16.61], [17.0, 20.53], [21.0, 22.18], [24.0, 29.52], [33.0, 36.22], [38.0, 40.95], [42.0, 42.85], [43.0, 44.12], [45.0, 46.85], [48.0, 48.49], [52.0, 56.0], [57.0, 58.73], [60.0, 60.79], [61.0, 62.67], [64.0, 64.93], [67.0, 67.96], [76.0, 77.25], [84.0, 89.78], [93.0, 119.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 97.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.05, 0.81, 2.65, 0.67, 1.61, 3.53, 1.18, 5.52, 3.22, 2.95, 0.85, 1.12, 1.85, 0.49, 4.0, 1.73, 0.79, 1.67, 0.93, 0.96, 1.25, 5.78, 26.16]} \ No newline at end of file diff --git a/annotations_filtered/fDcZoI_wy_w_filtered.json b/annotations_filtered/fDcZoI_wy_w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..169b89fd874c8f7022b44956eca8db838bac2485 --- /dev/null +++ b/annotations_filtered/fDcZoI_wy_w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[91.0, 110.42], [111.0, 111.59], [113.0, 113.88], [117.0, 129.44]], "keep_status": [false, false, false, true], "silence_prob": [33.41, 0.0, 0.0, 32.2], "audiomae_on_audioset": [[["music", 74.51], ["glass", 5.73], ["smash, crash", 5.25]], null, null, [["mains hum", 21.2], ["hum", 20.6], ["noise", 14.92]]], "duration": [19.42, 0.59, 0.88, 12.44]} \ No newline at end of file diff --git a/annotations_filtered/fDeQjTPTlDE_filtered.json b/annotations_filtered/fDeQjTPTlDE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42cba589f3cb07c8a4103e5b12a1431aa97b2987 --- /dev/null +++ b/annotations_filtered/fDeQjTPTlDE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.4], [12.0, 12.36], [18.0, 18.03], [24.0, 24.17], [28.0, 31.89], [38.0, 38.48], [40.0, 40.05], [40.0, 40.83], [45.0, 45.45], [50.0, 51.93], [54.0, 57.05], [68.0, 68.08], [71.0, 72.44], [80.0, 80.16], [81.0, 82.16], [88.0, 89.01], [91.0, 91.29], [92.0, 92.85], [94.0, 94.53], [100.0, 100.65], [105.0, 105.56], [114.0, 113.63], [121.0, 121.85], [133.0, 133.1], [138.0, 139.11], [146.0, 158.6], [160.0, 160.79], [162.0, 165.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.62, 0.0, 0.0, 0.0, 0.0, 0.0, 60.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.76, 0.0, 42.69], "audiomae_on_audioset": [null, null, null, null, [["cattle, bovinae", 27.03], ["livestock, farm animals, working animals", 25.57], ["animal", 18.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.47], ["speech", 20.12], ["hum", 12.83]], null, [["speech", 51.03], ["hum", 15.11], ["music", 5.07]]], "duration": [0.4, 0.36, 0.03, 0.17, 3.89, 0.48, 0.05, 0.83, 0.45, 1.93, 3.05, 0.08, 1.44, 0.16, 1.16, 1.01, 0.29, 0.85, 0.53, 0.65, 0.56, -0.37, 0.85, 0.1, 1.11, 12.6, 0.79, 3.75]} \ No newline at end of file diff --git a/annotations_filtered/fDx628jn1YI_filtered.json b/annotations_filtered/fDx628jn1YI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..514f3ca017fab2ff9037848cf4a7594578d80bcf --- /dev/null +++ b/annotations_filtered/fDx628jn1YI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.4], [22.0, 26.92], [36.0, 42.63], [82.0, 81.92], [91.0, 92.1], [95.0, 95.2], [99.0, 99.45]], "keep_status": [false, true, true, false, false, false, false], "silence_prob": [0.0, 30.34, 30.28, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 34.7], ["groan", 14.44], ["crowd", 10.5]], [["livestock, farm animals, working animals", 12.59], ["speech", 12.33], ["music", 5.4]], null, null, null, null], "duration": [0.4, 4.92, 6.63, -0.08, 1.1, 0.2, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/fEA9BJfaaYA_filtered.json b/annotations_filtered/fEA9BJfaaYA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58d20bcd81a2a222ac6eb18f5d3733e4f0c367b3 --- /dev/null +++ b/annotations_filtered/fEA9BJfaaYA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 62.88], [64.0, 69.47], [70.0, 71.04], [72.0, 80.16], [83.0, 98.96], [99.0, 162.87], [173.0, 174.75], [176.0, 177.9]], "keep_status": [true, false, false, false, false, false, false, false], "silence_prob": [36.48, 99.98, 0.0, 79.94, 54.04, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 27.53], ["groan", 9.07], ["music", 7.23]], null, null, null, null, null, null, null], "duration": [14.88, 5.47, 1.04, 8.16, 15.96, 63.87, 1.75, 1.9]} \ No newline at end of file diff --git a/annotations_filtered/fEEj6d3GTOU_filtered.json b/annotations_filtered/fEEj6d3GTOU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef26d6bd09080f22a04b64c8667cdd5f711b82e0 --- /dev/null +++ b/annotations_filtered/fEEj6d3GTOU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.18], [7.0, 7.43], [10.0, 13.76], [15.0, 17.2], [18.0, 18.23], [19.0, 19.16], [21.0, 21.14], [22.0, 23.82], [26.0, 26.37], [29.0, 29.71], [34.0, 40.0], [41.0, 41.5], [42.0, 44.0], [48.0, 48.37], [49.0, 50.79], [54.0, 54.8], [58.0, 59.75], [65.0, 65.97], [73.0, 74.53], [77.0, 76.99], [78.0, 78.31], [79.0, 82.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 81.0, 79.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.2, 0.0, 58.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.28], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 71.39], ["boing", 9.46], ["radio", 3.59]]], "duration": [0.18, 0.43, 3.76, 2.2, 0.23, 0.16, 0.14, 1.82, 0.37, 0.71, 6.0, 0.5, 2.0, 0.37, 1.79, 0.8, 1.75, 0.97, 1.53, -0.01, 0.31, 3.7]} \ No newline at end of file diff --git a/annotations_filtered/fEZuzz0KmN0_filtered.json b/annotations_filtered/fEZuzz0KmN0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d2cbbd463696b872f45d0ae3812ecaa65c1a529 --- /dev/null +++ b/annotations_filtered/fEZuzz0KmN0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.73], [4.0, 6.08], [9.0, 11.48], [20.0, 21.88], [27.0, 28.22], [32.0, 32.43], [33.0, 33.56], [42.0, 43.23], [44.0, 44.15], [45.0, 45.39], [47.0, 47.61], [49.0, 49.47], [50.0, 52.35], [54.0, 54.99], [56.0, 56.25], [57.0, 58.38], [59.0, 60.32], [71.0, 72.42], [85.0, 86.1], [95.0, 95.5], [96.0, 96.03], [98.0, 98.51], [100.0, 100.08], [101.0, 102.22], [105.0, 105.16], [105.0, 105.58], [107.0, 107.32], [108.0, 108.11], [110.0, 110.0], [112.0, 113.09], [114.0, 114.72], [116.0, 116.33], [122.0, 122.2], [126.0, 126.82], [128.0, 129.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.97, 97.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, 2.08, 2.48, 1.88, 1.22, 0.43, 0.56, 1.23, 0.15, 0.39, 0.61, 0.47, 2.35, 0.99, 0.25, 1.38, 1.32, 1.42, 1.1, 0.5, 0.03, 0.51, 0.08, 1.22, 0.16, 0.58, 0.32, 0.11, 0.0, 1.09, 0.72, 0.33, 0.2, 0.82, 1.32]} \ No newline at end of file diff --git a/annotations_filtered/fEcClEBT6QU_filtered.json b/annotations_filtered/fEcClEBT6QU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..306e979f89ea7cec91541b804d8b451d88b68131 --- /dev/null +++ b/annotations_filtered/fEcClEBT6QU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.95], [6.0, 11.13], [17.0, 28.95], [30.0, 30.62], [33.0, 45.94], [49.0, 52.32], [62.0, 65.28], [67.0, 67.32], [72.0, 73.82], [74.0, 75.71], [78.0, 85.43], [87.0, 88.52], [89.0, 91.49], [92.0, 92.72], [95.0, 101.85], [102.0, 107.79], [108.0, 110.51], [113.0, 117.64], [121.0, 125.34], [128.0, 132.27], [134.0, 138.23], [143.0, 145.02], [150.0, 157.17], [163.0, 168.45], [171.0, 173.52], [176.0, 177.03]], "keep_status": [false, true, false, false, true, true, true, false, false, false, true, false, true, false, false, true, true, true, true, false, false, true, false, false, true, false], "silence_prob": [0.0, 30.9, 30.58, 0.0, 30.44, 30.73, 30.98, 0.0, 0.0, 0.0, 31.05, 0.0, 31.39, 0.0, 30.69, 30.83, 31.16, 32.5, 33.82, 33.99, 33.07, 32.21, 31.84, 39.11, 37.02, 0.0], "audiomae_on_audioset": [null, [["music", 38.59], ["speech", 19.01], ["foghorn", 7.18]], [["music", 44.56], ["speech", 33.54], ["quack", 1.77]], null, [["speech", 36.49], ["vehicle", 16.94], ["boat, water vehicle", 7.38]], [["speech", 28.47], ["music", 24.47], ["groan", 2.23]], [["speech", 29.42], ["music", 13.0], ["whale vocalization", 8.74]], null, null, null, [["music", 35.51], ["groan", 8.31], ["speech", 5.15]], null, [["music", 17.07], ["gong", 11.68], ["sound effect", 7.81]], null, [["speech", 65.65], ["music", 9.54], ["sidetone", 3.54]], [["music", 37.86], ["speech", 22.92], ["sound effect", 7.24]], [["speech", 38.78], ["mains hum", 10.83], ["hum", 7.69]], [["speech", 45.65], ["boat, water vehicle", 11.13], ["rowboat, canoe, kayak", 6.55]], [["speech", 38.33], ["music", 23.0], ["synthesizer", 2.87]], [["music", 43.03], ["fart", 25.31], ["speech", 4.27]], [["music", 67.6], ["speech", 9.77], ["whack, thwack", 3.47]], [["speech", 39.79], ["music", 17.73], ["musical instrument", 3.46]], [["music", 52.71], ["speech", 13.57], ["laughter", 5.57]], [["music", 51.92], ["throbbing", 16.49], ["hum", 6.04]], [["music", 20.58], ["cattle, bovinae", 15.79], ["speech", 12.85]], null], "duration": [0.95, 5.13, 11.95, 0.62, 12.94, 3.32, 3.28, 0.32, 1.82, 1.71, 7.43, 1.52, 2.49, 0.72, 6.85, 5.79, 2.51, 4.64, 4.34, 4.27, 4.23, 2.02, 7.17, 5.45, 2.52, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/fEocj1eLsmg_filtered.json b/annotations_filtered/fEocj1eLsmg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d84320a9b971edce350e29a223bd348fcad09ab6 --- /dev/null +++ b/annotations_filtered/fEocj1eLsmg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.87], [5.0, 6.54], [11.0, 12.34], [15.0, 15.79], [17.0, 18.2], [22.0, 22.67], [25.0, 26.25], [30.0, 31.89], [33.0, 32.98], [33.0, 33.54], [37.0, 37.69], [43.0, 49.25], [51.0, 51.09], [52.0, 102.9], [104.0, 109.68], [113.0, 113.78], [115.0, 117.02], [117.0, 123.87], [125.0, 126.47], [127.0, 126.99], [128.0, 129.14], [134.0, 135.55], [139.0, 138.89], [142.0, 142.99], [149.0, 150.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.33, 0.0, 0.0, 32.52, 0.0, 35.48, 31.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 26.41], ["cowbell", 24.37], ["livestock, farm animals, working animals", 19.08]], null, [["cattle, bovinae", 47.2], ["moo", 30.82], ["livestock, farm animals, working animals", 19.85]], [["music", 37.35], ["boing", 12.0], ["groan", 6.08]], null, null, null, null, null, null, null], "duration": [0.87, 1.54, 1.34, 0.79, 1.2, 0.67, 1.25, 1.89, -0.02, 0.54, 0.69, 6.25, 0.09, 50.9, 5.68, 0.78, 2.02, 6.87, 1.47, -0.01, 1.14, 1.55, -0.11, 0.99, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/fEpjHtkttYg_filtered.json b/annotations_filtered/fEpjHtkttYg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..274a11ada300ec6d66f246213dad35bbbd1f548b --- /dev/null +++ b/annotations_filtered/fEpjHtkttYg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.29], [7.0, 13.22], [16.0, 18.23], [20.0, 21.24], [23.0, 23.63], [25.0, 26.3], [28.0, 28.34], [29.0, 30.03], [31.0, 33.94], [35.0, 39.26], [41.0, 46.04], [47.0, 48.83], [50.0, 51.21], [52.0, 54.24], [55.0, 70.77], [71.0, 73.14], [74.0, 118.66], [121.0, 124.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 86.09, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 74.44, 84.98, 69.88, 0.0, 0.0, 74.76, 33.87, 45.78, 0.0, 49.27], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.03], ["music", 15.55], ["cacophony", 6.67]], [["speech", 20.35], ["music", 19.33], ["hum", 15.1]], null, [["whale vocalization", 62.7], ["moo", 10.06], ["cattle, bovinae", 9.16]]], "duration": [1.29, 6.22, 2.23, 1.24, 0.63, 1.3, 0.34, 1.03, 2.94, 4.26, 5.04, 1.83, 1.21, 2.24, 15.77, 2.14, 44.66, 3.14]} \ No newline at end of file diff --git a/annotations_filtered/fEsN1FMfBvI_filtered.json b/annotations_filtered/fEsN1FMfBvI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c34c56157c3d730607fcfd0c3052ba173081b2b1 --- /dev/null +++ b/annotations_filtered/fEsN1FMfBvI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.52], [3.0, 4.09], [7.0, 9.66], [11.0, 12.82], [14.0, 14.4], [16.0, 16.55], [21.0, 22.01], [23.0, 23.43], [26.0, 26.15], [29.0, 30.18], [30.0, 38.45], [39.0, 40.74], [44.0, 53.74], [57.0, 58.99], [64.0, 64.83], [68.0, 117.05], [118.0, 152.96], [154.0, 159.34], [160.0, 160.51], [163.0, 175.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 69.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.87, 0.0, 31.32, 0.0, 0.0, 0.0, 0.0, 40.7, 0.0, 38.84], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 18.92], ["fly, housefly", 9.7], ["speech", 7.58]], null, [["mains hum", 48.62], ["hum", 42.33], ["throbbing", 6.27]], null, null, null, null, [["music", 31.13], ["hum", 20.79], ["mains hum", 18.49]], null, [["mains hum", 31.02], ["hum", 26.92], ["music", 21.94]]], "duration": [0.52, 1.09, 2.66, 1.82, 0.4, 0.55, 1.01, 0.43, 0.15, 1.18, 8.45, 1.74, 9.74, 1.99, 0.83, 49.05, 34.96, 5.34, 0.51, 12.78]} \ No newline at end of file diff --git a/annotations_filtered/fEwSNiZ3zn4_filtered.json b/annotations_filtered/fEwSNiZ3zn4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53051f32d62c0cf503d97963132da6962ea9f292 --- /dev/null +++ b/annotations_filtered/fEwSNiZ3zn4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.23], [9.0, 9.02], [10.0, 10.0], [13.0, 13.46], [14.0, 14.34], [17.0, 17.63], [19.0, 19.48], [21.0, 21.79], [28.0, 28.31], [29.0, 29.62], [32.0, 32.34], [38.0, 41.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 73.69], ["speech", 9.45], ["hum", 7.37]]], "duration": [0.23, 0.02, 0.0, 0.46, 0.34, 0.63, 0.48, 0.79, 0.31, 0.62, 0.34, 3.66]} \ No newline at end of file diff --git a/annotations_filtered/fF12SZcPQ1s_filtered.json b/annotations_filtered/fF12SZcPQ1s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8ce6167a65095508baa515d1a262f28e0c7dd49 --- /dev/null +++ b/annotations_filtered/fF12SZcPQ1s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.48], [7.0, 7.53], [10.0, 10.17], [12.0, 11.79], [13.0, 14.88], [25.0, 25.54], [30.0, 30.21], [35.0, 34.8], [38.0, 40.1]], "keep_status": [false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.71], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 43.06], ["cattle, bovinae", 11.3], ["boing", 6.82]]], "duration": [0.48, 0.53, 0.17, -0.21, 1.88, 0.54, 0.21, -0.2, 2.1]} \ No newline at end of file diff --git a/annotations_filtered/fFE8_U07a5I_filtered.json b/annotations_filtered/fFE8_U07a5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78be30610782bc77aa7e40dc6bcba99d58ac3310 --- /dev/null +++ b/annotations_filtered/fFE8_U07a5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.18], [6.0, 6.49], [7.0, 18.59], [19.0, 19.95], [20.0, 20.78], [25.0, 25.74], [29.0, 29.44], [31.0, 31.85], [35.0, 35.5], [45.0, 45.42], [49.0, 50.19], [52.0, 53.18], [54.0, 57.74], [59.0, 61.28], [63.0, 68.25], [69.0, 71.02], [71.0, 73.23], [74.0, 74.09], [76.0, 76.74], [78.0, 78.92], [80.0, 81.82], [85.0, 90.26], [93.0, 92.85], [94.0, 94.58], [96.0, 97.19], [97.0, 99.17], [101.0, 103.38], [104.0, 111.13], [112.0, 112.82], [113.0, 115.3], [116.0, 120.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 55.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 100.0, 99.84, 100.0, 99.99, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 0.0, 0.0, 63.85, 100.0, 100.0, 0.0, 71.87, 57.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.18, 0.49, 11.59, 0.95, 0.78, 0.74, 0.44, 0.85, 0.5, 0.42, 1.19, 1.18, 3.74, 2.28, 5.25, 2.02, 2.23, 0.09, 0.74, 0.92, 1.82, 5.26, -0.15, 0.58, 1.19, 2.17, 2.38, 7.13, 0.82, 2.3, 4.34]} \ No newline at end of file diff --git a/annotations_filtered/fFUR02kaGTQ_filtered.json b/annotations_filtered/fFUR02kaGTQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0814fab71c3f9b30f3a30fa6d1e1eb079ee7b2d0 --- /dev/null +++ b/annotations_filtered/fFUR02kaGTQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.36], [3.0, 4.36], [7.0, 9.21], [12.0, 12.65], [17.0, 18.5], [21.0, 22.65], [27.0, 29.02], [30.0, 31.36], [34.0, 35.7], [37.0, 39.61], [41.0, 43.24], [45.0, 46.33], [48.0, 66.16], [68.0, 68.88], [72.0, 73.28], [77.0, 77.6], [78.0, 81.87], [86.0, 89.09], [91.0, 95.05], [98.0, 101.29], [102.0, 102.71], [105.0, 105.48], [107.0, 109.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.91, 100.0, 0.0, 99.98, 0.0, 0.0, 0.0, 100.0, 98.27, 99.95, 99.16, 0.0, 0.0, 99.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.36, 1.36, 2.21, 0.65, 1.5, 1.65, 2.02, 1.36, 1.7, 2.61, 2.24, 1.33, 18.16, 0.88, 1.28, 0.6, 3.87, 3.09, 4.05, 3.29, 0.71, 0.48, 2.73]} \ No newline at end of file diff --git a/annotations_filtered/fFan929BTPE_filtered.json b/annotations_filtered/fFan929BTPE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db7678468770bb7de80aef9c3e14c4f41542b1de --- /dev/null +++ b/annotations_filtered/fFan929BTPE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.8], [19.0, 19.75], [25.0, 25.14], [26.0, 27.41], [29.0, 29.94], [31.0, 31.56], [32.0, 32.63], [33.0, 33.96], [34.0, 35.23], [36.0, 37.07], [38.0, 38.53], [54.0, 55.16], [60.0, 63.39], [72.0, 72.23], [74.0, 74.49], [85.0, 86.04], [87.0, 87.89], [94.0, 94.15], [96.0, 96.45], [98.0, 99.44], [103.0, 102.9], [106.0, 106.62], [110.0, 116.07], [116.0, 116.4], [116.0, 116.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.48, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["crushing", 93.14], ["squish", 1.36], ["noise", 0.65]], null, null, null, null, null, null, null, null, null, [["speech", 57.41], ["hum", 5.45], ["throbbing", 4.91]], null, null], "duration": [1.8, 0.75, 0.14, 1.41, 0.94, 0.56, 0.63, 0.96, 1.23, 1.07, 0.53, 1.16, 3.39, 0.23, 0.49, 1.04, 0.89, 0.15, 0.45, 1.44, -0.1, 0.62, 6.07, 0.4, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/fGiaJDWSWKE_filtered.json b/annotations_filtered/fGiaJDWSWKE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78e83f857b9652041f3690a41737f76289b2f4ab --- /dev/null +++ b/annotations_filtered/fGiaJDWSWKE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.11], [1.0, 1.44], [3.0, 3.5], [8.0, 10.98], [15.0, 17.59], [22.0, 22.2], [24.0, 24.65], [25.0, 26.91], [28.0, 27.87], [28.0, 29.46], [31.0, 32.43], [37.0, 37.71], [39.0, 41.0], [49.0, 50.58], [52.0, 62.55], [69.0, 70.14], [75.0, 75.51], [76.0, 77.14], [79.0, 79.79], [81.0, 80.6], [82.0, 83.24], [84.0, 84.99], [88.0, 90.42], [93.0, 94.15], [95.0, 96.74], [100.0, 101.73], [103.0, 103.1], [107.0, 109.92], [114.0, 122.89], [125.0, 127.45], [130.0, 130.37], [131.0, 131.67], [136.0, 136.53], [139.0, 140.46], [141.0, 141.64], [143.0, 147.09], [151.0, 151.9], [155.0, 161.25], [165.0, 165.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 81.17, 95.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.15, 0.0, 87.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 0.0, 0.0, 0.0, 98.86, 80.11, 91.98, 0.0, 0.0, 0.0, 0.0, 0.0, 68.28, 0.0, 93.45, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.11, 0.44, 0.5, 2.98, 2.59, 0.2, 0.65, 1.91, -0.13, 1.46, 1.43, 0.71, 2.0, 1.58, 10.55, 1.14, 0.51, 1.14, 0.79, -0.4, 1.24, 0.99, 2.42, 1.15, 1.74, 1.73, 0.1, 2.92, 8.89, 2.45, 0.37, 0.67, 0.53, 1.46, 0.64, 4.09, 0.9, 6.25, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/fGkSjNHEecA_filtered.json b/annotations_filtered/fGkSjNHEecA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0cc72c9383dce4ab3d589b7eba6e226ef4b4c60 --- /dev/null +++ b/annotations_filtered/fGkSjNHEecA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.53], [12.0, 13.24], [17.0, 60.37], [65.0, 70.75], [71.0, 71.78], [76.0, 114.59], [121.0, 124.11], [125.0, 125.12], [125.0, 128.12]], "keep_status": [true, false, false, false, false, false, false, false, true], "silence_prob": [30.53, 0.0, 0.0, 30.57, 0.0, 0.0, 31.87, 0.0, 30.8], "audiomae_on_audioset": [[["music", 47.51], ["electronic music", 8.8], ["cacophony", 4.15]], null, null, [["music", 28.26], ["throbbing", 25.91], ["hum", 18.13]], null, null, [["music", 50.87], ["scary music", 12.72], ["soundtrack music", 7.66]], null, [["music", 39.46], ["hum", 11.82], ["mains hum", 11.36]]], "duration": [4.53, 1.24, 43.37, 5.75, 0.78, 38.59, 3.11, 0.12, 3.12]} \ No newline at end of file diff --git a/annotations_filtered/fHYuhwnlTZs_filtered.json b/annotations_filtered/fHYuhwnlTZs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53c587d76cf505c245c57abb4f8267a67c61cb57 --- /dev/null +++ b/annotations_filtered/fHYuhwnlTZs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.21], [13.0, 17.79], [20.0, 39.31], [40.0, 41.42], [43.0, 43.98], [46.0, 45.74], [47.0, 51.39], [52.0, 53.43], [54.0, 54.14], [54.0, 71.56], [72.0, 72.6], [73.0, 74.41], [75.0, 76.18], [77.0, 81.41], [83.0, 83.34], [83.0, 95.15], [96.0, 99.01], [100.0, 106.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 58.72, 98.86, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 80.82, 0.0, 99.16, 94.66, 98.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.21, 4.79, 19.31, 1.42, 0.98, -0.26, 4.39, 1.43, 0.14, 17.56, 0.6, 1.41, 1.18, 4.41, 0.34, 12.15, 3.01, 6.17]} \ No newline at end of file diff --git a/annotations_filtered/fHerVxCsbyc_filtered.json b/annotations_filtered/fHerVxCsbyc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44ed62312ebe93c1d4f4e5b6da7ee89076d45550 --- /dev/null +++ b/annotations_filtered/fHerVxCsbyc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.9], [5.0, 11.15], [20.0, 22.27], [23.0, 24.49], [26.0, 26.97], [37.0, 37.57], [38.0, 38.99], [39.0, 39.46], [40.0, 41.94], [45.0, 47.28], [47.0, 47.49], [48.0, 48.66], [50.0, 50.16], [54.0, 55.92], [58.0, 59.43], [65.0, 65.25], [72.0, 73.04], [76.0, 77.6], [78.0, 83.74], [85.0, 86.34], [88.0, 88.38], [89.0, 89.65], [92.0, 91.66]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.83, 77.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.74, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 65.98], ["fart", 7.99], ["radio", 4.37]], null, null, null, null, null, null, null, [["speech", 34.68], ["radio", 26.95], ["sidetone", 6.02]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.9, 6.15, 2.27, 1.49, 0.97, 0.57, 0.99, 0.46, 1.94, 2.28, 0.49, 0.66, 0.16, 1.92, 1.43, 0.25, 1.04, 1.6, 5.74, 1.34, 0.38, 0.65, -0.34]} \ No newline at end of file diff --git a/annotations_filtered/fHmesxUDVz4_filtered.json b/annotations_filtered/fHmesxUDVz4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e383464edce631c708813877b33261caafabfe1 --- /dev/null +++ b/annotations_filtered/fHmesxUDVz4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.92], [16.0, 17.12], [37.0, 37.44], [40.0, 40.73], [42.0, 42.55], [45.0, 46.58], [47.0, 53.11], [54.0, 54.55], [56.0, 56.67], [60.0, 62.21], [63.0, 63.56], [67.0, 67.26], [69.0, 69.5], [71.0, 72.6]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 0.0, 0.0, 33.69, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["laughter", 9.42], ["crying, sobbing", 9.29], ["baby laughter", 9.16]], null, null, null, null], "duration": [-0.08, 1.12, 0.44, 0.73, 0.55, 1.58, 6.11, 0.55, 0.67, 2.21, 0.56, 0.26, 0.5, 1.6]} \ No newline at end of file diff --git a/annotations_filtered/fIT7VMVju0A_filtered.json b/annotations_filtered/fIT7VMVju0A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b667e8dc7efcd2b057eac71b20d0d429470f24f --- /dev/null +++ b/annotations_filtered/fIT7VMVju0A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 26.2], [35.0, 36.41], [38.0, 46.63], [48.0, 51.16], [52.0, 71.74], [72.0, 73.28], [76.0, 76.91], [78.0, 78.24], [79.0, 78.88], [80.0, 82.0], [83.0, 82.9], [83.0, 93.53], [94.0, 95.0], [97.0, 99.06], [100.0, 101.83], [102.0, 103.32], [115.0, 116.06], [118.0, 122.55], [124.0, 128.44], [129.0, 143.01], [147.0, 155.55], [156.0, 166.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [72.6, 0.0, 86.64, 78.04, 34.82, 0.0, 0.0, 0.0, 0.0, 64.86, 0.0, 49.4, 0.0, 96.89, 0.0, 0.0, 0.0, 88.1, 95.51, 30.87, 36.31, 31.4], "audiomae_on_audioset": [null, null, null, null, [["music", 47.0], ["hum", 19.4], ["throbbing", 8.02]], null, null, null, null, null, null, [["speech", 73.71], ["inside, small room", 3.11], ["hum", 2.64]], null, null, null, null, null, null, null, [["speech", 81.15], ["breaking", 4.14], ["music", 2.95]], [["music", 51.35], ["didgeridoo", 13.63], ["musical instrument", 4.19]], [["music", 48.46], ["sheep", 10.36], ["bleat", 9.3]]], "duration": [5.2, 1.41, 8.63, 3.16, 19.74, 1.28, 0.91, 0.24, -0.12, 2.0, -0.1, 10.53, 1.0, 2.06, 1.83, 1.32, 1.06, 4.55, 4.44, 14.01, 8.55, 10.82]} \ No newline at end of file diff --git a/annotations_filtered/fIfQbocblZc_filtered.json b/annotations_filtered/fIfQbocblZc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..725bec80814ab09a4ef3d15345be2f6dbd167a81 --- /dev/null +++ b/annotations_filtered/fIfQbocblZc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.63], [20.0, 20.49], [21.0, 24.0], [26.0, 26.67], [29.0, 30.13], [31.0, 34.62], [35.0, 36.88], [39.0, 50.95], [56.0, 55.61], [56.0, 58.82], [59.0, 65.87], [67.0, 114.57], [115.0, 131.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 79.94, 0.0, 0.0, 85.17, 0.0, 74.44, 0.0, 81.17, 73.51, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.63, 0.49, 3.0, 0.67, 1.13, 3.62, 1.88, 11.95, -0.39, 2.82, 6.87, 47.57, 16.79]} \ No newline at end of file diff --git a/annotations_filtered/fIh6HDeXKGY_filtered.json b/annotations_filtered/fIh6HDeXKGY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..095f82dd7d7b4bdbc3e053d2df916d6efb04eb4e --- /dev/null +++ b/annotations_filtered/fIh6HDeXKGY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 11.84], [15.0, 15.67], [16.0, 17.61], [19.0, 20.09], [22.0, 22.0], [24.0, 24.14], [26.0, 26.79], [33.0, 34.03], [36.0, 37.1], [39.0, 39.99], [42.0, 47.58], [50.0, 50.31], [52.0, 52.49], [54.0, 54.51], [56.0, 55.73], [59.0, 59.58], [61.0, 61.05], [66.0, 66.82], [70.0, 74.46], [79.0, 79.29], [109.0, 109.56], [111.0, 115.11], [116.0, 116.46], [120.0, 120.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.66, 0.0, 0.0, 86.09, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["eruption", 15.77], ["explosion", 15.02], ["noise", 13.18]], null, null, null, null, null, null, null, [["noise", 9.69], ["music", 7.71], ["eruption", 7.53]], null, null, null, null, null], "duration": [-0.16, 0.67, 1.61, 1.09, 0.0, 0.14, 0.79, 1.03, 1.1, 0.99, 5.58, 0.31, 0.49, 0.51, -0.27, 0.58, 0.05, 0.82, 4.46, 0.29, 0.56, 4.11, 0.46, 0.26]} \ No newline at end of file diff --git a/annotations_filtered/fImqZCIebuw_filtered.json b/annotations_filtered/fImqZCIebuw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04b4a1fd91f9ca5fce7afee647b9cec0fd96bdde --- /dev/null +++ b/annotations_filtered/fImqZCIebuw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.04], [14.0, 39.43], [41.0, 42.13]], "keep_status": [false, true, false], "silence_prob": [58.38, 33.14, 0.0], "audiomae_on_audioset": [null, [["music", 51.43], ["hum", 8.14], ["drum machine", 7.96]], null], "duration": [2.04, 25.43, 1.13]} \ No newline at end of file diff --git a/annotations_filtered/fJBrWMxc_P4_filtered.json b/annotations_filtered/fJBrWMxc_P4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d79a6fd4424d976133484bfec51a1773f2ed24b --- /dev/null +++ b/annotations_filtered/fJBrWMxc_P4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.56], [8.0, 25.29], [28.0, 29.44], [32.0, 32.0], [35.0, 36.96], [38.0, 42.63], [46.0, 48.46], [51.0, 61.25], [64.0, 68.45], [71.0, 71.2], [71.0, 74.39], [76.0, 77.38]], "keep_status": [false, true, false, false, false, false, true, false, true, false, true, false], "silence_prob": [0.0, 39.01, 0.0, 0.0, 0.0, 36.99, 38.83, 37.58, 40.57, 0.0, 39.75, 0.0], "audiomae_on_audioset": [null, [["music", 32.69], ["singing bowl", 16.48], ["hum", 15.95]], null, null, null, [["music", 70.04], ["speech", 7.96], ["singing bowl", 3.54]], [["music", 50.11], ["singing bowl", 12.29], ["ambient music", 5.46]], [["music", 54.34], ["speech", 13.06], ["singing bowl", 3.02]], [["music", 51.23], ["effects unit", 7.16], ["hum", 5.51]], null, [["music", 47.45], ["hum", 12.06], ["throbbing", 6.33]], null], "duration": [1.56, 17.29, 1.44, 0.0, 1.96, 4.63, 2.46, 10.25, 4.45, 0.2, 3.39, 1.38]} \ No newline at end of file diff --git a/annotations_filtered/fJV0KtMZ7x8_filtered.json b/annotations_filtered/fJV0KtMZ7x8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9b4cbb9f3a2661a3a2dc30a66098b97b85a6d89 --- /dev/null +++ b/annotations_filtered/fJV0KtMZ7x8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.01], [15.0, 16.24], [17.0, 18.08], [18.0, 18.47], [19.0, 24.93], [26.0, 25.83], [26.0, 26.2], [27.0, 27.33], [35.0, 35.75], [37.0, 37.59], [39.0, 40.85], [41.0, 42.16], [53.0, 53.0], [55.0, 58.43], [79.0, 79.66], [92.0, 92.2], [95.0, 96.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [99.97, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.52, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 16.35], ["moo", 15.58], ["cattle, bovinae", 9.85]], null, null, null], "duration": [5.01, 1.24, 1.08, 0.47, 5.93, -0.17, 0.2, 0.33, 0.75, 0.59, 1.85, 1.16, 0.0, 3.43, 0.66, 0.2, 1.4]} \ No newline at end of file diff --git a/annotations_filtered/fJlJX4Rj_WU_filtered.json b/annotations_filtered/fJlJX4Rj_WU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f7158b2a30fbbef9411cfe3761e1a6ca4a24cee --- /dev/null +++ b/annotations_filtered/fJlJX4Rj_WU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.72], [12.0, 12.82], [14.0, 15.03], [16.0, 16.14], [18.0, 19.23], [23.0, 22.84], [25.0, 26.54], [28.0, 28.07], [28.0, 28.95], [29.0, 29.07], [33.0, 48.69], [51.0, 57.52], [60.0, 60.34], [61.0, 70.51], [76.0, 76.32], [81.0, 81.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.16, 30.63, 0.0, 30.04, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 61.02], ["quack", 24.13], ["boing", 5.88]], [["music", 56.39], ["didgeridoo", 5.85], ["boing", 5.69]], null, [["music", 19.55], ["siren", 16.69], ["emergency vehicle", 13.44]], null, null], "duration": [0.72, 0.82, 1.03, 0.14, 1.23, -0.16, 1.54, 0.07, 0.95, 0.07, 15.69, 6.52, 0.34, 9.51, 0.32, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/fKGjSXtCou4_filtered.json b/annotations_filtered/fKGjSXtCou4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..301da6ecfc9bb51ca72d26ceac25daae71e0ed69 --- /dev/null +++ b/annotations_filtered/fKGjSXtCou4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.55], [5.0, 6.56], [7.0, 7.42], [9.0, 9.36], [11.0, 16.68], [19.0, 21.81], [22.0, 22.23], [22.0, 22.47], [22.0, 25.03], [26.0, 31.04], [34.0, 39.04], [40.0, 59.44], [59.0, 59.51], [60.0, 60.84], [61.0, 61.15], [61.0, 64.22], [65.0, 76.52], [79.0, 80.72], [82.0, 89.48], [91.0, 94.83], [99.0, 100.82], [102.0, 102.91], [105.0, 106.08], [111.0, 121.83]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, true, false, true, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.82, 31.79, 0.0, 0.0, 29.74, 63.74, 67.76, 47.12, 0.0, 0.0, 0.0, 48.69, 31.48, 0.0, 28.98, 36.31, 0.0, 0.0, 0.0, 28.68], "audiomae_on_audioset": [null, null, null, null, [["didgeridoo", 58.49], ["music", 30.43], ["electronic music", 2.25]], [["music", 28.12], ["whale vocalization", 18.84], ["didgeridoo", 11.14]], null, null, [["didgeridoo", 45.21], ["whale vocalization", 13.65], ["speech", 6.66]], null, null, [["music", 60.36], ["hum", 8.74], ["mains hum", 2.05]], null, null, null, [["music", 70.75], ["theremin", 14.19], ["shofar", 2.3]], [["music", 32.7], ["didgeridoo", 12.03], ["hum", 11.47]], null, [["music", 48.87], ["hum", 10.75], ["mains hum", 7.09]], [["music", 49.84], ["didgeridoo", 15.34], ["theremin", 4.52]], null, null, null, [["speech", 40.09], ["music", 12.13], ["explosion", 10.2]]], "duration": [0.55, 1.56, 0.42, 0.36, 5.68, 2.81, 0.23, 0.47, 3.03, 5.04, 5.04, 19.44, 0.51, 0.84, 0.15, 3.22, 11.52, 1.72, 7.48, 3.83, 1.82, 0.91, 1.08, 10.83]} \ No newline at end of file diff --git a/annotations_filtered/fKaiHVTL5nQ_filtered.json b/annotations_filtered/fKaiHVTL5nQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cab9717ec2863bd04bb0c1db975cce23034b6a4 --- /dev/null +++ b/annotations_filtered/fKaiHVTL5nQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 62.02], [64.0, 65.08], [67.0, 78.88]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 32.26], "audiomae_on_audioset": [null, null, [["throbbing", 35.51], ["mains hum", 18.72], ["hum", 17.4]]], "duration": [56.02, 1.08, 11.88]} \ No newline at end of file diff --git a/annotations_filtered/fKeNgrRRoN8_filtered.json b/annotations_filtered/fKeNgrRRoN8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1dc6bae160be2e5cb5e32a75eac4d57486fbbe7c --- /dev/null +++ b/annotations_filtered/fKeNgrRRoN8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.3], [9.0, 10.91], [13.0, 13.02], [15.0, 33.76], [35.0, 53.28]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.12, 30.73], "audiomae_on_audioset": [null, null, null, [["music", 46.12], ["throbbing", 32.73], ["hum", 7.54]], [["music", 73.87], ["throbbing", 8.86], ["hum", 4.82]]], "duration": [1.3, 1.91, 0.02, 18.76, 18.28]} \ No newline at end of file diff --git a/annotations_filtered/fKncYRJQRC8_filtered.json b/annotations_filtered/fKncYRJQRC8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c97a65aa82a5d787b09ad54d6e1a9ea5083f382 --- /dev/null +++ b/annotations_filtered/fKncYRJQRC8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.94], [12.0, 13.14], [13.0, 13.59], [14.0, 14.18], [15.0, 15.9], [17.0, 16.75], [17.0, 17.34], [18.0, 19.06], [19.0, 19.6], [22.0, 23.23], [36.0, 35.94], [42.0, 42.79], [44.0, 44.52], [48.0, 48.63], [52.0, 54.08], [64.0, 64.79], [65.0, 66.7], [72.0, 71.88], [74.0, 73.75], [74.0, 74.95], [77.0, 88.2], [92.0, 93.21], [97.0, 97.98], [98.0, 98.81], [99.0, 100.7], [102.0, 101.78], [103.0, 103.28], [105.0, 105.71], [112.0, 114.94], [116.0, 116.14], [120.0, 120.39], [124.0, 124.11], [126.0, 127.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.15, 0.0, 0.0, 0.0, 0.0, 0.0, 35.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.62, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["grunt", 18.57], ["speech", 13.99], ["hum", 12.42]], null, null, null, null, null, [["speech", 50.46], ["sidetone", 13.25], ["hum", 7.16]], null, null, null, null, null, null, null, [["speech", 65.42], ["wood", 4.6], ["vehicle", 2.41]], null, null, null, null], "duration": [1.94, 1.14, 0.59, 0.18, 0.9, -0.25, 0.34, 1.06, 0.6, 1.23, -0.06, 0.79, 0.52, 0.63, 2.08, 0.79, 1.7, -0.12, -0.25, 0.95, 11.2, 1.21, 0.98, 0.81, 1.7, -0.22, 0.28, 0.71, 2.94, 0.14, 0.39, 0.11, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/fKoYXxN6x98_filtered.json b/annotations_filtered/fKoYXxN6x98_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7017a27a874efef8968da7b34d2404fb54ea7fd --- /dev/null +++ b/annotations_filtered/fKoYXxN6x98_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.94], [8.0, 9.66], [11.0, 11.79], [14.0, 15.21], [21.0, 22.15], [29.0, 29.46], [30.0, 30.74], [33.0, 33.35], [39.0, 41.32], [42.0, 47.16], [55.0, 57.72], [59.0, 108.23], [109.0, 110.34], [111.0, 129.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 32.09, 35.75, 0.0, 0.0, 53.4], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 58.03], ["music", 20.08], ["sidetone", 4.51]], [["music", 40.51], ["speech", 31.75], ["hum", 7.15]], null, null, null], "duration": [-0.06, 1.66, 0.79, 1.21, 1.15, 0.46, 0.74, 0.35, 2.32, 5.16, 2.72, 49.23, 1.34, 18.27]} \ No newline at end of file diff --git a/annotations_filtered/fKpKz3dysY0_filtered.json b/annotations_filtered/fKpKz3dysY0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4bfde46f16cf0153628b184ed29e74e870467a30 --- /dev/null +++ b/annotations_filtered/fKpKz3dysY0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.53], [11.0, 20.01], [21.0, 26.94], [33.0, 39.43], [47.0, 47.43], [57.0, 57.84], [67.0, 67.85], [71.0, 71.51], [73.0, 89.33], [92.0, 96.65], [100.0, 101.76], [105.0, 116.68]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [40.33, 43.38, 66.15, 37.49, 0.0, 0.0, 0.0, 0.0, 28.38, 33.08, 0.0, 29.49], "audiomae_on_audioset": [[["music", 54.65], ["ambient music", 4.27], ["musical instrument", 3.55]], [["hum", 36.31], ["speech", 22.1], ["mains hum", 13.92]], null, [["speech", 56.96], ["music", 18.95], ["hum", 6.01]], null, null, null, null, [["music", 50.46], ["speech", 11.82], ["hum", 7.89]], [["mains hum", 27.35], ["hum", 24.83], ["music", 19.31]], null, [["music", 56.0], ["buzz", 5.52], ["hum", 5.28]]], "duration": [2.53, 9.01, 5.94, 6.43, 0.43, 0.84, 0.85, 0.51, 16.33, 4.65, 1.76, 11.68]} \ No newline at end of file diff --git a/annotations_filtered/fL4j9mZfUdg_filtered.json b/annotations_filtered/fL4j9mZfUdg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5534e6b98672b4e7cfa4a81a02ad8eead25922db --- /dev/null +++ b/annotations_filtered/fL4j9mZfUdg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 55.32], [59.0, 93.14], [95.0, 127.11]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [30.32, 34.14, 32.11]} \ No newline at end of file diff --git a/annotations_filtered/fLWjUBClszw_filtered.json b/annotations_filtered/fLWjUBClszw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc581d7eddf0ec77e0e33feb55f64d3d82b990d1 --- /dev/null +++ b/annotations_filtered/fLWjUBClszw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.43], [5.0, 5.44], [6.0, 19.33], [20.0, 23.09], [26.0, 84.2], [86.0, 87.2], [89.0, 92.21], [96.0, 97.53], [99.0, 99.54], [102.0, 105.73], [107.0, 107.08], [108.0, 109.9], [113.0, 112.89], [118.0, 126.72], [130.0, 172.4], [175.0, 186.9]], "keep_status": [false, false, true, true, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.66, 29.96, 0.0, 0.0, 47.12, 0.0, 0.0, 35.07, 0.0, 0.0, 0.0, 36.32, 0.0, 34.64], "audiomae_on_audioset": [null, null, [["fart", 27.39], ["speech", 14.73], ["music", 10.8]], [["vehicle", 42.26], ["race car, auto racing", 10.21], ["car", 8.9]], null, null, [["fart", 22.58], ["hiccup", 5.71], ["didgeridoo", 5.55]], null, null, [["hum", 27.13], ["mains hum", 7.93], ["music", 7.46]], null, null, null, [["music", 53.95], ["didgeridoo", 22.25], ["musical instrument", 3.12]], null, [["music", 70.39], ["soundtrack music", 3.63], ["scary music", 3.26]]], "duration": [1.43, 0.44, 13.33, 3.09, 58.2, 1.2, 3.21, 1.53, 0.54, 3.73, 0.08, 1.9, -0.11, 8.72, 42.4, 11.9]} \ No newline at end of file diff --git a/annotations_filtered/fLpmswBKVN4_filtered.json b/annotations_filtered/fLpmswBKVN4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3d35b3c69a6772526cdc3e14a0cc0ee321f3bb2 --- /dev/null +++ b/annotations_filtered/fLpmswBKVN4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.82], [15.0, 16.14], [30.0, 30.45], [40.0, 43.06]], "keep_status": [false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 40.14], "audiomae_on_audioset": [null, null, null, [["speech", 27.81], ["chicken, rooster", 9.73], ["fowl", 7.75]]], "duration": [1.82, 1.14, 0.45, 3.06]} \ No newline at end of file diff --git a/annotations_filtered/fLswSc81mw8_filtered.json b/annotations_filtered/fLswSc81mw8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bf877ccba06f256464fe879e1b80db4fa002bfd --- /dev/null +++ b/annotations_filtered/fLswSc81mw8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 34.23], [36.0, 46.52], [47.0, 59.31], [60.0, 63.48], [64.0, 67.41], [68.0, 77.03], [79.0, 79.64], [84.0, 85.11], [90.0, 92.52], [97.0, 100.94], [102.0, 104.87], [106.0, 107.4], [114.0, 113.88], [115.0, 124.95]], "keep_status": [true, false, false, false, false, false, false, false, false, true, true, false, false, true], "silence_prob": [31.26, 30.58, 36.58, 49.64, 85.54, 46.64, 0.0, 0.0, 97.54, 32.1, 33.65, 0.0, 0.0, 41.95], "audiomae_on_audioset": [[["music", 31.39], ["grunt", 21.09], ["burping, eructation", 15.74]], [["music", 66.69], ["speech", 5.46], ["boing", 3.03]], [["music", 75.38], ["speech", 5.04], ["buzz", 1.91]], [["music", 65.52], ["speech", 3.52], ["electronic music", 2.32]], null, [["music", 57.16], ["music for children", 12.17], ["boing", 10.51]], null, null, null, [["music", 23.27], ["fly, housefly", 17.91], ["mosquito", 10.5]], [["speech", 19.84], ["fart", 15.5], ["hum", 7.0]], null, null, [["music", 62.46], ["speech", 2.78], ["musical instrument", 2.49]]], "duration": [9.23, 10.52, 12.31, 3.48, 3.41, 9.03, 0.64, 1.11, 2.52, 3.94, 2.87, 1.4, -0.12, 9.95]} \ No newline at end of file diff --git a/annotations_filtered/fLvEcBoOpnQ_filtered.json b/annotations_filtered/fLvEcBoOpnQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f92c1e44fc35b17be9282ee11835a2340a04ea83 --- /dev/null +++ b/annotations_filtered/fLvEcBoOpnQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.32], [10.0, 15.89], [17.0, 39.92], [42.0, 43.65], [45.0, 45.44], [46.0, 49.76], [51.0, 51.02], [55.0, 55.17]], "keep_status": [false, true, true, false, false, true, false, false], "silence_prob": [0.0, 31.21, 30.63, 0.0, 0.0, 31.03, 0.0, 0.0], "audiomae_on_audioset": [null, [["insect", 20.73], ["fly, housefly", 18.54], ["speech", 13.6]], [["speech", 26.44], ["music", 21.49], ["vehicle", 5.8]], null, null, [["music", 38.72], ["speech", 18.99], ["buzz", 4.8]], null, null], "duration": [1.32, 5.89, 22.92, 1.65, 0.44, 3.76, 0.02, 0.17]} \ No newline at end of file diff --git a/annotations_filtered/fM3FUot8TCY_filtered.json b/annotations_filtered/fM3FUot8TCY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1710394383eac4d6baa264ac7ea6b0b97cc7be0d --- /dev/null +++ b/annotations_filtered/fM3FUot8TCY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.7], [7.0, 7.94], [10.0, 10.5], [14.0, 15.89], [36.0, 37.44], [39.0, 38.97], [39.0, 41.64], [43.0, 48.79], [51.0, 51.51], [56.0, 57.13], [60.0, 60.3], [87.0, 87.88], [93.0, 93.41], [110.0, 110.76], [113.0, 121.27]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.14, 35.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.15], "audiomae_on_audioset": [null, null, null, null, null, null, [["fly, housefly", 41.02], ["bee, wasp, etc.", 19.33], ["insect", 18.28]], [["music", 51.08], ["musical instrument", 8.02], ["theremin", 4.06]], null, null, null, null, null, null, [["vehicle", 42.79], ["speech", 13.39], ["car", 13.37]]], "duration": [1.7, 0.94, 0.5, 1.89, 1.44, -0.03, 2.64, 5.79, 0.51, 1.13, 0.3, 0.88, 0.41, 0.76, 8.27]} \ No newline at end of file diff --git a/annotations_filtered/fMTn4M2qfNI_filtered.json b/annotations_filtered/fMTn4M2qfNI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99e830d473e2d9d4de39e2ad053e4276fcc5affd --- /dev/null +++ b/annotations_filtered/fMTn4M2qfNI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.59], [7.0, 7.8], [9.0, 10.4], [12.0, 12.82], [14.0, 15.03], [16.0, 16.97], [18.0, 20.93], [23.0, 24.06], [29.0, 29.44], [41.0, 44.41], [47.0, 47.73], [49.0, 49.35], [73.0, 73.43]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.61, 0.0, 0.0, 32.67, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 37.74], ["cattle, bovinae", 6.08], ["whale vocalization", 4.64]], null, null, [["sound effect", 17.56], ["speech", 16.83], ["livestock, farm animals, working animals", 14.04]], null, null, null], "duration": [1.59, 0.8, 1.4, 0.82, 1.03, 0.97, 2.93, 1.06, 0.44, 3.41, 0.73, 0.35, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/fMxA90YU2Jw_filtered.json b/annotations_filtered/fMxA90YU2Jw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0b1378a235bc9e08af59188cf1d67fbf86a94b2 --- /dev/null +++ b/annotations_filtered/fMxA90YU2Jw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.83], [6.0, 7.72], [8.0, 8.51], [13.0, 14.23], [15.0, 15.33], [16.0, 18.42], [20.0, 24.04], [43.0, 44.78], [62.0, 63.22], [64.0, 64.39], [70.0, 71.27], [72.0, 74.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.71, 0.0, 0.0, 0.0, 0.0, 55.18], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.83, 1.72, 0.51, 1.23, 0.33, 2.42, 4.04, 1.78, 1.22, 0.39, 1.27, 2.63]} \ No newline at end of file diff --git a/annotations_filtered/fN2AXsF-kwc_filtered.json b/annotations_filtered/fN2AXsF-kwc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa0432fb480639e171352ca1d6fff21e9c5cca82 --- /dev/null +++ b/annotations_filtered/fN2AXsF-kwc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.56], [21.0, 22.54], [31.0, 33.62], [34.0, 36.64], [41.0, 42.2], [46.0, 46.43], [55.0, 71.86], [74.0, 83.54], [94.0, 94.49], [96.0, 96.57], [98.0, 99.66], [103.0, 103.18], [105.0, 105.53], [107.0, 108.31]], "keep_status": [false, false, false, true, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 57.72, 45.27, 0.0, 0.0, 30.19, 32.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["sidetone", 22.22], ["music", 21.48], ["hum", 19.9]], null, null, [["livestock, farm animals, working animals", 21.25], ["moo", 20.62], ["cattle, bovinae", 18.61]], [["music", 46.92], ["speech", 7.35], ["vehicle", 7.01]], null, null, null, null, null, null], "duration": [0.56, 1.54, 2.62, 2.64, 1.2, 0.43, 16.86, 9.54, 0.49, 0.57, 1.66, 0.18, 0.53, 1.31]} \ No newline at end of file diff --git a/annotations_filtered/fNMtHosai08_filtered.json b/annotations_filtered/fNMtHosai08_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8760998625aadf5f3839fb699cc37ff8ac24e2f --- /dev/null +++ b/annotations_filtered/fNMtHosai08_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.24], [4.0, 4.36], [7.0, 13.61], [16.0, 17.02], [19.0, 19.87], [21.0, 21.64], [24.0, 24.81], [28.0, 28.16], [29.0, 29.73], [30.0, 30.99], [32.0, 32.61], [34.0, 34.11], [37.0, 37.45], [38.0, 39.7], [40.0, 40.8], [41.0, 42.55], [44.0, 45.67], [55.0, 56.54], [60.0, 60.44], [65.0, 64.86], [69.0, 71.71], [73.0, 74.92], [87.0, 86.83], [90.0, 92.26], [93.0, 93.9], [96.0, 97.14], [98.0, 102.07]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 38.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.76, 0.0, 0.0, 68.93, 0.0, 0.0, 35.73], "audiomae_on_audioset": [null, null, [["groan", 29.69], ["speech", 14.97], ["rumble", 13.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 70.9], ["sidetone", 4.66], ["music", 3.88]]], "duration": [0.24, 0.36, 6.61, 1.02, 0.87, 0.64, 0.81, 0.16, 0.73, 0.99, 0.61, 0.11, 0.45, 1.7, 0.8, 1.55, 1.67, 1.54, 0.44, -0.14, 2.71, 1.92, -0.17, 2.26, 0.9, 1.14, 4.07]} \ No newline at end of file diff --git a/annotations_filtered/fNjMYPeG8IU_filtered.json b/annotations_filtered/fNjMYPeG8IU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a33c37346176589e94bf01fb5298342c0d4419ce --- /dev/null +++ b/annotations_filtered/fNjMYPeG8IU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.2], [3.0, 3.75], [4.0, 11.13], [13.0, 19.43], [23.0, 26.27], [27.0, 40.64], [62.0, 63.76], [67.0, 66.88], [74.0, 77.03], [78.0, 80.69], [81.0, 82.49], [86.0, 87.02], [88.0, 88.11], [89.0, 89.78], [96.0, 97.53], [98.0, 98.95], [102.0, 103.0], [109.0, 109.54], [111.0, 111.67], [113.0, 116.36], [119.0, 121.68], [122.0, 121.71], [122.0, 121.74], [122.0, 121.9], [125.0, 125.91]], "keep_status": [false, false, true, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 48.78, 45.27, 47.94, 45.65, 0.0, 0.0, 44.23, 43.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.23, 41.76, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 47.86], ["musical instrument", 6.19], ["theremin", 6.11]], [["music", 20.5], ["cello", 17.9], ["bowed string instrument", 14.32]], [["music", 67.02], ["musical instrument", 2.24], ["hum", 2.03]], [["music", 61.79], ["musical instrument", 6.69], ["foghorn", 5.54]], null, null, [["insect", 17.55], ["fly, housefly", 16.32], ["speech", 14.49]], [["sidetone", 51.96], ["speech", 26.03], ["radio", 5.04]], null, null, null, null, null, null, null, null, null, null, [["speech", 67.59], ["animal", 3.3], ["music", 2.07]], null, null, null, null], "duration": [0.2, 0.75, 7.13, 6.43, 3.27, 13.64, 1.76, -0.12, 3.03, 2.69, 1.49, 1.02, 0.11, 0.78, 1.53, 0.95, 1.0, 0.54, 0.67, 3.36, 2.68, -0.29, -0.26, -0.1, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/fO8fKHbg4kw_filtered.json b/annotations_filtered/fO8fKHbg4kw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..14ebefc45f2d4270a38194f398deea18c773550e --- /dev/null +++ b/annotations_filtered/fO8fKHbg4kw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.06], [7.0, 12.55], [19.0, 18.84], [25.0, 29.42], [32.0, 32.85], [63.0, 64.3]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 30.67, 0.0, 29.89, 0.0, 0.0], "audiomae_on_audioset": [null, [["applause", 31.03], ["speech", 29.12], ["crowd", 15.94]], null, [["speech", 35.84], ["music", 10.11], ["crowd", 8.08]], null, null], "duration": [1.06, 5.55, -0.16, 4.42, 0.85, 1.3]} \ No newline at end of file diff --git a/annotations_filtered/fOONIlhXFh4_filtered.json b/annotations_filtered/fOONIlhXFh4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd484b1741fbff0caab83c543d14270d9bbc9f7d --- /dev/null +++ b/annotations_filtered/fOONIlhXFh4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.43], [10.0, 10.83], [13.0, 13.96], [16.0, 17.95], [22.0, 23.53], [25.0, 26.64], [28.0, 32.85], [35.0, 36.24], [38.0, 39.68], [41.0, 41.93], [42.0, 42.48], [44.0, 45.37], [46.0, 48.71], [52.0, 53.65], [59.0, 60.79], [68.0, 67.9], [68.0, 68.99], [69.0, 69.58], [70.0, 70.77], [74.0, 74.48], [76.0, 76.98], [79.0, 79.91], [87.0, 88.37], [91.0, 91.66], [97.0, 97.8], [109.0, 109.44], [110.0, 110.94], [113.0, 114.49], [117.0, 117.02], [119.0, 119.53], [121.0, 122.91], [123.0, 127.89], [133.0, 133.54], [134.0, 134.7], [136.0, 136.71], [137.0, 138.92], [141.0, 154.53]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.06, 0.0, 0.0, 0.0, 0.0, 0.0, 42.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.23, 0.0, 0.0, 0.0, 0.0, 41.42], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 13.46], ["mains hum", 12.73], ["speech", 9.11]], null, null, null, null, null, [["hum", 22.82], ["throbbing", 17.18], ["rumble", 16.88]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 33.08], ["mains hum", 13.57], ["sonar", 11.64]], null, null, null, null, [["rumble", 60.89], ["hum", 8.65], ["mains hum", 4.11]]], "duration": [1.43, 0.83, 0.96, 1.95, 1.53, 1.64, 4.85, 1.24, 1.68, 0.93, 0.48, 1.37, 2.71, 1.65, 1.79, -0.1, 0.99, 0.58, 0.77, 0.48, 0.98, 0.91, 1.37, 0.66, 0.8, 0.44, 0.94, 1.49, 0.02, 0.53, 1.91, 4.89, 0.54, 0.7, 0.71, 1.92, 13.53]} \ No newline at end of file diff --git a/annotations_filtered/fOSuCsgJ26M_filtered.json b/annotations_filtered/fOSuCsgJ26M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..491693cd274e67496b2f5246481560d749034de0 --- /dev/null +++ b/annotations_filtered/fOSuCsgJ26M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 55.8], [58.0, 68.22], [70.0, 85.16], [87.0, 94.88], [96.0, 104.43], [105.0, 106.83], [108.0, 108.84]], "keep_status": [false, false, true, false, true, false, false], "silence_prob": [76.7, 72.31, 35.52, 70.3, 43.18, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 18.58], ["speech", 14.73], ["explosion", 13.18]], null, [["speech", 33.43], ["music", 20.46], ["didgeridoo", 9.64]], null, null], "duration": [6.8, 10.22, 15.16, 7.88, 8.43, 1.83, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/fOv_N9k5im4_filtered.json b/annotations_filtered/fOv_N9k5im4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4cc7c7808d896afddd4b8ec2ccfe89cf37066c6 --- /dev/null +++ b/annotations_filtered/fOv_N9k5im4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.97], [29.0, 34.03], [35.0, 36.85], [39.0, 38.82], [44.0, 44.37], [46.0, 47.07], [49.0, 50.6], [56.0, 58.24], [62.0, 68.96], [73.0, 73.94], [75.0, 81.9], [85.0, 98.24], [99.0, 101.76], [104.0, 105.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 95.09, 0.0, 0.0, 0.0, 0.0, 0.0, 87.55, 78.38, 0.0, 83.52, 45.33, 80.29, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 44.51], ["cello", 16.48], ["theremin", 9.99]], null, null], "duration": [0.97, 5.03, 1.85, -0.18, 0.37, 1.07, 1.6, 2.24, 6.96, 0.94, 6.9, 13.24, 2.76, 1.71]} \ No newline at end of file diff --git a/annotations_filtered/fPEGcx4MFHI_filtered.json b/annotations_filtered/fPEGcx4MFHI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3a1049a96065bed641a5949ff66565654d816e1 --- /dev/null +++ b/annotations_filtered/fPEGcx4MFHI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.51], [17.0, 17.95], [20.0, 20.53], [29.0, 30.59], [32.0, 84.64], [85.0, 109.04], [110.0, 110.49]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 38.94, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 40.08], ["hum", 24.21], ["mains hum", 16.98]], null], "duration": [1.51, 0.95, 0.53, 1.59, 52.64, 24.04, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/fPUJS7w4Dag_filtered.json b/annotations_filtered/fPUJS7w4Dag_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a876d14d34dcd1134a2f05991282a8c0d95e14b --- /dev/null +++ b/annotations_filtered/fPUJS7w4Dag_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.72], [8.0, 10.2], [14.0, 16.23], [18.0, 18.44], [19.0, 22.86], [25.0, 29.79], [30.0, 47.11], [49.0, 57.05], [59.0, 60.45], [62.0, 69.65], [71.0, 131.9], [132.0, 132.07]], "keep_status": [false, true, true, false, true, true, false, true, false, true, false, false], "silence_prob": [0.0, 38.27, 40.5, 0.0, 44.75, 46.64, 46.5, 41.22, 0.0, 37.38, 0.0, 0.0], "audiomae_on_audioset": [null, [["fowl", 27.54], ["goose", 15.74], ["honk", 15.63]], [["throbbing", 23.13], ["hum", 17.47], ["speech", 4.68]], null, [["hum", 43.18], ["throbbing", 14.14], ["mains hum", 6.95]], [["hum", 18.33], ["bee, wasp, etc.", 13.32], ["fly, housefly", 10.78]], [["speech", 52.99], ["hum", 20.46], ["throbbing", 6.23]], [["fly, housefly", 17.23], ["bee, wasp, etc.", 11.87], ["livestock, farm animals, working animals", 10.12]], null, [["fly, housefly", 18.95], ["hum", 10.96], ["insect", 8.8]], null, null], "duration": [1.72, 2.2, 2.23, 0.44, 3.86, 4.79, 17.11, 8.05, 1.45, 7.65, 60.9, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/fPcbyFeefXs_filtered.json b/annotations_filtered/fPcbyFeefXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..498cf21057354211af86f907a4d183fa3219e8b2 --- /dev/null +++ b/annotations_filtered/fPcbyFeefXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 32.91], [36.0, 37.54], [43.0, 43.9], [60.0, 59.73], [60.0, 61.1], [63.0, 63.29], [64.0, 64.18], [77.0, 77.57], [81.0, 80.82], [82.0, 84.72], [85.0, 86.14], [90.0, 90.59], [114.0, 114.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.76, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.91, 1.54, 0.9, -0.27, 1.1, 0.29, 0.18, 0.57, -0.18, 2.72, 1.14, 0.59, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/fPk-Dms1rJc_filtered.json b/annotations_filtered/fPk-Dms1rJc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..263d618a145e0958e6892797ad92d293310682f5 --- /dev/null +++ b/annotations_filtered/fPk-Dms1rJc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.4], [3.0, 3.1], [19.0, 19.65], [20.0, 21.86], [31.0, 32.9], [35.0, 81.63], [83.0, 83.2], [86.0, 90.83], [92.0, 107.97], [113.0, 113.39], [118.0, 118.72], [120.0, 120.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.28, 50.51, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.4, 0.1, 0.65, 1.86, 1.9, 46.63, 0.2, 4.83, 15.97, 0.39, 0.72, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/fQ09ePfYLpU_filtered.json b/annotations_filtered/fQ09ePfYLpU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01f32f41e0768f6414246232e39f3b9b9f023448 --- /dev/null +++ b/annotations_filtered/fQ09ePfYLpU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.82], [25.0, 25.95], [29.0, 29.54], [30.0, 30.5], [46.0, 60.44], [71.0, 72.66], [77.0, 78.11], [85.0, 86.91], [99.0, 100.04], [103.0, 103.28], [104.0, 105.97], [111.0, 111.74], [116.0, 117.78], [118.0, 118.96], [122.0, 122.66], [125.0, 125.14], [125.0, 127.13], [131.0, 135.3], [144.0, 144.22], [145.0, 146.85], [153.0, 155.95], [163.0, 164.47], [165.0, 166.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 33.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.79, 31.05, 0.0, 0.0, 29.82, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 72.26], ["livestock, farm animals, working animals", 10.85], ["cattle, bovinae", 2.47]], null, null, null, null, null, null, null, null, null, null, null, [["music", 32.48], ["mains hum", 10.14], ["buzz", 9.86]], [["hum", 31.77], ["mains hum", 25.91], ["music", 14.92]], null, null, [["music", 21.43], ["noise", 14.16], ["boing", 10.64]], null, null], "duration": [-0.18, 0.95, 0.54, 0.5, 14.44, 1.66, 1.11, 1.91, 1.04, 0.28, 1.97, 0.74, 1.78, 0.96, 0.66, 0.14, 2.13, 4.3, 0.22, 1.85, 2.95, 1.47, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/fQEGMNLTYPs_filtered.json b/annotations_filtered/fQEGMNLTYPs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4848754edccac86f9d82800fdf62f6045d1d5320 --- /dev/null +++ b/annotations_filtered/fQEGMNLTYPs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 126.94], [127.0, 129.78], [132.0, 137.1]], "keep_status": [false, true, true], "silence_prob": [0.0, 28.92, 31.64], "audiomae_on_audioset": [null, [["noise", 32.81], ["music", 17.66], ["didgeridoo", 10.81]], [["vehicle", 35.17], ["car", 10.01], ["speech", 5.54]]], "duration": [77.94, 2.78, 5.1]} \ No newline at end of file diff --git a/annotations_filtered/fQWMKUF7dvA_filtered.json b/annotations_filtered/fQWMKUF7dvA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9eac71f5041df06cdd16da42ee73cab129b2a237 --- /dev/null +++ b/annotations_filtered/fQWMKUF7dvA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.04], [4.0, 6.3], [7.0, 7.1], [7.0, 9.26], [10.0, 10.4], [11.0, 12.93], [14.0, 14.76], [17.0, 17.68], [19.0, 21.52], [30.0, 30.84], [41.0, 42.77], [44.0, 46.79], [48.0, 53.57], [67.0, 67.85], [72.0, 73.16], [77.0, 77.25], [78.0, 78.38], [81.0, 81.19], [82.0, 83.03], [86.0, 86.88], [88.0, 88.92], [90.0, 90.78], [96.0, 96.36], [98.0, 99.1], [100.0, 99.81], [100.0, 101.09], [107.0, 107.52], [108.0, 107.57], [110.0, 111.11], [112.0, 112.89], [115.0, 116.92], [118.0, 118.77], [122.0, 121.98]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 55.96, 0.0, 89.19, 0.0, 0.0, 0.0, 0.0, 31.74, 0.0, 0.0, 84.98, 30.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 44.54], ["owl", 5.69], ["hoot", 4.19]], null, null, null, [["whale vocalization", 72.81], ["speech", 14.06], ["sidetone", 1.57]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.04, 2.3, 0.1, 2.26, 0.4, 1.93, 0.76, 0.68, 2.52, 0.84, 1.77, 2.79, 5.57, 0.85, 1.16, 0.25, 0.38, 0.19, 1.03, 0.88, 0.92, 0.78, 0.36, 1.1, -0.19, 1.09, 0.52, -0.43, 1.11, 0.89, 1.92, 0.77, -0.02]} \ No newline at end of file diff --git a/annotations_filtered/fQy1yr_K_L4_filtered.json b/annotations_filtered/fQy1yr_K_L4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1ecf2ee095215472356a3603ace580dda91e337 --- /dev/null +++ b/annotations_filtered/fQy1yr_K_L4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.61], [8.0, 11.2], [13.0, 15.94], [18.0, 20.75], [23.0, 23.25], [24.0, 26.32], [31.0, 33.76], [35.0, 37.18], [38.0, 39.39], [41.0, 42.63], [44.0, 46.85], [50.0, 51.27], [52.0, 53.23], [55.0, 61.5], [63.0, 64.42], [65.0, 67.27], [68.0, 71.98], [75.0, 74.8], [75.0, 76.71], [78.0, 82.59], [83.0, 88.43], [89.0, 93.51], [94.0, 95.61], [96.0, 104.57], [106.0, 108.08], [109.0, 110.34], [113.0, 123.13], [125.0, 127.08], [128.0, 133.52], [135.0, 139.51], [141.0, 142.11], [143.0, 153.49], [155.0, 156.98], [158.0, 160.62], [162.0, 164.32], [167.0, 168.74], [170.0, 174.07], [175.0, 178.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.01, 100.0, 99.99, 100.0, 0.0, 98.36, 99.88, 99.95, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 91.3, 99.96, 0.0, 0.0, 99.36, 78.72, 98.27, 0.0, 77.36, 99.92, 0.0, 99.52, 99.78, 85.35, 86.45, 0.0, 98.66, 0.0, 99.36, 99.93, 0.0, 99.99, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.61, 3.2, 2.94, 2.75, 0.25, 2.32, 2.76, 2.18, 1.39, 1.63, 2.85, 1.27, 1.23, 6.5, 1.42, 2.27, 3.98, -0.2, 1.71, 4.59, 5.43, 4.51, 1.61, 8.57, 2.08, 1.34, 10.13, 2.08, 5.52, 4.51, 1.11, 10.49, 1.98, 2.62, 2.32, 1.74, 4.07, 3.95]} \ No newline at end of file diff --git a/annotations_filtered/fR0Sh0C6jFE_filtered.json b/annotations_filtered/fR0Sh0C6jFE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4018d21d5634d41faf441b433b373045e6fe11ae --- /dev/null +++ b/annotations_filtered/fR0Sh0C6jFE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 36.61], [37.0, 36.64], [37.0, 36.68], [37.0, 36.75]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.61, -0.36, -0.32, -0.25]} \ No newline at end of file diff --git a/annotations_filtered/fRF7InV7TfI_filtered.json b/annotations_filtered/fRF7InV7TfI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e6cd9b44438477cb8181a72642230b9a8b90eda --- /dev/null +++ b/annotations_filtered/fRF7InV7TfI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 25.37], [28.0, 28.41], [32.0, 33.29], [33.0, 33.35], [39.0, 40.09], [50.0, 51.61], [53.0, 54.13], [57.0, 57.81], [62.0, 64.35], [66.0, 66.36], [67.0, 68.99], [70.0, 70.93], [74.0, 80.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [33.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 0.0, 0.0, 0.0, 31.74], "audiomae_on_audioset": [[["cattle, bovinae", 28.33], ["livestock, farm animals, working animals", 26.6], ["moo", 18.98]], null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 22.45], ["livestock, farm animals, working animals", 17.5], ["music", 16.89]]], "duration": [2.37, 0.41, 1.29, 0.35, 1.09, 1.61, 1.13, 0.81, 2.35, 0.36, 1.99, 0.93, 6.89]} \ No newline at end of file diff --git a/annotations_filtered/fRNR8-FqzM4_filtered.json b/annotations_filtered/fRNR8-FqzM4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc5956a6e446c09349dac6702e0270054f8e573f --- /dev/null +++ b/annotations_filtered/fRNR8-FqzM4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 34.5], [38.0, 38.13], [65.0, 66.5], [72.0, 74.14], [85.0, 85.83], [87.0, 87.17], [92.0, 92.82], [101.0, 103.71], [116.0, 116.43]], "keep_status": [true, false, false, false, false, false, false, true, false], "silence_prob": [31.74, 0.0, 0.0, 31.99, 0.0, 0.0, 0.0, 35.67, 0.0], "audiomae_on_audioset": [[["hum", 26.26], ["theremin", 17.57], ["music", 17.3]], null, null, [["music", 80.4], ["guitar", 6.32], ["musical instrument", 4.4]], null, null, null, [["music", 52.61], ["effects unit", 10.0], ["distortion", 4.73]], null], "duration": [10.5, 0.13, 1.5, 2.14, 0.83, 0.17, 0.82, 2.71, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/fRQsuCJ-g4I_filtered.json b/annotations_filtered/fRQsuCJ-g4I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f1f02af66c4904d17d00392e823184b6c270a9f --- /dev/null +++ b/annotations_filtered/fRQsuCJ-g4I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.03], [8.0, 11.16], [13.0, 13.98], [16.0, 16.19], [20.0, 20.24], [23.0, 23.8], [25.0, 25.86], [29.0, 31.13], [32.0, 33.74], [35.0, 37.56], [39.0, 40.27], [41.0, 45.4], [49.0, 54.72], [55.0, 57.27], [58.0, 58.92], [61.0, 62.14], [64.0, 64.27], [67.0, 67.71], [69.0, 70.55], [73.0, 74.44], [75.0, 102.09], [103.0, 108.23], [110.0, 122.17], [123.0, 124.19], [125.0, 127.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 88.1, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 100.0, 98.73, 73.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.8, 100.0, 0.0, 99.93], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.03, 3.16, 0.98, 0.19, 0.24, 0.8, 0.86, 2.13, 1.74, 2.56, 1.27, 4.4, 5.72, 2.27, 0.92, 1.14, 0.27, 0.71, 1.55, 1.44, 27.09, 5.23, 12.17, 1.19, 2.13]} \ No newline at end of file diff --git a/annotations_filtered/fRhJPuDCXRk_filtered.json b/annotations_filtered/fRhJPuDCXRk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b73f458814b0da0ccb426a6806b7c88f138f791b --- /dev/null +++ b/annotations_filtered/fRhJPuDCXRk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.3], [5.0, 5.22], [9.0, 14.82], [19.0, 20.88], [22.0, 22.4], [23.0, 25.71], [26.0, 28.53], [33.0, 35.13], [37.0, 41.01], [42.0, 48.36], [49.0, 51.0], [53.0, 53.32], [55.0, 56.03], [57.0, 59.17], [59.0, 60.56], [63.0, 63.42], [65.0, 66.11], [79.0, 80.37], [91.0, 97.5], [101.0, 101.17], [102.0, 102.51], [113.0, 113.0], [115.0, 115.4], [115.0, 115.5], [116.0, 115.62], [121.0, 122.0], [128.0, 128.01], [133.0, 132.95], [136.0, 139.83]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 96.42, 0.0, 0.0, 74.6, 99.82, 99.4, 86.09, 31.02, 33.14, 0.0, 0.0, 32.4, 0.0, 0.0, 0.0, 0.0, 36.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 28.59], ["hum", 17.22], ["electric shaver, electric razor", 9.88]], [["music", 63.77], ["didgeridoo", 7.17], ["musical instrument", 2.95]], null, null, [["music", 67.4], ["throbbing", 2.79], ["guitar", 1.63]], null, null, null, null, [["music", 65.1], ["throbbing", 3.96], ["musical instrument", 2.29]], null, null, null, null, null, null, null, null, null, null], "duration": [1.3, 0.22, 5.82, 1.88, 0.4, 2.71, 2.53, 2.13, 4.01, 6.36, 2.0, 0.32, 1.03, 2.17, 1.56, 0.42, 1.11, 1.37, 6.5, 0.17, 0.51, 0.0, 0.4, 0.5, -0.38, 1.0, 0.01, -0.05, 3.83]} \ No newline at end of file diff --git a/annotations_filtered/fSNdh-3k6-g_filtered.json b/annotations_filtered/fSNdh-3k6-g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f34aea42edc612a8df1d64f72ced507c74ed8b9 --- /dev/null +++ b/annotations_filtered/fSNdh-3k6-g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.67], [8.0, 14.59], [17.0, 17.39], [19.0, 35.99], [37.0, 38.92], [40.0, 123.45]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 34.89, 0.0, 32.79, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 76.45], ["synthesizer", 3.54], ["musical instrument", 2.55]], null, [["music", 83.88], ["synthesizer", 2.63], ["musical instrument", 2.15]], null, null], "duration": [0.67, 6.59, 0.39, 16.99, 1.92, 83.45]} \ No newline at end of file diff --git a/annotations_filtered/fSOh-vTjWk4_filtered.json b/annotations_filtered/fSOh-vTjWk4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37dd8a45364b24a98288eada0e33134a532bc097 --- /dev/null +++ b/annotations_filtered/fSOh-vTjWk4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.52], [8.0, 8.58], [10.0, 13.0], [16.0, 18.0], [19.0, 20.6], [21.0, 26.59], [28.0, 30.23], [32.0, 34.55], [35.0, 39.28], [41.0, 41.62], [44.0, 44.81], [46.0, 65.35], [66.0, 67.88], [70.0, 70.14], [73.0, 74.17], [77.0, 77.25], [79.0, 95.71], [96.0, 98.56], [101.0, 106.42], [110.0, 110.47], [111.0, 114.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 83.16, 0.0, 70.02, 96.04, 98.19, 93.6, 0.0, 0.0, 66.88, 0.0, 0.0, 0.0, 0.0, 92.31, 93.6, 88.46, 0.0, 57.17], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.52, 0.58, 3.0, 2.0, 1.6, 5.59, 2.23, 2.55, 4.28, 0.62, 0.81, 19.35, 1.88, 0.14, 1.17, 0.25, 16.71, 2.56, 5.42, 0.47, 3.12]} \ No newline at end of file diff --git a/annotations_filtered/fSqvtspQonw_filtered.json b/annotations_filtered/fSqvtspQonw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..550c3a50fde33cb14e3b3c3e73e0f4341ddb631e --- /dev/null +++ b/annotations_filtered/fSqvtspQonw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [2.0, 4.02], [5.0, 6.91], [8.0, 8.29], [9.0, 10.67], [12.0, 12.92], [17.0, 18.87], [21.0, 21.64], [26.0, 27.36], [33.0, 35.87], [37.0, 38.18], [43.0, 43.78], [47.0, 46.89], [48.0, 49.6], [52.0, 53.81], [54.0, 54.78], [57.0, 58.73], [61.0, 62.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 76.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 2.02, 1.91, 0.29, 1.67, 0.92, 1.87, 0.64, 1.36, 2.87, 1.18, 0.78, -0.11, 1.6, 1.81, 0.78, 1.73, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/fSu5W0BtXG8_filtered.json b/annotations_filtered/fSu5W0BtXG8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f2d51ed5bbce80a82e01a4471d7a90f9100b264 --- /dev/null +++ b/annotations_filtered/fSu5W0BtXG8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.33], [15.0, 16.43], [17.0, 19.74], [21.0, 20.85], [22.0, 21.71], [22.0, 25.25], [26.0, 27.23], [27.0, 27.73], [29.0, 30.16], [37.0, 37.74], [38.0, 38.2], [38.0, 38.67], [47.0, 50.11], [50.0, 51.24], [52.0, 52.86], [54.0, 54.4], [55.0, 63.02], [68.0, 75.9], [76.0, 76.25], [77.0, 80.11], [80.0, 82.73], [83.0, 85.68], [87.0, 87.79], [89.0, 90.07], [91.0, 95.27], [97.0, 97.09], [98.0, 101.6], [102.0, 103.0], [104.0, 104.48], [105.0, 124.93], [126.0, 126.45], [127.0, 127.72], [129.0, 130.25], [132.0, 132.95], [136.0, 142.79]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [49.09, 0.0, 42.69, 0.0, 0.0, 60.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.31, 0.0, 0.0, 0.0, 60.14, 92.97, 0.0, 81.17, 71.29, 67.89, 0.0, 0.0, 40.06, 0.0, 43.56, 0.0, 0.0, 70.44, 0.0, 0.0, 0.0, 0.0, 43.58], "audiomae_on_audioset": [[["moo", 24.08], ["cattle, bovinae", 19.62], ["speech", 9.2]], null, [["music", 25.4], ["speech", 20.68], ["sound effect", 4.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["wail, moan", 50.47], ["crying, sobbing", 12.62], ["groan", 8.46]], null, [["fart", 35.44], ["cough", 14.0], ["ping", 4.08]], null, null, null, null, null, null, null, [["whistling", 62.93], ["speech", 9.28], ["whistle", 2.24]]], "duration": [5.33, 1.43, 2.74, -0.15, -0.29, 3.25, 1.23, 0.73, 1.16, 0.74, 0.2, 0.67, 3.11, 1.24, 0.86, 0.4, 8.02, 7.9, 0.25, 3.11, 2.73, 2.68, 0.79, 1.07, 4.27, 0.09, 3.6, 1.0, 0.48, 19.93, 0.45, 0.72, 1.25, 0.95, 6.79]} \ No newline at end of file diff --git a/annotations_filtered/fTIIhYZ_CzA_filtered.json b/annotations_filtered/fTIIhYZ_CzA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b34f27f4a4564afd371543d87392ff6a6b2dbdae --- /dev/null +++ b/annotations_filtered/fTIIhYZ_CzA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.77], [14.0, 25.03], [27.0, 27.6], [43.0, 53.03], [54.0, 59.43], [62.0, 65.1], [66.0, 67.81], [69.0, 68.89], [69.0, 70.36], [73.0, 82.07], [83.0, 85.35], [87.0, 88.32], [95.0, 100.8], [101.0, 104.31], [104.0, 114.37], [116.0, 132.6]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [40.99, 41.22, 0.0, 38.64, 36.6, 38.93, 0.0, 0.0, 0.0, 34.14, 31.92, 0.0, 31.16, 30.06, 31.54, 31.85], "audiomae_on_audioset": [[["heart sounds, heartbeat", 38.86], ["throbbing", 30.1], ["hum", 10.3]], [["hum", 54.25], ["mains hum", 16.09], ["throbbing", 12.92]], null, [["hum", 46.79], ["mains hum", 21.58], ["throbbing", 8.74]], [["speech", 70.82], ["sidetone", 8.4], ["hum", 7.31]], [["hum", 32.69], ["throbbing", 23.95], ["gong", 9.99]], null, null, null, [["hum", 55.86], ["mains hum", 16.49], ["throbbing", 15.61]], [["sidetone", 74.72], ["speech", 16.61], ["music", 1.51]], null, [["throbbing", 37.33], ["hum", 33.65], ["sidetone", 11.07]], [["speech", 24.81], ["hum", 19.09], ["throbbing", 15.71]], [["speech", 44.67], ["hum", 16.06], ["gong", 15.62]], [["hum", 37.52], ["sidetone", 21.93], ["mains hum", 20.06]]], "duration": [4.77, 11.03, 0.6, 10.03, 5.43, 3.1, 1.81, -0.11, 1.36, 9.07, 2.35, 1.32, 5.8, 3.31, 10.37, 16.6]} \ No newline at end of file diff --git a/annotations_filtered/fTMY9OkzTBA_filtered.json b/annotations_filtered/fTMY9OkzTBA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fcfc9bbe5d46e92c9a732a5087577f9dff1a6fae --- /dev/null +++ b/annotations_filtered/fTMY9OkzTBA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[64.0, 70.51], [71.0, 72.44], [74.0, 74.02], [77.0, 77.19], [81.0, 81.38], [81.0, 116.53], [118.0, 119.7], [121.0, 121.78]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [77.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [6.51, 1.44, 0.02, 0.19, 0.38, 35.53, 1.7, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/fU-ICxohwSc_filtered.json b/annotations_filtered/fU-ICxohwSc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d281921beffc674291306ffe49f2bc553ed19ee0 --- /dev/null +++ b/annotations_filtered/fU-ICxohwSc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.06], [5.0, 12.02], [14.0, 28.43], [29.0, 29.07], [30.0, 44.07], [45.0, 47.38], [49.0, 51.39], [53.0, 54.38], [55.0, 56.67], [58.0, 58.6], [61.0, 61.82], [64.0, 64.57], [67.0, 70.65], [72.0, 72.5], [74.0, 84.23], [86.0, 86.7], [88.0, 88.77], [91.0, 96.52]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [73.21, 53.72, 59.07, 0.0, 46.57, 51.99, 60.14, 0.0, 0.0, 0.0, 0.0, 0.0, 58.13, 0.0, 37.0, 0.0, 0.0, 30.84], "audiomae_on_audioset": [null, null, null, null, [["music", 32.42], ["hum", 14.19], ["synthesizer", 11.92]], null, null, null, null, null, null, null, null, null, [["music", 15.9], ["frog", 13.32], ["hum", 5.14]], null, null, [["music", 32.27], ["explosion", 13.93], ["speech", 8.38]]], "duration": [2.06, 7.02, 14.43, 0.07, 14.07, 2.38, 2.39, 1.38, 1.67, 0.6, 0.82, 0.57, 3.65, 0.5, 10.23, 0.7, 0.77, 5.52]} \ No newline at end of file diff --git a/annotations_filtered/fUKoBAi7qCg_filtered.json b/annotations_filtered/fUKoBAi7qCg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e58d5935c3bffc3cda6d7ae817493ad57200461e --- /dev/null +++ b/annotations_filtered/fUKoBAi7qCg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.59], [4.0, 5.54], [6.0, 13.05], [15.0, 15.16], [15.0, 23.03], [24.0, 24.71], [26.0, 75.22], [77.0, 88.87], [89.0, 94.17], [96.0, 101.46], [104.0, 122.88]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 29.9, 0.0, 28.43, 0.0, 0.0, 30.5, 30.02, 39.64, 32.72], "audiomae_on_audioset": [null, null, [["music", 50.77], ["speech", 25.56], ["theremin", 8.33]], null, [["music", 60.01], ["speech", 22.11], ["throbbing", 2.65]], null, null, [["music", 85.66], ["theremin", 1.3], ["didgeridoo", 1.24]], [["livestock, farm animals, working animals", 38.36], ["cattle, bovinae", 14.95], ["moo", 11.39]], [["music", 53.03], ["musical instrument", 4.94], ["guitar", 2.7]], [["music", 55.0], ["theremin", 9.88], ["synthesizer", 6.89]]], "duration": [1.59, 1.54, 7.05, 0.16, 8.03, 0.71, 49.22, 11.87, 5.17, 5.46, 18.88]} \ No newline at end of file diff --git a/annotations_filtered/fUlMUkd7IWU_filtered.json b/annotations_filtered/fUlMUkd7IWU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3880f1334457831cd475d1e1b7da8b24fcb93462 --- /dev/null +++ b/annotations_filtered/fUlMUkd7IWU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 31.26], [37.0, 65.37], [69.0, 93.12], [95.0, 104.25], [109.0, 109.56], [110.0, 113.83], [115.0, 125.22], [128.0, 131.63], [132.0, 137.91], [138.0, 138.38], [143.0, 158.16], [161.0, 162.5], [164.0, 175.09]], "keep_status": [true, true, false, true, false, true, true, true, true, false, true, false, true], "silence_prob": [30.79, 32.93, 35.35, 33.73, 0.0, 31.46, 31.46, 31.03, 31.24, 0.0, 31.56, 0.0, 32.46], "audiomae_on_audioset": [[["speech", 21.02], ["vehicle", 12.44], ["buzz", 11.61]], [["speech", 20.76], ["music", 16.13], ["cattle, bovinae", 7.46]], [["music", 45.48], ["speech", 27.17], ["hum", 2.93]], [["music", 48.7], ["speech", 12.31], ["musical instrument", 5.66]], null, [["speech", 46.35], ["music", 12.58], ["thump, thud", 5.04]], [["speech", 30.09], ["music", 20.68], ["hum", 15.13]], [["music", 18.78], ["speech", 17.95], ["smash, crash", 13.26]], [["speech", 45.37], ["music", 8.14], ["whack, thwack", 5.17]], null, [["speech", 43.81], ["music", 14.1], ["smash, crash", 8.38]], null, [["speech", 28.57], ["machine gun", 22.71], ["music", 13.41]]], "duration": [19.26, 28.37, 24.12, 9.25, 0.56, 3.83, 10.22, 3.63, 5.91, 0.38, 15.16, 1.5, 11.09]} \ No newline at end of file diff --git a/annotations_filtered/fV-wb1gZOyo_filtered.json b/annotations_filtered/fV-wb1gZOyo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..131354adf53f14861a9c613adf076c9df2f1dfe0 --- /dev/null +++ b/annotations_filtered/fV-wb1gZOyo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.33], [8.0, 9.05], [11.0, 13.54], [15.0, 16.33], [19.0, 19.01], [20.0, 24.04], [26.0, 28.66], [29.0, 34.47], [35.0, 39.09], [41.0, 42.9], [44.0, 47.43], [48.0, 51.92], [52.0, 67.26], [68.0, 70.02], [72.0, 71.68], [73.0, 73.72], [76.0, 75.69], [78.0, 80.37], [80.0, 81.72], [84.0, 84.57], [86.0, 86.17], [87.0, 88.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [98.8, 0.0, 99.44, 0.0, 0.0, 96.77, 90.95, 84.8, 95.51, 0.0, 77.2, 47.98, 33.82, 34.31, 0.0, 0.0, 0.0, 31.67, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 46.76], ["speech", 17.72], ["theremin", 7.33]], [["music", 61.31], ["hum", 7.63], ["theremin", 4.47]], [["music", 28.22], ["didgeridoo", 25.84], ["speech", 4.7]], null, null, null, [["speech", 51.95], ["mains hum", 11.62], ["radio", 7.1]], null, null, null, null], "duration": [5.33, 1.05, 2.54, 1.33, 0.01, 4.04, 2.66, 5.47, 4.09, 1.9, 3.43, 3.92, 15.26, 2.02, -0.32, 0.72, -0.31, 2.37, 1.72, 0.57, 0.17, 1.3]} \ No newline at end of file diff --git a/annotations_filtered/fVVoh_Xh0xo_filtered.json b/annotations_filtered/fVVoh_Xh0xo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c86b4ba478745f905f73c723cf57ed22e8362e8e --- /dev/null +++ b/annotations_filtered/fVVoh_Xh0xo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.23], [5.0, 5.37], [14.0, 17.61], [20.0, 20.38], [36.0, 39.26], [40.0, 42.96], [46.0, 49.98], [51.0, 53.0], [55.0, 57.23], [63.0, 64.83], [66.0, 71.07], [72.0, 74.34], [76.0, 77.67], [79.0, 79.52], [80.0, 80.89], [82.0, 83.08], [85.0, 86.05], [88.0, 89.7], [91.0, 92.28], [93.0, 93.18], [94.0, 94.78], [98.0, 100.9], [102.0, 103.32], [105.0, 106.35], [107.0, 107.81], [109.0, 110.25], [111.0, 112.36], [113.0, 115.08], [116.0, 117.04], [121.0, 123.45], [129.0, 135.46], [139.0, 143.95], [145.0, 145.93], [150.0, 150.92]], "keep_status": [false, false, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 42.24, 0.0, 33.98, 29.92, 30.37, 99.93, 42.24, 0.0, 43.48, 57.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.99, 0.0, 0.0, 0.0, 0.0, 0.0, 32.23, 0.0, 30.37, 31.59, 31.18, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 61.79], ["musical instrument", 2.91], ["throbbing", 2.56]], null, [["music", 49.7], ["speech", 26.47], ["boing", 5.09]], [["music", 77.47], ["guitar", 2.0], ["musical instrument", 1.81]], [["music", 27.49], ["sound effect", 12.46], ["musical instrument", 10.02]], null, [["music", 34.55], ["tap", 7.45], ["throbbing", 6.97]], null, [["speech", 46.56], ["music", 26.84], ["theremin", 3.06]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.33], ["techno", 5.62], ["electronic music", 5.51]], null, [["music", 72.59], ["electronic music", 4.82], ["speech", 4.02]], [["music", 38.88], ["sidetone", 34.1], ["throbbing", 6.34]], [["music", 49.09], ["sidetone", 14.65], ["speech", 7.47]], null, null], "duration": [0.23, 0.37, 3.61, 0.38, 3.26, 2.96, 3.98, 2.0, 2.23, 1.83, 5.07, 2.34, 1.67, 0.52, 0.89, 1.08, 1.05, 1.7, 1.28, 0.18, 0.78, 2.9, 1.32, 1.35, 0.81, 1.25, 1.36, 2.08, 1.04, 2.45, 6.46, 4.95, 0.93, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/fVltuJq1SQ8_filtered.json b/annotations_filtered/fVltuJq1SQ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2f1fec45bfa4e50e0a92889e93fd5c2f7b2edc7 --- /dev/null +++ b/annotations_filtered/fVltuJq1SQ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.45], [11.0, 14.57], [15.0, 16.8], [18.0, 22.86], [24.0, 28.98], [30.0, 32.24]], "keep_status": [false, true, false, false, false, true], "silence_prob": [0.0, 47.43, 0.0, 56.1, 50.61, 39.7], "audiomae_on_audioset": [null, [["music", 33.65], ["hum", 17.83], ["throbbing", 7.97]], null, null, null, [["music", 47.44], ["hum", 9.05], ["mains hum", 5.8]]], "duration": [0.45, 3.57, 1.8, 4.86, 4.98, 2.24]} \ No newline at end of file diff --git a/annotations_filtered/fVoHEZb6imE_filtered.json b/annotations_filtered/fVoHEZb6imE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6922225ae5d55b27f2781b328ae43c692b2f5d3 --- /dev/null +++ b/annotations_filtered/fVoHEZb6imE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 37.25], [38.0, 43.75], [45.0, 60.99], [63.0, 63.27], [65.0, 65.89], [71.0, 72.49]], "keep_status": [true, false, true, false, false, false], "silence_prob": [44.63, 58.81, 45.52, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 63.76], ["electronic music", 3.52], ["thunk", 2.4]], null, [["music", 38.07], ["hum", 20.5], ["rumble", 9.94]], null, null, null], "duration": [5.25, 5.75, 15.99, 0.27, 0.89, 1.49]} \ No newline at end of file diff --git a/annotations_filtered/fWBAKMYKPSc_filtered.json b/annotations_filtered/fWBAKMYKPSc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cada78043ae2a5664936ae3f2877ec0d60a1b0c --- /dev/null +++ b/annotations_filtered/fWBAKMYKPSc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.18], [4.0, 7.65], [8.0, 11.97], [13.0, 14.12], [15.0, 16.55], [17.0, 17.51], [18.0, 18.55], [21.0, 21.54], [30.0, 30.59], [40.0, 40.19], [55.0, 54.92], [60.0, 60.96], [64.0, 64.34], [80.0, 80.7], [94.0, 93.83], [99.0, 99.37], [102.0, 101.95], [104.0, 103.99], [119.0, 119.38], [120.0, 121.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.0, 94.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.18, 3.65, 3.97, 1.12, 1.55, 0.51, 0.55, 0.54, 0.59, 0.19, -0.08, 0.96, 0.34, 0.7, -0.17, 0.37, -0.05, -0.01, 0.38, 1.54]} \ No newline at end of file diff --git a/annotations_filtered/fWP17t95S2k_filtered.json b/annotations_filtered/fWP17t95S2k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fdfe350865a6ec02b52e9195c9dc2dbc6691d47e --- /dev/null +++ b/annotations_filtered/fWP17t95S2k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 28.8], [30.0, 30.64], [41.0, 42.13], [45.0, 52.91], [54.0, 65.21], [74.0, 90.71], [94.0, 113.27], [116.0, 118.94]], "keep_status": [false, false, false, false, true, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 41.22, 34.64, 32.59, 32.23, 35.05], "audiomae_on_audioset": [null, null, null, [["speech", 47.54], ["whale vocalization", 19.82], ["hum", 8.56]], [["eruption", 27.54], ["speech", 26.51], ["explosion", 10.6]], [["speech", 48.12], ["hum", 8.35], ["explosion", 5.26]], [["speech", 29.88], ["hum", 17.64], ["sidetone", 15.29]], [["throbbing", 46.36], ["hum", 37.23], ["music", 4.84]]], "duration": [0.8, 0.64, 1.13, 7.91, 11.21, 16.71, 19.27, 2.94]} \ No newline at end of file diff --git a/annotations_filtered/fWPRhRM1V7I_filtered.json b/annotations_filtered/fWPRhRM1V7I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4be6d7b14451e6b5cb77d497db5f3f4648c08408 --- /dev/null +++ b/annotations_filtered/fWPRhRM1V7I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.32], [20.0, 22.03], [23.0, 23.11], [27.0, 27.48], [28.0, 31.28], [32.0, 32.17], [37.0, 37.94], [49.0, 49.05], [55.0, 58.13], [60.0, 63.51], [64.0, 67.31], [68.0, 76.96], [83.0, 84.0], [86.0, 94.36], [97.0, 98.14], [104.0, 104.13], [108.0, 108.33], [110.0, 110.89], [112.0, 113.22], [115.0, 116.61], [118.0, 122.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.73, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0, 100.0, 98.73, 100.0, 96.66, 0.0, 96.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.32, 2.03, 0.11, 0.48, 3.28, 0.17, 0.94, 0.05, 3.13, 3.51, 3.31, 8.96, 1.0, 8.36, 1.14, 0.13, 0.33, 0.89, 1.22, 1.61, 4.2]} \ No newline at end of file diff --git a/annotations_filtered/fWYs-bFK9_s_filtered.json b/annotations_filtered/fWYs-bFK9_s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07b2516216cd201a24ace86c057e398a2ca66433 --- /dev/null +++ b/annotations_filtered/fWYs-bFK9_s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.96], [18.0, 30.13], [34.0, 34.84], [42.0, 60.99], [70.0, 70.71], [99.0, 121.07], [122.0, 124.41], [141.0, 141.4], [141.0, 141.47], [144.0, 147.88], [149.0, 150.5]], "keep_status": [false, true, false, false, false, true, true, false, false, true, false], "silence_prob": [0.0, 31.93, 0.0, 33.0, 0.0, 31.93, 33.19, 0.0, 0.0, 32.53, 0.0], "audiomae_on_audioset": [null, [["speech", 36.99], ["vehicle", 15.41], ["boat, water vehicle", 6.17]], null, [["speech", 56.19], ["buzz", 11.3], ["vehicle", 8.0]], null, [["speech", 52.64], ["vehicle", 10.7], ["boat, water vehicle", 4.89]], [["speech", 47.27], ["vehicle", 5.97], ["music", 4.49]], null, null, [["speech", 32.66], ["explosion", 13.71], ["buzz", 6.16]], null], "duration": [0.96, 12.13, 0.84, 18.99, 0.71, 22.07, 2.41, 0.4, 0.47, 3.88, 1.5]} \ No newline at end of file diff --git a/annotations_filtered/fWa-h0maM1w_filtered.json b/annotations_filtered/fWa-h0maM1w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a30f406f4a85f792031c3d791c5ef14af85b8c2c --- /dev/null +++ b/annotations_filtered/fWa-h0maM1w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.4], [20.0, 20.71], [23.0, 23.55], [25.0, 25.07], [26.0, 26.86], [44.0, 43.85], [46.0, 46.35], [52.0, 52.2], [53.0, 53.65], [57.0, 58.41], [68.0, 78.58], [89.0, 89.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.55, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 60.01], ["hum", 10.35], ["didgeridoo", 5.0]], null], "duration": [0.4, 0.71, 0.55, 0.07, 0.86, -0.15, 0.35, 0.2, 0.65, 1.41, 10.58, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/fWcPwWR4C_w_filtered.json b/annotations_filtered/fWcPwWR4C_w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..872f0fa6c5a07391a7ff185408abd36ffa39f0d5 --- /dev/null +++ b/annotations_filtered/fWcPwWR4C_w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.04], [14.0, 37.3], [40.0, 56.79], [58.0, 68.91], [75.0, 79.51], [82.0, 82.48], [82.0, 82.51], [84.0, 106.84], [109.0, 127.36]], "keep_status": [false, true, false, true, false, false, false, false, false], "silence_prob": [38.49, 34.75, 35.22, 34.46, 33.28, 0.0, 0.0, 33.29, 35.91], "audiomae_on_audioset": [[["hum", 57.1], ["throbbing", 18.44], ["mains hum", 12.81]], [["music", 21.23], ["hum", 21.09], ["mains hum", 9.04]], [["sidetone", 38.0], ["speech", 27.53], ["hum", 9.77]], [["sidetone", 51.38], ["music", 10.16], ["whack, thwack", 5.45]], [["music", 35.34], ["speech", 34.84], ["hum", 5.16]], null, null, [["music", 79.14], ["synthesizer", 5.76], ["electronic music", 3.26]], [["music", 66.25], ["hum", 7.5], ["ambient music", 4.53]]], "duration": [3.04, 23.3, 16.79, 10.91, 4.51, 0.48, 0.51, 22.84, 18.36]} \ No newline at end of file diff --git a/annotations_filtered/fWgpZ_2oYfE_filtered.json b/annotations_filtered/fWgpZ_2oYfE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7bc3eb39c85b91bd61ad71051b50b856e64ec146 --- /dev/null +++ b/annotations_filtered/fWgpZ_2oYfE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 16.63], [20.0, 21.29], [24.0, 37.05], [40.0, 66.14]], "keep_status": [false, false, false, true], "silence_prob": [32.41, 0.0, 31.48, 29.79], "audiomae_on_audioset": [[["speech", 66.16], ["foghorn", 3.84], ["outside, urban or manmade", 3.12]], null, [["speech", 57.54], ["electric shaver, electric razor", 11.74], ["buzz", 10.17]], [["speech", 45.91], ["music", 7.44], ["hubbub, speech noise, speech babble", 7.16]]], "duration": [2.63, 1.29, 13.05, 26.14]} \ No newline at end of file diff --git a/annotations_filtered/fWqnZTTRkm4_filtered.json b/annotations_filtered/fWqnZTTRkm4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e03291bf0629148f59a7d00f30488c61826c606c --- /dev/null +++ b/annotations_filtered/fWqnZTTRkm4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 30.5], [31.0, 49.17], [52.0, 81.72], [83.0, 82.92], [84.0, 85.63], [94.0, 102.34], [107.0, 108.99]], "keep_status": [false, false, true, false, false, true, false], "silence_prob": [0.0, 31.24, 32.71, 0.0, 0.0, 31.49, 0.0], "audiomae_on_audioset": [null, [["whack, thwack", 62.91], ["mosquito", 8.33], ["fly, housefly", 7.22]], [["boing", 35.65], ["whack, thwack", 15.49], ["speech", 14.84]], null, null, [["music", 33.0], ["mosquito", 9.98], ["buzz", 5.63]], null], "duration": [0.5, 18.17, 29.72, -0.08, 1.63, 8.34, 1.99]} \ No newline at end of file diff --git a/annotations_filtered/fWx9V0xoYsI_filtered.json b/annotations_filtered/fWx9V0xoYsI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00bd38e26b05204a24e9b6032b90df8b9f2dbb6d --- /dev/null +++ b/annotations_filtered/fWx9V0xoYsI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 36.75], [38.0, 38.58], [39.0, 40.51], [42.0, 41.86], [42.0, 43.36], [46.0, 46.09], [47.0, 47.55], [53.0, 54.46], [57.0, 58.62], [59.0, 60.0], [61.0, 63.39], [66.0, 67.31], [68.0, 68.77], [69.0, 69.74], [71.0, 72.22], [78.0, 79.05], [81.0, 81.55], [83.0, 83.13], [85.0, 88.59], [90.0, 91.62], [93.0, 94.05], [97.0, 98.17], [101.0, 101.34], [104.0, 104.03], [107.0, 108.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.75, 0.58, 1.51, -0.14, 1.36, 0.09, 0.55, 1.46, 1.62, 1.0, 2.39, 1.31, 0.77, 0.74, 1.22, 1.05, 0.55, 0.13, 3.59, 1.62, 1.05, 1.17, 0.34, 0.03, 1.41]} \ No newline at end of file diff --git a/annotations_filtered/fWxKQF17YHk_filtered.json b/annotations_filtered/fWxKQF17YHk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4062adaee242ffd77b8440c62dcb4ac90291ca4 --- /dev/null +++ b/annotations_filtered/fWxKQF17YHk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.12], [14.0, 16.41], [18.0, 19.68], [23.0, 24.63], [25.0, 26.84], [28.0, 29.89], [31.0, 33.52], [35.0, 38.25], [40.0, 44.39], [45.0, 47.78], [49.0, 53.94], [56.0, 60.59], [63.0, 65.42], [66.0, 67.66], [68.0, 71.59], [73.0, 81.5], [82.0, 84.6], [85.0, 87.59], [89.0, 89.36], [90.0, 92.97], [97.0, 98.37], [99.0, 103.86], [108.0, 109.56], [112.0, 113.51], [117.0, 118.91], [120.0, 122.94], [125.0, 127.6], [128.0, 128.6], [130.0, 139.31], [140.0, 145.18], [147.0, 153.67], [156.0, 155.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.97, 99.98, 0.0, 0.0, 0.0, 0.0, 97.43, 99.88, 97.73, 99.95, 99.99, 99.8, 99.98, 0.0, 95.51, 99.99, 97.54, 95.09, 0.0, 97.11, 0.0, 42.15, 0.0, 0.0, 0.0, 94.52, 90.6, 0.0, 96.66, 97.83, 97.33, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 38.18], ["hammer", 9.12], ["whack, thwack", 8.17]], null, null, null, null, null, null, null, null, null, null], "duration": [2.12, 2.41, 1.68, 1.63, 1.84, 1.89, 2.52, 3.25, 4.39, 2.78, 4.94, 4.59, 2.42, 1.66, 3.59, 8.5, 2.6, 2.59, 0.36, 2.97, 1.37, 4.86, 1.56, 1.51, 1.91, 2.94, 2.6, 0.6, 9.31, 5.18, 6.67, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/fX4XAbCTdYs_filtered.json b/annotations_filtered/fX4XAbCTdYs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7cd17b90e9164614de49e455772f8aa37d730536 --- /dev/null +++ b/annotations_filtered/fX4XAbCTdYs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[62.0, 62.7], [64.0, 64.45], [66.0, 68.42], [74.0, 77.43], [80.0, 80.45], [81.0, 83.1], [89.0, 89.51], [105.0, 110.73], [112.0, 112.92]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 92.8, 43.53, 0.0, 62.99, 0.0, 96.54, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 57.17], ["thunk", 16.22], ["boing", 5.48]], null, null, null, null, null], "duration": [0.7, 0.45, 2.42, 3.43, 0.45, 2.1, 0.51, 5.73, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/fXBsUOysL3c_filtered.json b/annotations_filtered/fXBsUOysL3c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7163721d9bf7ff00e30d41a84a0c895888700191 --- /dev/null +++ b/annotations_filtered/fXBsUOysL3c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.92], [33.0, 36.32], [41.0, 40.98], [43.0, 42.55], [47.0, 46.63], [99.0, 99.15]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [-0.08, 3.32, -0.02, -0.45, -0.37, 0.15]} \ No newline at end of file diff --git a/annotations_filtered/fXXmeP9TvBg_filtered.json b/annotations_filtered/fXXmeP9TvBg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29259f6d61d4a5da9e248da5da6ba77fa6702294 --- /dev/null +++ b/annotations_filtered/fXXmeP9TvBg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 29.0], [33.0, 63.14], [63.0, 63.44], [64.0, 65.35], [72.0, 80.43], [82.0, 82.04], [82.0, 91.02], [93.0, 94.42], [98.0, 98.59], [101.0, 102.41], [106.0, 113.04], [118.0, 125.12], [135.0, 136.98], [137.0, 137.93], [141.0, 149.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.63, 0.0, 0.0, 0.0, 30.82, 0.0, 30.96, 0.0, 0.0, 0.0, 30.73, 31.13, 0.0, 0.0, 31.0], "audiomae_on_audioset": [[["music", 82.42], ["sidetone", 2.81], ["sampler", 2.71]], null, null, null, [["music", 92.72], ["musical instrument", 1.17], ["swing music", 0.5]], null, [["music", 70.16], ["funk", 6.33], ["disco", 2.62]], null, null, null, [["music", 87.83], ["musical instrument", 1.01], ["brass instrument", 0.47]], [["music", 75.39], ["swing music", 5.71], ["funk", 1.62]], null, null, [["music", 88.73], ["musical instrument", 1.82], ["singing", 0.8]]], "duration": [12.0, 30.14, 0.44, 1.35, 8.43, 0.04, 9.02, 1.42, 0.59, 1.41, 7.04, 7.12, 1.98, 0.93, 8.12]} \ No newline at end of file diff --git a/annotations_filtered/fXcQVdBqtaY_filtered.json b/annotations_filtered/fXcQVdBqtaY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7717ef70b4748d18deb9beb83f52f623919e5f23 --- /dev/null +++ b/annotations_filtered/fXcQVdBqtaY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.73], [3.0, 3.11], [7.0, 7.11], [10.0, 10.35], [12.0, 12.04], [13.0, 14.1], [15.0, 15.25], [17.0, 17.14]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.73, 0.11, 0.11, 0.35, 0.04, 1.1, 0.25, 0.14]} \ No newline at end of file diff --git a/annotations_filtered/fY-Aprk4mtY_filtered.json b/annotations_filtered/fY-Aprk4mtY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da0d92642d42007a3e31693bd2a699b176eb6997 --- /dev/null +++ b/annotations_filtered/fY-Aprk4mtY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 30.03], [39.0, 44.1], [61.0, 88.38], [96.0, 101.04], [104.0, 104.18], [107.0, 107.97], [110.0, 115.16]], "keep_status": [false, false, true, true, false, false, true], "silence_prob": [0.0, 33.01, 32.28, 40.95, 0.0, 0.0, 48.14], "audiomae_on_audioset": [null, [["music", 61.12], ["didgeridoo", 7.68], ["speech", 6.54]], [["music", 41.39], ["hum", 10.67], ["throbbing", 8.88]], [["crushing", 21.93], ["whack, thwack", 13.13], ["breaking", 13.03]], null, null, [["music", 15.19], ["throbbing", 12.53], ["chirp tone", 8.57]]], "duration": [1.03, 5.1, 27.38, 5.04, 0.18, 0.97, 5.16]} \ No newline at end of file diff --git a/annotations_filtered/fYNZsz9o3Sg_filtered.json b/annotations_filtered/fYNZsz9o3Sg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8db0c38e4d02a5e93dde6fec96466fca0bbf88c --- /dev/null +++ b/annotations_filtered/fYNZsz9o3Sg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.19], [2.0, 1.92], [14.0, 14.62], [26.0, 26.91], [40.0, 41.12], [42.0, 43.01], [44.0, 48.66], [50.0, 50.55], [66.0, 66.95], [67.0, 67.46], [68.0, 70.14], [71.0, 72.81], [76.0, 77.23], [91.0, 91.84], [99.0, 99.87], [102.0, 103.55], [104.0, 104.84], [105.0, 106.88], [108.0, 108.5], [110.0, 110.15], [112.0, 122.62], [123.0, 123.82], [125.0, 125.68], [137.0, 136.92], [138.0, 138.59], [139.0, 139.65], [141.0, 141.56], [145.0, 145.45], [149.0, 149.01], [153.0, 153.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.46, 0.0, 0.0, 0.0, 59.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.19, -0.08, 0.62, 0.91, 1.12, 1.01, 4.66, 0.55, 0.95, 0.46, 2.14, 1.81, 1.23, 0.84, 0.87, 1.55, 0.84, 1.88, 0.5, 0.15, 10.62, 0.82, 0.68, -0.08, 0.59, 0.65, 0.56, 0.45, 0.01, 0.06]} \ No newline at end of file diff --git a/annotations_filtered/fYVAGoTb8w4_filtered.json b/annotations_filtered/fYVAGoTb8w4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fdb3cb88578ec0736ada5743ffda2b1fff51db49 --- /dev/null +++ b/annotations_filtered/fYVAGoTb8w4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.34], [19.0, 26.54], [30.0, 31.48], [32.0, 39.51], [41.0, 41.35], [44.0, 44.15], [51.0, 51.39], [56.0, 57.11], [58.0, 59.05], [60.0, 63.0], [64.0, 64.3], [65.0, 66.06], [67.0, 67.46], [69.0, 69.26], [70.0, 77.89], [78.0, 79.91], [81.0, 81.5], [83.0, 121.14], [130.0, 132.16], [133.0, 137.17], [138.0, 144.24], [145.0, 175.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 71.29, 0.0, 59.42, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 0.0, 0.0, 0.0, 49.18, 0.0, 0.0, 0.0, 99.98, 94.95, 82.61, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.24], ["music", 28.59], ["fly, housefly", 3.58]], null, null, null, null, null, null, null], "duration": [1.34, 7.54, 1.48, 7.51, 0.35, 0.15, 0.39, 1.11, 1.05, 3.0, 0.3, 1.06, 0.46, 0.26, 7.89, 1.91, 0.5, 38.14, 2.16, 4.17, 6.24, 30.58]} \ No newline at end of file diff --git a/annotations_filtered/fYb0fQOH11g_filtered.json b/annotations_filtered/fYb0fQOH11g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ecfddf4da4f3c92481ddadb8ab62e706726a31fb --- /dev/null +++ b/annotations_filtered/fYb0fQOH11g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 19.38], [19.0, 19.41], [20.0, 22.15], [26.0, 26.52], [30.0, 30.13], [31.0, 32.85], [34.0, 37.03], [40.0, 40.07], [43.0, 47.38], [49.0, 55.38], [58.0, 59.76], [62.0, 151.78], [154.0, 167.83]], "keep_status": [true, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [31.35, 0.0, 42.39, 0.0, 0.0, 0.0, 33.85, 0.0, 41.42, 32.74, 0.0, 0.0, 32.95], "audiomae_on_audioset": [[["speech", 34.79], ["vehicle", 10.8], ["helicopter", 8.92]], null, [["music", 56.86], ["throbbing", 13.94], ["hum", 5.51]], null, null, null, [["speech", 33.44], ["music", 28.59], ["hum", 6.03]], null, [["music", 65.52], ["throbbing", 7.85], ["hum", 7.82]], [["mains hum", 48.85], ["hum", 41.88], ["music", 2.78]], null, null, [["music", 68.99], ["electronic music", 7.01], ["sonar", 5.88]]], "duration": [4.38, 0.41, 2.15, 0.52, 0.13, 1.85, 3.03, 0.07, 4.38, 6.38, 1.76, 89.78, 13.83]} \ No newline at end of file diff --git a/annotations_filtered/fYbbxzLGpbI_filtered.json b/annotations_filtered/fYbbxzLGpbI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e6991e976c0b29344f5a8efdb9485a139ff5064 --- /dev/null +++ b/annotations_filtered/fYbbxzLGpbI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.81], [15.0, 21.91], [24.0, 24.56], [27.0, 47.44], [51.0, 81.38], [83.0, 94.66], [96.0, 103.65], [105.0, 133.46], [134.0, 138.5], [139.0, 149.64]], "keep_status": [true, true, false, true, false, false, false, false, true, true], "silence_prob": [33.23, 28.61, 0.0, 28.3, 0.0, 28.31, 28.36, 28.43, 28.54, 28.32], "audiomae_on_audioset": [[["hum", 28.14], ["music", 14.98], ["throbbing", 11.9]], [["music", 45.37], ["throbbing", 12.14], ["speech", 7.62]], null, [["music", 22.99], ["explosion", 9.16], ["speech", 8.41]], null, [["speech", 51.13], ["music", 12.43], ["vehicle", 6.66]], [["speech", 48.45], ["music", 25.73], ["vehicle", 4.84]], [["music", 35.11], ["speech", 31.38], ["burst, pop", 3.77]], [["music", 33.35], ["hum", 14.33], ["throbbing", 13.81]], [["speech", 45.82], ["buzz", 8.25], ["music", 7.77]]], "duration": [4.81, 6.91, 0.56, 20.44, 30.38, 11.66, 7.65, 28.46, 4.5, 10.64]} \ No newline at end of file diff --git a/annotations_filtered/fYvvenxELZA_filtered.json b/annotations_filtered/fYvvenxELZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56589511c6a5dac382d2c513e63b861243a8505d --- /dev/null +++ b/annotations_filtered/fYvvenxELZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.98], [7.0, 8.18], [8.0, 8.9], [9.0, 21.74], [23.0, 23.6], [25.0, 37.08], [38.0, 39.72], [40.0, 41.72], [44.0, 45.74], [48.0, 51.85], [53.0, 65.43], [70.0, 72.37], [75.0, 74.87], [78.0, 86.02], [88.0, 102.95], [103.0, 104.19]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, true, false, true, false, false], "silence_prob": [65.32, 0.0, 0.0, 38.55, 0.0, 49.73, 0.0, 0.0, 0.0, 40.14, 47.78, 48.69, 0.0, 45.59, 33.54, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 69.98], ["mains hum", 4.68], ["hum", 4.22]], null, [["music", 64.85], ["whale vocalization", 5.19], ["hum", 4.89]], null, null, null, [["mains hum", 16.69], ["fly, housefly", 15.51], ["insect", 10.09]], [["music", 42.96], ["buzz", 10.62], ["didgeridoo", 6.0]], [["music", 43.09], ["synthesizer", 8.7], ["theremin", 7.19]], null, [["didgeridoo", 31.97], ["music", 29.03], ["speech", 7.2]], [["hum", 29.9], ["music", 27.37], ["mains hum", 16.54]], null], "duration": [3.98, 1.18, 0.9, 12.74, 0.6, 12.08, 1.72, 1.72, 1.74, 3.85, 12.43, 2.37, -0.13, 8.02, 14.95, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/fZ7X5JDKmSI_filtered.json b/annotations_filtered/fZ7X5JDKmSI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83dff8637b945ace57a4496a693e32b571e11d3e --- /dev/null +++ b/annotations_filtered/fZ7X5JDKmSI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.95], [6.0, 6.61], [10.0, 10.12], [23.0, 24.24], [29.0, 29.1], [33.0, 34.7], [36.0, 37.39], [39.0, 39.24], [41.0, 41.01], [42.0, 42.79], [73.0, 75.15], [78.0, 78.9], [80.0, 81.01], [84.0, 84.7], [87.0, 87.62], [96.0, 100.08], [101.0, 101.65], [102.0, 104.46], [108.0, 111.81], [129.0, 134.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.87, 0.0, 0.0, 0.0, 0.0, 31.65, 0.0, 35.69, 33.08, 34.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 50.58], ["music", 5.06], ["vehicle", 3.07]], null, null, null, null, [["didgeridoo", 27.69], ["music", 25.38], ["musical instrument", 5.02]], null, [["theremin", 86.27], ["music", 7.6], ["musical instrument", 0.83]], [["music", 66.58], ["didgeridoo", 8.08], ["musical instrument", 6.35]], [["theremin", 38.87], ["music", 24.84], ["musical instrument", 4.31]]], "duration": [0.95, 0.61, 0.12, 1.24, 0.1, 1.7, 1.39, 0.24, 0.01, 0.79, 2.15, 0.9, 1.01, 0.7, 0.62, 4.08, 0.65, 2.46, 3.81, 5.59]} \ No newline at end of file diff --git a/annotations_filtered/fZB65wj9nz8_filtered.json b/annotations_filtered/fZB65wj9nz8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0bd600bbd3c375a64b85c633f52954c30f55d9b --- /dev/null +++ b/annotations_filtered/fZB65wj9nz8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.28], [42.0, 42.43], [65.0, 65.3], [74.0, 74.38], [85.0, 85.29], [91.0, 91.15], [92.0, 92.87], [104.0, 104.85], [106.0, 106.64], [109.0, 123.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.79], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.28, 0.43, 0.3, 0.38, 0.29, 0.15, 0.87, 0.85, 0.64, 14.16]} \ No newline at end of file diff --git a/annotations_filtered/fZIWDis34Xs_filtered.json b/annotations_filtered/fZIWDis34Xs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f578b0b62f44fe36c25e914391aa8c5093dbd13 --- /dev/null +++ b/annotations_filtered/fZIWDis34Xs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.93], [35.0, 41.98], [48.0, 48.64], [58.0, 58.67], [97.0, 98.47]], "keep_status": [true, false, false, false, false], "silence_prob": [35.12, 31.54, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 54.47], ["electric shaver, electric razor", 6.45], ["radio", 6.23]], [["speech", 95.12], ["telephone", 1.51], ["telephone bell ringing", 0.68]], null, null, null], "duration": [3.93, 6.98, 0.64, 0.67, 1.47]} \ No newline at end of file diff --git a/annotations_filtered/fZNHk9DKvtM_filtered.json b/annotations_filtered/fZNHk9DKvtM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce0f559336b1fa6626679eb37c28a20c54130aad --- /dev/null +++ b/annotations_filtered/fZNHk9DKvtM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.54], [5.0, 5.9], [7.0, 7.55], [9.0, 10.02], [11.0, 12.21], [13.0, 16.71], [21.0, 21.74], [23.0, 24.43], [26.0, 26.15], [27.0, 26.99], [29.0, 29.3], [30.0, 40.02], [43.0, 43.09], [47.0, 48.73], [51.0, 52.29], [54.0, 55.71], [60.0, 77.5], [80.0, 85.9], [89.0, 90.32], [93.0, 96.31], [97.0, 97.33], [98.0, 104.14], [115.0, 115.33], [121.0, 123.38], [130.0, 130.17], [135.0, 135.01], [135.0, 135.04], [135.0, 135.23], [135.0, 135.26], [135.0, 141.79], [148.0, 151.23], [154.0, 154.38], [156.0, 155.82], [159.0, 160.17], [160.0, 161.86], [163.0, 163.17], [166.0, 179.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.84, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0, 0.0, 0.0, 0.0, 59.15, 96.77, 0.0, 83.88, 0.0, 31.13, 0.0, 30.94, 0.0, 0.0, 0.0, 0.0, 0.0, 30.16, 33.79, 0.0, 0.0, 0.0, 0.0, 0.0, 32.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 13.68], ["livestock, farm animals, working animals", 11.78], ["cattle, bovinae", 10.94]], null, [["speech", 31.35], ["skateboard", 6.9], ["fart", 6.11]], null, null, null, null, null, [["throbbing", 24.08], ["speech", 15.71], ["sidetone", 12.81]], [["speech", 22.86], ["sidetone", 22.17], ["music", 21.68]], null, null, null, null, null, [["music", 42.91], ["hum", 25.1], ["throbbing", 23.49]]], "duration": [0.54, 0.9, 0.55, 1.02, 1.21, 3.71, 0.74, 1.43, 0.15, -0.01, 0.3, 10.02, 0.09, 1.73, 1.29, 1.71, 17.5, 5.9, 1.32, 3.31, 0.33, 6.14, 0.33, 2.38, 0.17, 0.01, 0.04, 0.23, 0.26, 6.79, 3.23, 0.38, -0.18, 1.17, 1.86, 0.17, 13.46]} \ No newline at end of file diff --git a/annotations_filtered/fZNPbMu2Ge0_filtered.json b/annotations_filtered/fZNPbMu2Ge0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42af816135072b737f5cd6281006e3f75e7c72a4 --- /dev/null +++ b/annotations_filtered/fZNPbMu2Ge0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 33.2], [34.0, 35.36], [36.0, 37.86], [38.0, 44.27], [46.0, 47.16], [48.0, 51.51], [54.0, 54.14], [56.0, 56.73], [61.0, 62.43], [64.0, 64.44], [66.0, 66.16], [69.0, 68.82], [71.0, 71.41], [73.0, 75.05], [76.0, 76.2], [83.0, 85.35], [86.0, 87.3], [88.0, 89.31], [91.0, 92.67], [93.0, 95.18], [96.0, 101.04], [102.0, 104.3], [105.0, 106.02], [107.0, 116.16], [118.0, 119.72], [121.0, 123.23], [126.0, 130.92], [133.0, 142.28], [146.0, 146.82], [148.0, 151.29], [152.0, 154.95], [156.0, 157.74], [159.0, 159.27], [160.0, 161.86], [171.0, 171.66], [173.0, 172.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 99.99, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 99.62, 99.95, 0.0, 99.99, 0.0, 99.99, 99.95, 95.78, 0.0, 99.96, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.2, 1.36, 1.86, 6.27, 1.16, 3.51, 0.14, 0.73, 1.43, 0.44, 0.16, -0.18, 0.41, 2.05, 0.2, 2.35, 1.3, 1.31, 1.67, 2.18, 5.04, 2.3, 1.02, 9.16, 1.72, 2.23, 4.92, 9.28, 0.82, 3.29, 2.95, 1.74, 0.27, 1.86, 0.66, -0.21]} \ No newline at end of file diff --git a/annotations_filtered/fZXtCHoRb50_filtered.json b/annotations_filtered/fZXtCHoRb50_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f231042f76714611f0c92a2cea834333dee97cd --- /dev/null +++ b/annotations_filtered/fZXtCHoRb50_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.62], [11.0, 11.77], [16.0, 18.01], [23.0, 23.57], [26.0, 26.99], [28.0, 28.29], [29.0, 34.18], [35.0, 36.91], [41.0, 41.28], [42.0, 42.5], [44.0, 44.71], [45.0, 46.63], [49.0, 50.21], [55.0, 55.43], [72.0, 72.64], [80.0, 80.5], [81.0, 81.85], [82.0, 83.46], [85.0, 85.56], [86.0, 86.58], [90.0, 89.94], [94.0, 95.08], [99.0, 99.55], [129.0, 129.68], [133.0, 135.19], [138.0, 138.43]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 40.62, 0.0, 0.0, 0.0, 47.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.61, 0.0], "audiomae_on_audioset": [null, null, [["music", 21.52], ["speech", 14.37], ["vehicle", 3.84]], null, null, null, [["fly, housefly", 20.05], ["insect", 16.93], ["speech", 10.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 23.86], ["music", 5.34], ["hum", 5.03]], null], "duration": [1.62, 0.77, 2.01, 0.57, 0.99, 0.29, 5.18, 1.91, 0.28, 0.5, 0.71, 1.63, 1.21, 0.43, 0.64, 0.5, 0.85, 1.46, 0.56, 0.58, -0.06, 1.08, 0.55, 0.68, 2.19, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/fZflzybv5T0_filtered.json b/annotations_filtered/fZflzybv5T0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd1ed48c3948c5cf9a3d35bc19b88a7a871260cc --- /dev/null +++ b/annotations_filtered/fZflzybv5T0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.35], [12.0, 13.17], [13.0, 13.64], [19.0, 20.46], [21.0, 22.57], [28.0, 29.62], [32.0, 32.75], [38.0, 41.77], [47.0, 48.0]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.53, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.35, 1.17, 0.64, 1.46, 1.57, 1.62, 0.75, 3.77, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/fZrN9LabLQQ_filtered.json b/annotations_filtered/fZrN9LabLQQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b534775b38f3793ac0a274829310e855a95fb9d2 --- /dev/null +++ b/annotations_filtered/fZrN9LabLQQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 17.41], [21.0, 23.63], [28.0, 32.58], [36.0, 39.33], [43.0, 58.16], [62.0, 102.68], [107.0, 110.13], [112.0, 114.34], [116.0, 146.97], [149.0, 149.42], [161.0, 162.87], [164.0, 165.3], [167.0, 167.61]], "keep_status": [true, true, false, true, true, false, true, true, false, false, false, false, false], "silence_prob": [29.14, 29.13, 34.72, 30.83, 29.05, 0.0, 31.62, 32.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 37.82], ["hum", 7.05], ["mains hum", 6.28]], [["mains hum", 30.76], ["hum", 24.9], ["throbbing", 11.58]], [["music", 40.23], ["speech", 28.37], ["hum", 5.28]], [["music", 17.71], ["mains hum", 16.32], ["buzz", 10.05]], [["music", 55.85], ["whip", 4.84], ["whoosh, swoosh, swish", 3.73]], null, [["speech", 41.1], ["vehicle", 7.75], ["hum", 7.4]], [["speech", 54.3], ["vehicle", 9.85], ["music", 2.98]], null, null, null, null, null], "duration": [8.41, 2.63, 4.58, 3.33, 15.16, 40.68, 3.13, 2.34, 30.97, 0.42, 1.87, 1.3, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/fZt8dti-r14_filtered.json b/annotations_filtered/fZt8dti-r14_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6afe20323455abc422d7aff63bb86fb0a2f10210 --- /dev/null +++ b/annotations_filtered/fZt8dti-r14_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 47.24], [60.0, 60.86], [61.0, 61.42], [67.0, 127.38]], "keep_status": [false, false, false, false], "silence_prob": [30.92, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 76.38], ["carnatic music", 3.58], ["swing music", 2.53]], null, null, null], "duration": [11.24, 0.86, 0.42, 60.38]} \ No newline at end of file diff --git a/annotations_filtered/fZzxZa0k7II_filtered.json b/annotations_filtered/fZzxZa0k7II_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c01bb93e50efe2b9f52a820655fd06509d93e8e0 --- /dev/null +++ b/annotations_filtered/fZzxZa0k7II_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.84], [9.0, 17.81], [19.0, 82.86], [86.0, 105.19]], "keep_status": [false, true, false, true], "silence_prob": [0.0, 43.28, 0.0, 30.92], "audiomae_on_audioset": [null, [["hum", 29.84], ["throbbing", 22.23], ["music", 10.44]], null, [["music", 43.92], ["buzz", 13.58], ["hum", 4.85]]], "duration": [1.84, 8.81, 63.86, 19.19]} \ No newline at end of file diff --git a/annotations_filtered/f_5nHV8FJyI_filtered.json b/annotations_filtered/f_5nHV8FJyI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..05baffb786e54c99efa979068b905dd7d5e97af9 --- /dev/null +++ b/annotations_filtered/f_5nHV8FJyI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.29], [6.0, 6.44], [7.0, 7.5], [16.0, 16.16], [41.0, 42.16], [42.0, 42.48], [43.0, 54.51], [56.0, 56.66], [63.0, 64.4], [65.0, 65.55], [66.0, 66.78], [68.0, 68.32], [69.0, 70.29], [71.0, 76.69], [77.0, 77.62], [79.0, 78.83], [79.0, 79.89]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false], "silence_prob": [34.19, 0.0, 0.0, 0.0, 0.0, 0.0, 34.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.28, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["noise", 65.42], ["music", 3.98], ["beatboxing", 3.67]], null, null, null, null, null, [["wail, moan", 35.03], ["speech", 10.28], ["groan", 6.73]], null, null, null, null, null, null, [["beatboxing", 44.97], ["speech", 13.41], ["fart", 9.04]], null, null, null], "duration": [3.29, 0.44, 0.5, 0.16, 1.16, 0.48, 11.51, 0.66, 1.4, 0.55, 0.78, 0.32, 1.29, 5.69, 0.62, -0.17, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/f_G1oYcHFsk_filtered.json b/annotations_filtered/f_G1oYcHFsk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b5241c194949eaeea509311791eb50a64b7f648 --- /dev/null +++ b/annotations_filtered/f_G1oYcHFsk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 29.98], [32.0, 32.31], [37.0, 36.66], [51.0, 50.87], [55.0, 62.28], [63.0, 70.51], [77.0, 88.37], [92.0, 92.06], [94.0, 109.98], [110.0, 112.16], [113.0, 119.3], [120.0, 120.16], [120.0, 120.28], [121.0, 131.77]], "keep_status": [true, false, false, false, false, true, true, false, true, true, true, false, false, false], "silence_prob": [32.87, 0.0, 0.0, 0.0, 32.77, 31.86, 33.32, 0.0, 34.6, 40.5, 35.62, 0.0, 0.0, 31.59], "audiomae_on_audioset": [[["speech", 21.33], ["cattle, bovinae", 19.99], ["moo", 17.35]], null, null, null, [["speech", 44.13], ["cattle, bovinae", 15.2], ["moo", 10.88]], [["speech", 25.85], ["cattle, bovinae", 23.43], ["moo", 17.23]], [["fart", 30.94], ["speech", 12.67], ["livestock, farm animals, working animals", 10.4]], null, [["fly, housefly", 26.09], ["livestock, farm animals, working animals", 12.67], ["cattle, bovinae", 11.81]], [["speech", 47.86], ["busy signal", 9.38], ["dog", 3.51]], [["speech", 36.3], ["sidetone", 14.02], ["synthesizer", 9.47]], null, null, [["music", 49.42], ["synthesizer", 12.74], ["didgeridoo", 10.62]]], "duration": [19.98, 0.31, -0.34, -0.13, 7.28, 7.51, 11.37, 0.06, 15.98, 2.16, 6.3, 0.16, 0.28, 10.77]} \ No newline at end of file diff --git a/annotations_filtered/f_GI8syIgIs_filtered.json b/annotations_filtered/f_GI8syIgIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b0d96cae94d9098f04a2adb34d4c8ec0f4234e0 --- /dev/null +++ b/annotations_filtered/f_GI8syIgIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.9], [19.0, 23.21], [24.0, 25.44], [28.0, 31.92], [35.0, 36.53], [37.0, 36.59], [37.0, 39.33], [42.0, 99.76], [102.0, 105.38], [107.0, 108.36], [109.0, 110.71], [111.0, 112.43]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 81.17, 0.0, 52.68, 0.0, 0.0, 31.07, 0.0, 38.3, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 48.25], ["drum machine", 12.45], ["speech", 8.12]], null, [["speech", 57.56], ["hum", 7.48], ["radio", 4.52]], null, null, null], "duration": [0.9, 4.21, 1.44, 3.92, 1.53, -0.41, 2.33, 57.76, 3.38, 1.36, 1.71, 1.43]} \ No newline at end of file diff --git a/annotations_filtered/f_LDdElm9fc_filtered.json b/annotations_filtered/f_LDdElm9fc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb3d421efb26f3488ad169b38f717f7e803797fa --- /dev/null +++ b/annotations_filtered/f_LDdElm9fc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 15.35], [20.0, 48.17], [49.0, 51.19], [51.0, 60.44], [63.0, 63.39], [64.0, 102.32], [107.0, 110.25], [117.0, 129.47], [130.0, 130.77], [132.0, 138.15], [139.0, 139.78], [141.0, 143.41], [145.0, 145.5]], "keep_status": [true, true, true, false, false, false, true, false, false, false, false, false, false], "silence_prob": [29.24, 28.49, 34.44, 29.55, 0.0, 0.0, 28.21, 29.03, 0.0, 29.65, 0.0, 96.42, 0.0], "audiomae_on_audioset": [[["mains hum", 33.1], ["hum", 22.2], ["music", 13.89]], [["speech", 47.4], ["music", 15.51], ["hum", 6.18]], [["music", 35.49], ["speech", 24.0], ["electronic music", 4.87]], [["mains hum", 46.37], ["hum", 42.12], ["music", 2.9]], null, null, [["music", 14.94], ["hum", 13.72], ["mains hum", 9.28]], [["speech", 54.72], ["music", 21.99], ["sidetone", 6.46]], null, [["music", 39.7], ["throbbing", 22.17], ["hum", 20.15]], null, null, null], "duration": [7.35, 28.17, 2.19, 9.44, 0.39, 38.32, 3.25, 12.47, 0.77, 6.15, 0.78, 2.41, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/f_Pc2_cTQnk_filtered.json b/annotations_filtered/f_Pc2_cTQnk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..097182dd7d0ce9d058498bb6b6ec71cc6fd936a4 --- /dev/null +++ b/annotations_filtered/f_Pc2_cTQnk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.19], [18.0, 37.03], [39.0, 46.94], [48.0, 48.79], [52.0, 57.42], [58.0, 61.42], [66.0, 72.94], [75.0, 77.52], [78.0, 91.37], [92.0, 129.54], [134.0, 134.81], [137.0, 137.81], [140.0, 141.37], [148.0, 148.88], [156.0, 156.36], [160.0, 161.11], [161.0, 162.45], [169.0, 169.38]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.74, 52.16, 0.0, 60.42, 50.97, 47.7, 48.69, 44.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 27.19], ["hum", 10.58], ["cat", 9.41]], null, null, null, null, [["hum", 50.12], ["mains hum", 11.14], ["arrow", 10.89]], [["sidetone", 32.96], ["speech", 28.36], ["sine wave", 11.15]], [["speech", 28.34], ["mains hum", 19.74], ["hum", 18.8]], null, null, null, null, null, null, null, null, null], "duration": [0.19, 19.03, 7.94, 0.79, 5.42, 3.42, 6.94, 2.52, 13.37, 37.54, 0.81, 0.81, 1.37, 0.88, 0.36, 1.11, 1.45, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/f_XHjqABQQA_filtered.json b/annotations_filtered/f_XHjqABQQA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bea1dd998308bac9ee6c780ecca4b229a99dec68 --- /dev/null +++ b/annotations_filtered/f_XHjqABQQA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.53], [10.0, 12.5], [13.0, 13.86], [16.0, 17.09], [17.0, 18.57], [22.0, 24.07], [27.0, 27.7], [38.0, 42.36], [47.0, 47.68], [48.0, 48.63], [50.0, 51.66], [62.0, 61.64], [65.0, 67.32], [72.0, 72.62], [78.0, 79.34], [80.0, 92.15], [95.0, 95.59], [110.0, 110.73], [120.0, 121.8]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 41.24, 0.0, 0.0, 0.0, 41.09, 0.0, 39.49, 0.0, 0.0, 0.0, 0.0, 39.31, 0.0, 0.0, 46.36, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 33.16], ["music", 26.68], ["synthesizer", 8.48]], null, null, null, [["music", 49.99], ["didgeridoo", 37.8], ["musical instrument", 3.22]], null, [["music", 28.07], ["speech", 17.3], ["throbbing", 13.22]], null, null, null, null, [["music", 36.98], ["throbbing", 17.91], ["hum", 10.59]], null, null, [["speech", 38.51], ["heart sounds, heartbeat", 6.42], ["hum", 5.97]], null, null, null], "duration": [0.53, 2.5, 0.86, 1.09, 1.57, 2.07, 0.7, 4.36, 0.68, 0.63, 1.66, -0.36, 2.32, 0.62, 1.34, 12.15, 0.59, 0.73, 1.8]} \ No newline at end of file diff --git a/annotations_filtered/f_lRMCPHbuY_filtered.json b/annotations_filtered/f_lRMCPHbuY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58745498bdec76dcc8174e5e0bb8ebde088a4d9d --- /dev/null +++ b/annotations_filtered/f_lRMCPHbuY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.93], [5.0, 24.39], [26.0, 27.28], [28.0, 30.62], [32.0, 33.3], [35.0, 35.06], [37.0, 37.98], [42.0, 43.09], [46.0, 47.66], [49.0, 50.19], [51.0, 51.66], [52.0, 54.19], [57.0, 57.47], [59.0, 59.85], [61.0, 61.67], [64.0, 70.75], [75.0, 79.76], [87.0, 89.48], [90.0, 90.69], [99.0, 99.74], [102.0, 102.66], [106.0, 108.99], [111.0, 112.72], [121.0, 122.4], [124.0, 124.66]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 53.53, 0.0, 41.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.64, 0.0, 0.0, 0.0, 38.3, 51.34, 43.35, 0.0, 0.0, 0.0, 70.86, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["fly, housefly", 27.64], ["insect", 12.53], ["speech", 9.69]], null, null, null, null, null, null, null, [["hum", 31.15], ["speech", 21.13], ["throbbing", 9.85]], null, null, null, [["sidetone", 36.26], ["speech", 22.84], ["fly, housefly", 7.92]], null, [["hum", 33.18], ["rumble", 8.02], ["whale vocalization", 5.95]], null, null, null, null, null, null, null], "duration": [0.93, 19.39, 1.28, 2.62, 1.3, 0.06, 0.98, 1.09, 1.66, 1.19, 0.66, 2.19, 0.47, 0.85, 0.67, 6.75, 4.76, 2.48, 0.69, 0.74, 0.66, 2.99, 1.72, 1.4, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/f_sRtGI7Y0g_filtered.json b/annotations_filtered/f_sRtGI7Y0g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87d85812af263a029a9ba9159e249c8229df9405 --- /dev/null +++ b/annotations_filtered/f_sRtGI7Y0g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.9], [24.0, 24.07], [26.0, 27.4], [28.0, 28.05], [29.0, 29.02], [38.0, 38.23], [39.0, 39.36], [43.0, 42.77], [56.0, 57.28], [68.0, 72.94], [76.0, 77.18], [79.0, 81.23], [82.0, 83.67], [86.0, 86.32], [95.0, 98.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.9, 0.07, 1.4, 0.05, 0.02, 0.23, 0.36, -0.23, 1.28, 4.94, 1.18, 2.23, 1.67, 0.32, 3.1]} \ No newline at end of file diff --git a/annotations_filtered/f_xjQNnIcdQ_filtered.json b/annotations_filtered/f_xjQNnIcdQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22fd0e5fe3cba3dd6878d4e9099444ab6b00f071 --- /dev/null +++ b/annotations_filtered/f_xjQNnIcdQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.14], [21.0, 22.44], [24.0, 38.35], [41.0, 49.49], [51.0, 52.29], [56.0, 59.29], [60.0, 60.81], [68.0, 79.32], [80.0, 89.51], [91.0, 96.84], [101.0, 127.7]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.68, 32.94, 0.0, 34.4, 0.0, 31.03, 31.33, 31.53, 31.38], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 37.55], ["livestock, farm animals, working animals", 29.83], ["moo", 27.96]], [["cattle, bovinae", 49.09], ["moo", 38.43], ["livestock, farm animals, working animals", 12.45]], null, [["music", 45.0], ["sidetone", 11.25], ["speech", 7.45]], null, [["cattle, bovinae", 40.84], ["moo", 35.95], ["livestock, farm animals, working animals", 19.41]], [["cattle, bovinae", 42.61], ["moo", 34.31], ["livestock, farm animals, working animals", 17.12]], [["cattle, bovinae", 46.92], ["moo", 38.89], ["livestock, farm animals, working animals", 14.01]], [["music", 71.97], ["synthesizer", 3.2], ["speech", 2.09]]], "duration": [0.14, 1.44, 14.35, 8.49, 1.29, 3.29, 0.81, 11.32, 9.51, 5.84, 26.7]} \ No newline at end of file diff --git a/annotations_filtered/f_zpkjkB8ac_filtered.json b/annotations_filtered/f_zpkjkB8ac_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d42e6bae912728f5e076e973b316991a0dee99bb --- /dev/null +++ b/annotations_filtered/f_zpkjkB8ac_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.78], [7.0, 17.24], [25.0, 25.47], [31.0, 32.07], [37.0, 38.92], [42.0, 45.82], [48.0, 48.29], [53.0, 54.01], [58.0, 58.09], [76.0, 76.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 81.17, 0.0, 0.0, 0.0, 84.07, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [-0.22, 10.24, 0.47, 1.07, 1.92, 3.82, 0.29, 1.01, 0.09, 0.15]} \ No newline at end of file diff --git a/annotations_filtered/fa4IKrf2YHI_filtered.json b/annotations_filtered/fa4IKrf2YHI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1375d57ef642c7d6b020f160ab2108a422d6eed9 --- /dev/null +++ b/annotations_filtered/fa4IKrf2YHI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.42], [3.0, 4.04], [4.0, 5.09], [14.0, 16.28], [19.0, 20.02], [21.0, 21.36], [22.0, 24.06], [28.0, 29.59], [30.0, 30.69], [31.0, 31.5], [33.0, 35.11], [36.0, 38.45], [42.0, 43.5], [44.0, 46.87], [48.0, 49.27], [54.0, 55.95], [58.0, 59.91], [69.0, 70.92], [72.0, 74.78], [76.0, 77.4], [78.0, 79.24], [84.0, 85.78], [88.0, 88.84], [90.0, 90.51], [93.0, 93.61], [94.0, 97.31], [104.0, 110.79], [115.0, 117.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 98.73, 0.0, 0.0, 99.87, 0.0, 0.0, 0.0, 100.0, 99.99, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 96.04, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.42, 1.04, 1.09, 2.28, 1.02, 0.36, 2.06, 1.59, 0.69, 0.5, 2.11, 2.45, 1.5, 2.87, 1.27, 1.95, 1.91, 1.92, 2.78, 1.4, 1.24, 1.78, 0.84, 0.51, 0.61, 3.31, 6.79, 2.26]} \ No newline at end of file diff --git a/annotations_filtered/faEbd7LEDOw_filtered.json b/annotations_filtered/faEbd7LEDOw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fab67d7bd788ebcc92954bceccdfc62ed8ba3c3f --- /dev/null +++ b/annotations_filtered/faEbd7LEDOw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.61], [4.0, 5.41], [7.0, 7.11], [14.0, 14.55], [17.0, 16.82], [34.0, 34.03], [38.0, 42.01], [48.0, 52.74], [55.0, 55.48], [59.0, 67.37], [71.0, 71.69], [73.0, 73.16], [74.0, 74.76], [78.0, 79.03], [80.0, 79.89], [87.0, 87.0], [102.0, 103.17], [104.0, 104.85], [106.0, 106.29], [112.0, 120.61], [129.0, 129.09], [130.0, 136.17], [139.0, 139.78], [141.0, 141.27], [142.0, 142.13], [144.0, 144.34], [146.0, 146.7], [150.0, 150.28], [151.0, 151.6], [153.0, 153.66], [155.0, 155.16], [165.0, 165.2], [166.0, 166.94], [170.0, 170.58], [174.0, 174.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52, 52.92, 0.0, 55.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 0.0, 59.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.61, 1.41, 0.11, 0.55, -0.18, 0.03, 4.01, 4.74, 0.48, 8.37, 0.69, 0.16, 0.76, 1.03, -0.11, 0.0, 1.17, 0.85, 0.29, 8.61, 0.09, 6.17, 0.78, 0.27, 0.13, 0.34, 0.7, 0.28, 0.6, 0.66, 0.16, 0.2, 0.94, 0.58, 0.8]} \ No newline at end of file diff --git a/annotations_filtered/faMh6OYfuNE_filtered.json b/annotations_filtered/faMh6OYfuNE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..029450d4bae516d7dbadf214100fee50d100f221 --- /dev/null +++ b/annotations_filtered/faMh6OYfuNE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.48], [9.0, 9.12], [12.0, 12.88], [15.0, 15.2], [26.0, 28.21], [32.0, 33.27], [39.0, 39.93], [48.0, 49.0], [55.0, 56.25], [60.0, 60.2], [63.0, 64.66], [70.0, 73.13], [80.0, 82.43], [101.0, 102.32], [105.0, 104.97], [107.0, 110.3], [121.0, 121.44], [122.0, 123.16], [124.0, 125.2], [126.0, 126.81], [130.0, 130.32], [138.0, 138.08], [147.0, 147.23], [152.0, 153.05], [155.0, 155.95], [163.0, 163.7], [167.0, 168.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 90.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.17, 91.13, 0.0, 0.0, 99.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 21.72], ["thunk", 10.51], ["fly, housefly", 10.28]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.48, 0.12, 0.88, 0.2, 2.21, 1.27, 0.93, 1.0, 1.25, 0.2, 1.66, 3.13, 2.43, 1.32, -0.03, 3.3, 0.44, 1.16, 1.2, 0.81, 0.32, 0.08, 0.23, 1.05, 0.95, 0.7, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/faRFVdrRpws_filtered.json b/annotations_filtered/faRFVdrRpws_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed797af7139b23d711d58a9c0490ee9302e25b4e --- /dev/null +++ b/annotations_filtered/faRFVdrRpws_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.35], [9.0, 10.54], [15.0, 15.82], [25.0, 25.98], [34.0, 33.88], [38.0, 38.67], [42.0, 42.57], [63.0, 64.66], [76.0, 75.96], [77.0, 79.34], [83.0, 85.09], [92.0, 92.8], [96.0, 97.75], [103.0, 103.1], [107.0, 107.47], [113.0, 115.75], [117.0, 117.49], [118.0, 117.59], [118.0, 118.25], [119.0, 120.61], [124.0, 123.74], [129.0, 128.83], [146.0, 145.98], [147.0, 148.14], [153.0, 155.88], [159.0, 164.25], [167.0, 172.99], [182.0, 186.95]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.91, 42.42, 0.0, 0.0, 0.0, 0.0, 39.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.46, 30.6, 29.91, 30.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 56.85], ["theremin", 7.75], ["singing", 3.1]], [["music", 33.41], ["theremin", 29.62], ["speech", 7.31]], null, null, null, null, [["music", 77.08], ["theremin", 4.32], ["musical instrument", 2.11]], null, null, null, null, null, null, null, null, [["music", 62.64], ["theremin", 9.63], ["opera", 5.82]], [["music", 64.6], ["synthesizer", 6.62], ["theremin", 6.08]], [["music", 56.68], ["theremin", 10.26], ["foghorn", 4.97]], [["music", 51.24], ["theremin", 23.64], ["singing", 2.33]]], "duration": [0.35, 1.54, 0.82, 0.98, -0.12, 0.67, 0.57, 1.66, -0.04, 2.34, 2.09, 0.8, 1.75, 0.1, 0.47, 2.75, 0.49, -0.41, 0.25, 1.61, -0.26, -0.17, -0.02, 1.14, 2.88, 5.25, 5.99, 4.95]} \ No newline at end of file diff --git a/annotations_filtered/faX23LNpQGg_filtered.json b/annotations_filtered/faX23LNpQGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e245727e9bd443a07988cb8aa62aedb101dc0a03 --- /dev/null +++ b/annotations_filtered/faX23LNpQGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.57], [17.0, 18.94], [22.0, 23.97], [25.0, 25.86], [28.0, 28.81], [30.0, 30.05], [32.0, 33.66], [35.0, 37.98], [40.0, 40.17], [42.0, 42.7], [44.0, 44.74], [45.0, 45.91], [47.0, 47.39], [48.0, 57.28], [58.0, 60.05], [67.0, 69.47], [71.0, 73.25], [75.0, 76.45], [78.0, 79.02], [80.0, 81.8], [84.0, 84.87], [86.0, 106.34], [110.0, 110.03], [112.0, 117.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.08, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 90.6, 83.52, 100.0, 0.0, 0.0, 0.0, 0.0, 96.29, 0.0, 98.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.57, 1.94, 1.97, 0.86, 0.81, 0.05, 1.66, 2.98, 0.17, 0.7, 0.74, 0.91, 0.39, 9.28, 2.05, 2.47, 2.25, 1.45, 1.02, 1.8, 0.87, 20.34, 0.03, 5.75]} \ No newline at end of file diff --git a/annotations_filtered/farC0cWkpvc_filtered.json b/annotations_filtered/farC0cWkpvc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..742d95441dda655d797ac6d27b7a3f22950b3966 --- /dev/null +++ b/annotations_filtered/farC0cWkpvc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.82], [4.0, 5.88], [7.0, 8.18], [9.0, 10.27], [12.0, 15.85], [18.0, 19.4], [21.0, 25.34], [27.0, 29.03], [32.0, 33.62], [37.0, 37.69], [39.0, 40.37], [41.0, 45.93], [48.0, 49.35], [50.0, 50.55], [53.0, 56.25], [57.0, 58.29], [62.0, 64.0], [65.0, 65.04], [66.0, 69.58], [72.0, 72.25], [74.0, 74.93], [77.0, 77.72], [79.0, 79.17], [80.0, 81.18], [84.0, 85.01], [85.0, 85.97], [88.0, 88.87], [90.0, 91.3], [94.0, 113.46], [116.0, 116.94], [117.0, 117.61], [119.0, 119.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 97.54, 0.0, 89.01, 88.83, 0.0, 0.0, 0.0, 96.17, 0.0, 0.0, 64.86, 0.0, 99.59, 0.0, 95.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.82, 1.88, 1.18, 1.27, 3.85, 1.4, 4.34, 2.03, 1.62, 0.69, 1.37, 4.93, 1.35, 0.55, 3.25, 1.29, 2.0, 0.04, 3.58, 0.25, 0.93, 0.72, 0.17, 1.18, 1.01, 0.97, 0.87, 1.3, 19.46, 0.94, 0.61, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/fb-9_MV15I4_filtered.json b/annotations_filtered/fb-9_MV15I4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/fb-9_MV15I4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/fbDgv4huUp4_filtered.json b/annotations_filtered/fbDgv4huUp4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa44cfaa29d7f9b4c7465bf84d7fee9e68258d85 --- /dev/null +++ b/annotations_filtered/fbDgv4huUp4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 55.11], [55.0, 56.05], [58.0, 64.45], [68.0, 70.53], [72.0, 72.82], [77.0, 77.06], [80.0, 80.42], [83.0, 86.56], [87.0, 88.6], [92.0, 101.51], [104.0, 105.98], [107.0, 115.1], [117.0, 138.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 38.62, 92.64, 0.0, 0.0, 0.0, 43.13, 0.0, 29.37, 0.0, 30.41, 31.32], "audiomae_on_audioset": [null, null, [["music", 47.2], ["hum", 16.46], ["throbbing", 13.69]], null, null, null, null, [["hum", 44.46], ["throbbing", 14.59], ["music", 12.22]], null, [["speech", 38.06], ["music", 30.58], ["crowd", 4.98]], null, [["music", 48.08], ["speech", 14.88], ["thunk", 3.83]], [["music", 20.52], ["gong", 14.62], ["speech", 10.63]]], "duration": [48.11, 1.05, 6.45, 2.53, 0.82, 0.06, 0.42, 3.56, 1.6, 9.51, 1.98, 8.1, 21.6]} \ No newline at end of file diff --git a/annotations_filtered/fbNz1vlRSyM_filtered.json b/annotations_filtered/fbNz1vlRSyM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b986be8170544c20d167209992bea816e5824d8e --- /dev/null +++ b/annotations_filtered/fbNz1vlRSyM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.18], [0.0, 5.51], [13.0, 13.46], [18.0, 19.21], [21.0, 21.19], [22.0, 38.75], [43.0, 72.1], [74.0, 74.88]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.72, 0.0, 0.0, 0.0, 30.77, 30.85, 0.0], "audiomae_on_audioset": [null, [["music", 79.45], ["didgeridoo", 1.56], ["electronic music", 1.45]], null, null, null, [["music", 81.33], ["musical instrument", 2.61], ["singing", 2.22]], [["music", 65.89], ["yodeling", 8.78], ["singing", 4.25]], null], "duration": [0.18, 5.51, 0.46, 1.21, 0.19, 16.75, 29.1, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/fbR1gtlY7FM_filtered.json b/annotations_filtered/fbR1gtlY7FM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40454eb811f461b4681b8438027526950cbf0d3b --- /dev/null +++ b/annotations_filtered/fbR1gtlY7FM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 73.38]], "keep_status": [false], "silence_prob": [30.58], "audiomae_on_audioset": [[["vehicle", 44.31], ["skidding", 21.74], ["car", 15.11]]], "duration": [25.38]} \ No newline at end of file diff --git a/annotations_filtered/fbYS5f3GFek_filtered.json b/annotations_filtered/fbYS5f3GFek_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e290f2f0324243e741d02dade47d8eea133a1d4d --- /dev/null +++ b/annotations_filtered/fbYS5f3GFek_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.84], [5.0, 6.57], [11.0, 13.17], [17.0, 19.21], [21.0, 22.49], [24.0, 24.93], [26.0, 28.53], [29.0, 32.32], [39.0, 51.7], [53.0, 53.84], [55.0, 56.22], [56.0, 56.44], [56.0, 58.46], [62.0, 63.1]], "keep_status": [false, false, true, true, false, false, true, true, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 41.05, 46.09, 0.0, 0.0, 41.64, 47.5, 42.69, 0.0, 0.0, 0.0, 34.76, 0.0], "audiomae_on_audioset": [null, null, [["music", 51.26], ["didgeridoo", 9.47], ["speech", 6.14]], [["music", 56.16], ["speech", 5.95], ["musical instrument", 4.28]], null, null, [["music", 46.23], ["guitar", 7.24], ["bass guitar", 5.96]], [["music", 38.29], ["guitar", 7.34], ["hum", 6.3]], [["speech", 42.82], ["music", 37.27], ["drip", 4.22]], null, null, null, [["music", 15.1], ["thunk", 11.32], ["speech", 4.96]], null], "duration": [0.84, 1.57, 2.17, 2.21, 1.49, 0.93, 2.53, 3.32, 12.7, 0.84, 1.22, 0.44, 2.46, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/fbbatiKJ6rQ_filtered.json b/annotations_filtered/fbbatiKJ6rQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a742b86cbc56686b8b2620d9caf2eb3a74e97c60 --- /dev/null +++ b/annotations_filtered/fbbatiKJ6rQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.66], [12.0, 45.52], [49.0, 49.22], [50.0, 50.35], [60.0, 66.73], [67.0, 66.78], [67.0, 66.9], [67.0, 67.58], [69.0, 69.84], [74.0, 74.34], [77.0, 77.67], [82.0, 82.29], [82.0, 85.87], [91.0, 91.03], [92.0, 93.88], [99.0, 100.87], [105.0, 106.17], [107.0, 107.72]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [33.17, 0.0, 0.0, 0.0, 31.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.26, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 37.76], ["beatboxing", 12.51], ["drum machine", 6.54]], null, null, null, [["speech", 66.09], ["crowd", 4.77], ["hum", 2.74]], null, null, null, null, null, null, null, [["mains hum", 21.79], ["hum", 15.53], ["speech", 11.84]], null, null, null, null, null], "duration": [2.66, 33.52, 0.22, 0.35, 6.73, -0.22, -0.1, 0.58, 0.84, 0.34, 0.67, 0.29, 3.87, 0.03, 1.88, 1.87, 1.17, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/fbkfr-S420o_filtered.json b/annotations_filtered/fbkfr-S420o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ec8da8ed604e2b9600ea410b6b6c67b47b356a0 --- /dev/null +++ b/annotations_filtered/fbkfr-S420o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.86], [20.0, 21.73], [22.0, 23.09], [28.0, 28.07], [29.0, 31.06], [32.0, 36.66], [38.0, 39.12], [41.0, 42.52], [45.0, 47.97], [49.0, 50.68], [52.0, 51.68], [54.0, 53.91], [55.0, 55.66], [57.0, 58.24], [60.0, 63.69], [66.0, 67.58], [69.0, 71.81], [75.0, 75.14], [77.0, 78.36], [79.0, 82.16], [85.0, 88.92], [92.0, 93.6], [96.0, 97.63]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.11, 95.64, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.4, 0.0, 33.48, 0.0, 0.0, 33.43, 34.56, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 20.68], ["livestock, farm animals, working animals", 17.78], ["moo", 9.18]], null, null, null, null, null, null, null, null, null, [["music", 28.23], ["boing", 18.25], ["sidetone", 11.08]], null, [["music", 53.36], ["speech", 26.8], ["boing", 1.51]], null, null, [["music", 54.58], ["speech", 32.76], ["synthesizer", 3.55]], [["music", 57.48], ["speech", 30.24], ["synthesizer", 2.75]], null, null], "duration": [0.86, 1.73, 1.09, 0.07, 2.06, 4.66, 1.12, 1.52, 2.97, 1.68, -0.32, -0.09, 0.66, 1.24, 3.69, 1.58, 2.81, 0.14, 1.36, 3.16, 3.92, 1.6, 1.63]} \ No newline at end of file diff --git a/annotations_filtered/fbrN51dPm0I_filtered.json b/annotations_filtered/fbrN51dPm0I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f17fa2f8993c5be89c2b6ddd0ad1e2687a999a12 --- /dev/null +++ b/annotations_filtered/fbrN51dPm0I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.38], [8.0, 8.33], [10.0, 11.37], [14.0, 14.37], [15.0, 15.9], [16.0, 16.41], [16.0, 17.25], [28.0, 28.17], [30.0, 32.48], [73.0, 74.04], [113.0, 113.81], [114.0, 115.15], [120.0, 120.11], [120.0, 122.0], [124.0, 127.26], [130.0, 131.03], [133.0, 134.7], [136.0, 136.0], [137.0, 137.59], [140.0, 158.43], [162.0, 170.75], [172.0, 173.52]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.77, 0.0, 0.0, 0.0, 0.0, 60.6, 57.89, 0.0, 0.0, 0.0, 0.0, 36.05, 33.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 17.81], ["mains hum", 13.99], ["speech", 12.68]], null, null, null, null, null, null, null, null, null, null, [["music", 68.7], ["didgeridoo", 5.91], ["hum", 4.39]], [["hum", 43.04], ["mains hum", 24.12], ["music", 16.65]], null], "duration": [0.38, 0.33, 1.37, 0.37, 0.9, 0.41, 1.25, 0.17, 2.48, 1.04, 0.81, 1.15, 0.11, 2.0, 3.26, 1.03, 1.7, 0.0, 0.59, 18.43, 8.75, 1.52]} \ No newline at end of file diff --git a/annotations_filtered/fbwsXqUpZRU_filtered.json b/annotations_filtered/fbwsXqUpZRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22827955fa6692e4e500fdaedc6a3213d7a2d228 --- /dev/null +++ b/annotations_filtered/fbwsXqUpZRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.94], [4.0, 5.22], [6.0, 9.32], [10.0, 16.6], [17.0, 18.74], [20.0, 30.96], [43.0, 43.78], [47.0, 47.16], [65.0, 65.94], [68.0, 69.82], [93.0, 93.77], [95.0, 123.42], [124.0, 130.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 81.0, 55.81, 0.0, 97.33, 0.0, 0.0, 0.0, 0.0, 0.0, 36.64, 31.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 75.04], ["musical instrument", 5.66], ["keyboard (musical)", 1.46]], [["speech", 64.76], ["ding", 3.32], ["music", 3.28]]], "duration": [0.94, 1.22, 3.32, 6.6, 1.74, 10.96, 0.78, 0.16, 0.94, 1.82, 0.77, 28.42, 6.98]} \ No newline at end of file diff --git a/annotations_filtered/fc0uxTiUDrE_filtered.json b/annotations_filtered/fc0uxTiUDrE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..98166ef1c3188515181cc170e89b6596c6a568d4 --- /dev/null +++ b/annotations_filtered/fc0uxTiUDrE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.64], [15.0, 14.79], [26.0, 26.08], [31.0, 31.5], [38.0, 47.04], [49.0, 49.4], [66.0, 66.14], [67.0, 67.47], [73.0, 73.84], [75.0, 75.03], [87.0, 87.67], [103.0, 103.03], [106.0, 109.38], [111.0, 110.61], [112.0, 113.44], [115.0, 115.64], [116.0, 117.1], [117.0, 118.29], [122.0, 122.69], [128.0, 129.44], [131.0, 130.6], [134.0, 134.82], [136.0, 136.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 65.61], ["hum", 7.52], ["mains hum", 7.38]], null, null, null, null, null, null, null, [["speech", 55.79], ["radio", 22.36], ["sidetone", 6.99]], null, null, null, null, null, null, null, null, null, null], "duration": [1.64, -0.21, 0.08, 0.5, 9.04, 0.4, 0.14, 0.47, 0.84, 0.03, 0.67, 0.03, 3.38, -0.39, 1.44, 0.64, 1.1, 1.29, 0.69, 1.44, -0.4, 0.82, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/fcFKVVHQn7o_filtered.json b/annotations_filtered/fcFKVVHQn7o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65a0fce49901011f421145d92fe725e4f5a173f3 --- /dev/null +++ b/annotations_filtered/fcFKVVHQn7o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.0], [10.0, 12.02], [13.0, 25.24], [27.0, 26.76], [29.0, 29.19], [30.0, 31.04], [34.0, 34.89], [35.0, 38.57], [39.0, 42.72], [43.0, 44.09], [48.0, 69.4], [74.0, 75.44], [78.0, 80.69], [81.0, 81.84], [82.0, 84.67], [88.0, 91.1], [95.0, 95.34], [96.0, 104.8], [107.0, 118.89], [120.0, 128.11], [132.0, 149.05]], "keep_status": [false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, true, false, true, true, false, false], "silence_prob": [55.11, 44.99, 35.28, 0.0, 0.0, 0.0, 0.0, 49.97, 38.09, 0.0, 33.9, 0.0, 60.6, 0.0, 59.77, 35.76, 0.0, 35.01, 35.46, 35.36, 32.54], "audiomae_on_audioset": [null, [["music", 28.84], ["trombone", 22.62], ["brass instrument", 21.05]], [["music", 73.88], ["wind instrument, woodwind instrument", 4.13], ["musical instrument", 3.14]], null, null, null, null, [["music", 44.5], ["musical instrument", 7.62], ["foghorn", 6.35]], [["music", 28.29], ["mains hum", 11.77], ["hum", 9.12]], null, [["music", 54.11], ["tabla", 7.45], ["drum", 3.86]], null, null, null, null, [["music", 53.05], ["musical instrument", 6.58], ["drum", 5.41]], null, [["music", 31.99], ["speech", 30.07], ["buzz", 7.0]], [["music", 58.48], ["horse", 4.59], ["brass instrument", 4.56]], [["music", 73.45], ["fart", 3.05], ["didgeridoo", 2.47]], [["music", 75.19], ["theremin", 4.59], ["musical instrument", 2.9]]], "duration": [2.0, 2.02, 12.24, -0.24, 0.19, 1.04, 0.89, 3.57, 3.72, 1.09, 21.4, 1.44, 2.69, 0.84, 2.67, 3.1, 0.34, 8.8, 11.89, 8.11, 17.05]} \ No newline at end of file diff --git a/annotations_filtered/fcfYrTFbM94_filtered.json b/annotations_filtered/fcfYrTFbM94_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0422f808533f1a9470303640f68c88e418efe8e --- /dev/null +++ b/annotations_filtered/fcfYrTFbM94_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.26], [10.0, 9.86], [12.0, 14.55], [15.0, 21.56], [24.0, 25.54], [26.0, 26.32], [27.0, 27.23], [30.0, 30.81], [33.0, 33.66], [35.0, 35.19], [40.0, 42.57], [44.0, 48.42], [52.0, 53.55], [54.0, 54.95], [56.0, 57.1], [65.0, 65.48], [68.0, 68.71], [75.0, 74.85], [83.0, 83.71], [85.0, 85.36], [87.0, 87.54], [90.0, 91.18], [92.0, 92.77], [95.0, 95.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.25, 0.0, 99.98, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 99.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.26, -0.14, 2.55, 6.56, 1.54, 0.32, 0.23, 0.81, 0.66, 0.19, 2.57, 4.42, 1.55, 0.95, 1.1, 0.48, 0.71, -0.15, 0.71, 0.36, 0.54, 1.18, 0.77, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/fcnYQxHinu0_filtered.json b/annotations_filtered/fcnYQxHinu0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ecccf0aa9c8d24663cc305cdb2aba70988e6455 --- /dev/null +++ b/annotations_filtered/fcnYQxHinu0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.43], [7.0, 6.89], [12.0, 12.38], [12.0, 12.5], [13.0, 12.85], [19.0, 19.2], [22.0, 22.84], [29.0, 29.22], [30.0, 30.4], [35.0, 35.5], [39.0, 39.65], [41.0, 43.95], [46.0, 46.31], [47.0, 47.73], [49.0, 49.33], [58.0, 58.92], [59.0, 60.96], [63.0, 66.09], [67.0, 67.54], [71.0, 73.13], [74.0, 74.6], [82.0, 86.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.55, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.16, 0.0, 52.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 65.17], ["boing", 8.14], ["synthesizer", 2.74]], null, null, null, null, null, null, null, null, null, null], "duration": [0.43, -0.11, 0.38, 0.5, -0.15, 0.2, 0.84, 0.22, 0.4, 0.5, 0.65, 2.95, 0.31, 0.73, 0.33, 0.92, 1.96, 3.09, 0.54, 2.13, 0.6, 4.48]} \ No newline at end of file diff --git a/annotations_filtered/fdOrjwuILCE_filtered.json b/annotations_filtered/fdOrjwuILCE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac3cd5d83a260add874350b5629d7d5a540e8ef4 --- /dev/null +++ b/annotations_filtered/fdOrjwuILCE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 27.46], [29.0, 42.8], [45.0, 46.21], [47.0, 48.59], [50.0, 54.94], [56.0, 61.6], [63.0, 65.72], [66.0, 67.73], [68.0, 69.63], [71.0, 71.36], [72.0, 74.38], [76.0, 77.68], [79.0, 90.04], [90.0, 92.06], [103.0, 103.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [66.03, 99.93, 0.0, 0.0, 97.83, 88.64, 99.88, 0.0, 0.0, 0.0, 99.92, 0.0, 77.2, 38.25, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.02], ["hum", 13.81], ["electronic music", 6.45]], null], "duration": [8.46, 13.8, 1.21, 1.59, 4.94, 5.6, 2.72, 1.73, 1.63, 0.36, 2.38, 1.68, 11.04, 2.06, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/fdSW39wQL_8_filtered.json b/annotations_filtered/fdSW39wQL_8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e796520a06b1b5abdb3ba9ce65452b2754e1af81 --- /dev/null +++ b/annotations_filtered/fdSW39wQL_8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.57], [26.0, 30.81], [34.0, 39.88], [47.0, 51.33], [51.0, 51.36], [55.0, 56.4], [66.0, 66.9], [87.0, 90.53], [91.0, 102.64], [116.0, 118.45], [121.0, 123.28], [125.0, 125.44]], "keep_status": [false, false, true, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 55.67, 33.49, 41.54, 0.0, 0.0, 0.0, 39.91, 42.06, 99.82, 98.51, 0.0], "audiomae_on_audioset": [null, null, [["speech", 52.83], ["animal", 5.41], ["buzz", 3.45]], [["speech", 21.13], ["fly, housefly", 18.69], ["insect", 13.47]], null, null, null, [["chant", 31.27], ["mantra", 10.88], ["music", 10.59]], [["speech", 81.39], ["music", 6.41], ["musical instrument", 2.06]], null, null, null], "duration": [0.57, 4.81, 5.88, 4.33, 0.36, 1.4, 0.9, 3.53, 11.64, 2.45, 2.28, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/fdrR3NbPARs_filtered.json b/annotations_filtered/fdrR3NbPARs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7faba9b2f0462861087224bfb7ce239467ba3c1e --- /dev/null +++ b/annotations_filtered/fdrR3NbPARs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.47], [16.0, 16.66], [19.0, 20.97], [26.0, 26.37], [35.0, 35.83], [43.0, 47.28], [48.0, 49.23], [53.0, 53.91], [55.0, 55.43], [59.0, 60.37], [63.0, 64.61], [67.0, 67.66], [82.0, 82.34], [108.0, 108.58], [109.0, 109.41], [118.0, 121.32], [122.0, 122.49], [125.0, 129.24], [132.0, 132.87]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 29.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.7, 0.0, 36.47, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 34.96], ["vehicle", 10.59], ["motorcycle", 5.84]], null, null, null, null, null, null, null, null, null, [["bang", 8.73], ["whack, thwack", 6.93], ["explosion", 6.59]], null, [["music", 41.65], ["throbbing", 12.09], ["whack, thwack", 11.27]], null], "duration": [0.47, 0.66, 1.97, 0.37, 0.83, 4.28, 1.23, 0.91, 0.43, 1.37, 1.61, 0.66, 0.34, 0.58, 0.41, 3.32, 0.49, 4.24, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/feeIOZH7wr4_filtered.json b/annotations_filtered/feeIOZH7wr4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8c95a119f7ae1d3c0e3c9c7b691089a51465d39 --- /dev/null +++ b/annotations_filtered/feeIOZH7wr4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.81], [6.0, 6.4], [14.0, 15.13], [17.0, 17.52], [56.0, 55.83], [58.0, 59.07], [69.0, 69.4], [72.0, 72.22], [77.0, 77.58], [87.0, 88.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 0.4, 1.13, 0.52, -0.17, 1.07, 0.4, 0.22, 0.58, 1.13]} \ No newline at end of file diff --git a/annotations_filtered/fegOYb4_PSk_filtered.json b/annotations_filtered/fegOYb4_PSk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0cca285b134cd25edd9d71c0614a8bac914d9ac0 --- /dev/null +++ b/annotations_filtered/fegOYb4_PSk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 22.38], [23.0, 24.81], [26.0, 27.28], [36.0, 36.0], [39.0, 39.02], [40.0, 45.28], [52.0, 52.62], [54.0, 55.98], [57.0, 57.15], [58.0, 68.89], [69.0, 75.36], [76.0, 80.38], [86.0, 89.28], [92.0, 92.16], [106.0, 106.79], [109.0, 114.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [61.47, 0.0, 0.0, 0.0, 0.0, 42.79, 0.0, 0.0, 0.0, 32.63, 38.28, 46.64, 54.7, 0.0, 0.0, 84.43], "audiomae_on_audioset": [null, null, null, null, null, [["music", 67.15], ["electronic music", 4.89], ["synthesizer", 2.7]], null, null, null, [["music", 47.76], ["synthesizer", 12.63], ["hum", 11.76]], [["music", 32.87], ["throbbing", 22.49], ["hum", 8.68]], [["music", 33.52], ["throbbing", 15.49], ["hum", 12.65]], null, null, null, null], "duration": [20.38, 1.81, 1.28, 0.0, 0.02, 5.28, 0.62, 1.98, 0.15, 10.89, 6.36, 4.38, 3.28, 0.16, 0.79, 5.4]} \ No newline at end of file diff --git a/annotations_filtered/ffR1X6gndvo_filtered.json b/annotations_filtered/ffR1X6gndvo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0393db3dcc69cee5185d67485d338573795e2607 --- /dev/null +++ b/annotations_filtered/ffR1X6gndvo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [5.0, 7.4], [9.0, 9.91], [10.0, 11.72], [13.0, 14.13], [18.0, 18.1], [22.0, 23.82], [25.0, 25.07], [27.0, 27.94], [30.0, 30.94], [33.0, 43.98], [46.0, 47.07], [51.0, 51.76], [53.0, 52.91], [56.0, 57.5], [62.0, 62.97], [66.0, 66.29], [68.0, 68.64], [73.0, 73.53], [77.0, 77.36], [81.0, 80.99], [83.0, 101.12], [101.0, 105.95], [106.0, 112.28], [113.0, 115.84], [117.0, 118.56], [119.0, 119.4], [119.0, 119.94], [121.0, 121.63], [126.0, 126.66], [127.0, 128.16], [130.0, 130.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.52, 99.99, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 2.4, 0.91, 1.72, 1.13, 0.1, 1.82, 0.07, 0.94, 0.94, 10.98, 1.07, 0.76, -0.09, 1.5, 0.97, 0.29, 0.64, 0.53, 0.36, -0.01, 18.12, 4.95, 6.28, 2.84, 1.56, 0.4, 0.94, 0.63, 0.66, 1.16, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/ffknf2fIpiY_filtered.json b/annotations_filtered/ffknf2fIpiY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16abd547edf6abc87a6d93e5a404d782c9eecff9 --- /dev/null +++ b/annotations_filtered/ffknf2fIpiY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.13], [27.0, 27.45], [28.0, 33.37], [35.0, 36.68], [38.0, 38.18], [38.0, 40.91], [42.0, 46.16], [47.0, 47.83], [48.0, 48.56], [50.0, 63.91], [65.0, 65.03], [65.0, 70.06], [71.0, 76.52], [77.0, 79.02], [80.0, 79.79], [80.0, 81.19], [84.0, 84.45], [87.0, 90.48], [91.0, 90.98], [92.0, 93.7]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.73, 0.0, 0.0, 38.17, 40.01, 0.0, 0.0, 45.14, 0.0, 48.02, 48.14, 51.6, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 61.21], ["sidetone", 22.53], ["telephone", 8.84]], [["speech", 45.39], ["grunt", 5.54], ["burping, eructation", 3.67]], null, null, [["sidetone", 12.07], ["speech", 9.22], ["radio", 8.65]], null, [["speech", 58.33], ["sidetone", 8.12], ["radio", 7.55]], [["crushing", 41.49], ["bouncing", 25.04], ["thunk", 6.3]], null, null, null, null, null, null, null], "duration": [1.13, 0.45, 5.37, 1.68, 0.18, 2.91, 4.16, 0.83, 0.56, 13.91, 0.03, 5.06, 5.52, 2.02, -0.21, 1.19, 0.45, 3.48, -0.02, 1.7]} \ No newline at end of file diff --git a/annotations_filtered/ffmSFNEG6pM_filtered.json b/annotations_filtered/ffmSFNEG6pM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e343dbba815487713d11b4701698e0a64399fdfc --- /dev/null +++ b/annotations_filtered/ffmSFNEG6pM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 38.11], [40.0, 73.57], [76.0, 100.09], [100.0, 131.06], [134.0, 138.28], [139.0, 148.49], [149.0, 149.89], [152.0, 168.39], [170.0, 170.77]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 28.87, 0.0, 57.48, 29.57, 0.0, 51.12, 0.0], "audiomae_on_audioset": [null, null, [["music", 66.12], ["throbbing", 8.86], ["didgeridoo", 6.45]], null, null, [["speech", 71.41], ["music", 8.56], ["rumble", 8.33]], null, null, null], "duration": [1.11, 33.57, 24.09, 31.06, 4.28, 9.49, 0.89, 16.39, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/fg-43OlaJtE_filtered.json b/annotations_filtered/fg-43OlaJtE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6e117cbc6080452ed87220af47cc815584716b2 --- /dev/null +++ b/annotations_filtered/fg-43OlaJtE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.54], [12.0, 14.76], [17.0, 19.25], [21.0, 24.8], [27.0, 29.15], [31.0, 31.65], [35.0, 36.02], [37.0, 37.52], [39.0, 39.68], [41.0, 45.98], [48.0, 50.41], [53.0, 53.91], [55.0, 57.4], [58.0, 62.07], [65.0, 66.39], [70.0, 72.13], [73.0, 76.98], [78.0, 85.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.92, 100.0, 95.51, 98.86, 99.98, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 99.99, 99.91, 0.0, 99.52, 99.76, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.54, 2.76, 2.25, 3.8, 2.15, 0.65, 1.02, 0.52, 0.68, 4.98, 2.41, 0.91, 2.4, 4.07, 1.39, 2.13, 3.98, 7.02]} \ No newline at end of file diff --git a/annotations_filtered/fg58hVEY5Og_filtered.json b/annotations_filtered/fg58hVEY5Og_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0706dc64ae82f31923e43b8676bc2818e9c01b49 --- /dev/null +++ b/annotations_filtered/fg58hVEY5Og_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.03], [9.0, 18.3], [21.0, 30.38], [32.0, 32.43], [35.0, 36.12], [37.0, 38.3], [40.0, 42.13], [43.0, 46.16], [48.0, 49.5], [53.0, 53.72], [61.0, 61.25], [63.0, 64.12], [66.0, 67.44], [76.0, 76.08], [81.0, 82.48], [90.0, 92.72], [93.0, 106.64], [107.0, 108.26], [109.0, 109.8], [112.0, 113.78], [116.0, 118.34], [118.0, 126.4]], "keep_status": [true, true, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [47.35, 29.94, 30.15, 0.0, 0.0, 0.0, 30.46, 30.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.68, 33.35, 0.0, 0.0, 0.0, 30.06, 28.82], "audiomae_on_audioset": [[["hum", 31.77], ["mains hum", 22.39], ["noise", 7.0]], [["music", 26.46], ["speech", 19.61], ["sidetone", 19.47]], [["speech", 47.03], ["music", 30.05], ["buzz", 2.7]], null, null, null, [["music", 27.72], ["speech", 27.04], ["vehicle", 6.41]], [["speech", 24.03], ["music", 22.45], ["vehicle", 3.69]], null, null, null, null, null, null, null, [["throbbing", 29.49], ["music", 26.94], ["hum", 19.66]], [["music", 43.54], ["hum", 16.33], ["mains hum", 14.7]], null, null, null, [["music", 52.45], ["noise", 6.63], ["civil defense siren", 3.4]], [["music", 43.18], ["speech", 28.36], ["sidetone", 4.19]]], "duration": [2.03, 9.3, 9.38, 0.43, 1.12, 1.3, 2.13, 3.16, 1.5, 0.72, 0.25, 1.12, 1.44, 0.08, 1.48, 2.72, 13.64, 1.26, 0.8, 1.78, 2.34, 8.4]} \ No newline at end of file diff --git a/annotations_filtered/fgDgZGePcwk_filtered.json b/annotations_filtered/fgDgZGePcwk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0939206360eae6556047421ba8d83125662e8ecb --- /dev/null +++ b/annotations_filtered/fgDgZGePcwk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.69], [3.0, 3.96], [4.0, 4.94], [10.0, 10.17], [14.0, 84.94], [85.0, 119.57], [121.0, 120.99]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.69, 0.96, 0.94, 0.17, 70.94, 34.57, -0.01]} \ No newline at end of file diff --git a/annotations_filtered/fgEjlKNllEU_filtered.json b/annotations_filtered/fgEjlKNllEU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..adbe23ac3201ed587ff0113552d7d79320216cbb --- /dev/null +++ b/annotations_filtered/fgEjlKNllEU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 36.19], [38.0, 39.23], [42.0, 44.88], [48.0, 51.49], [56.0, 58.55], [61.0, 61.62], [63.0, 63.81], [64.0, 64.71], [65.0, 66.07], [67.0, 67.24], [68.0, 68.35], [69.0, 71.31], [74.0, 75.05], [77.0, 78.38], [79.0, 79.95], [80.0, 82.24], [85.0, 85.51], [90.0, 95.79], [97.0, 102.98], [104.0, 106.12], [109.0, 115.45], [116.0, 117.07], [118.0, 118.79], [120.0, 120.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [87.55, 0.0, 89.19, 82.25, 93.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 0.0, 0.0, 0.0, 98.99, 0.0, 99.97, 98.36, 86.45, 60.32, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.19, 1.23, 2.88, 3.49, 2.55, 0.62, 0.81, 0.71, 1.07, 0.24, 0.35, 2.31, 1.05, 1.38, 0.95, 2.24, 0.51, 5.79, 5.98, 2.12, 6.45, 1.07, 0.79, 0.26]} \ No newline at end of file diff --git a/annotations_filtered/fgJ2CaTfaxU_filtered.json b/annotations_filtered/fgJ2CaTfaxU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75498d418a5b992188cc033dae0e52a3ee70ae50 --- /dev/null +++ b/annotations_filtered/fgJ2CaTfaxU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.56], [17.0, 18.17], [28.0, 29.39], [54.0, 54.92], [58.0, 61.23], [66.0, 66.61], [72.0, 72.33], [73.0, 75.0], [88.0, 88.6], [92.0, 93.73], [99.0, 101.43], [103.0, 103.91], [106.0, 106.57], [108.0, 110.93], [111.0, 111.0], [112.0, 112.51], [113.0, 114.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 51.02, 0.0, 0.0, 92.31, 0.0, 0.0, 94.22, 0.0, 0.0, 41.26, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["mosquito", 14.91], ["fly, housefly", 13.5], ["whale vocalization", 7.81]], null, null, null], "duration": [1.56, 1.17, 1.39, 0.92, 3.23, 0.61, 0.33, 2.0, 0.6, 1.73, 2.43, 0.91, 0.57, 2.93, 0.0, 0.51, 1.78]} \ No newline at end of file diff --git a/annotations_filtered/fgPFXXhzBCE_filtered.json b/annotations_filtered/fgPFXXhzBCE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd3c226078568c4d0e3ed4840d2133a3d8fd20dd --- /dev/null +++ b/annotations_filtered/fgPFXXhzBCE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.0], [6.0, 6.47], [13.0, 14.18], [15.0, 15.96], [18.0, 19.62], [22.0, 26.57], [28.0, 28.32], [29.0, 30.54], [33.0, 36.88], [38.0, 44.27], [45.0, 45.49], [47.0, 48.17], [49.0, 50.26], [51.0, 52.73], [54.0, 56.02], [59.0, 59.54], [61.0, 61.32], [65.0, 66.46], [71.0, 71.83], [72.0, 73.06], [76.0, 81.95], [85.0, 84.99], [85.0, 85.73], [86.0, 87.12], [88.0, 87.93], [89.0, 89.41], [90.0, 91.81], [93.0, 93.95], [100.0, 103.3], [104.0, 104.87], [107.0, 106.84], [109.0, 108.85], [110.0, 112.9], [114.0, 114.86], [116.0, 116.78], [118.0, 118.71], [120.0, 121.27], [131.0, 131.97], [133.0, 133.71], [135.0, 137.1], [139.0, 140.66], [142.0, 143.58], [144.0, 144.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 63.21, 0.0, 0.0, 98.01, 82.61, 0.0, 0.0, 0.0, 0.0, 67.13, 0.0, 0.0, 0.0, 0.0, 0.0, 35.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.54, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.6, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whack, thwack", 33.66], ["speech", 30.83], ["fart", 4.96]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.0, 0.47, 1.18, 0.96, 1.62, 4.57, 0.32, 1.54, 3.88, 6.27, 0.49, 1.17, 1.26, 1.73, 2.02, 0.54, 0.32, 1.46, 0.83, 1.06, 5.95, -0.01, 0.73, 1.12, -0.07, 0.41, 1.81, 0.95, 3.3, 0.87, -0.16, -0.15, 2.9, 0.86, 0.78, 0.71, 1.27, 0.97, 0.71, 2.1, 1.66, 1.58, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/fgbjvvCPa88_filtered.json b/annotations_filtered/fgbjvvCPa88_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b68c0cc217a26d824dfc4f21100a08e7ce2f5074 --- /dev/null +++ b/annotations_filtered/fgbjvvCPa88_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.78], [17.0, 19.31], [20.0, 24.88], [29.0, 29.08], [30.0, 39.48], [41.0, 41.45], [45.0, 45.44], [50.0, 50.68], [54.0, 54.53], [55.0, 61.42], [68.0, 68.55], [74.0, 74.88], [80.0, 81.35], [82.0, 83.98], [86.0, 91.71], [93.0, 97.5]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true], "silence_prob": [0.0, 54.04, 29.68, 0.0, 28.75, 0.0, 0.0, 0.0, 0.0, 46.15, 0.0, 0.0, 0.0, 0.0, 36.12, 30.6], "audiomae_on_audioset": [null, null, [["music", 66.65], ["speech", 9.76], ["vehicle", 3.53]], null, [["hum", 52.73], ["throbbing", 32.29], ["mains hum", 6.15]], null, null, null, null, [["music", 34.87], ["speech", 16.55], ["musical instrument", 5.11]], null, null, null, null, [["speech", 53.27], ["music", 11.93], ["animal", 3.11]], [["noise", 48.25], ["mains hum", 12.57], ["hum", 9.0]]], "duration": [0.78, 2.31, 4.88, 0.08, 9.48, 0.45, 0.44, 0.68, 0.53, 6.42, 0.55, 0.88, 1.35, 1.98, 5.71, 4.5]} \ No newline at end of file diff --git a/annotations_filtered/fgcWfVvT_UM_filtered.json b/annotations_filtered/fgcWfVvT_UM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e405e7b0a4b44b11688427a94b60ac03c8cfb112 --- /dev/null +++ b/annotations_filtered/fgcWfVvT_UM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.32], [11.0, 20.82], [23.0, 22.99], [38.0, 39.65], [45.0, 45.12], [62.0, 62.01], [70.0, 70.17], [72.0, 72.0], [73.0, 73.87], [75.0, 76.18], [89.0, 89.09], [90.0, 91.29], [97.0, 97.11], [98.0, 98.36], [108.0, 108.53], [112.0, 112.48], [113.0, 114.52]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 22.59], ["mechanisms", 20.67], ["rumble", 14.62]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.32, 9.82, -0.01, 1.65, 0.12, 0.01, 0.17, 0.0, 0.87, 1.18, 0.09, 1.29, 0.11, 0.36, 0.53, 0.48, 1.52]} \ No newline at end of file diff --git a/annotations_filtered/fhK8qpO-iD4_filtered.json b/annotations_filtered/fhK8qpO-iD4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86f6c45157dfaef64e2a98493e5fbd2cc6d055e7 --- /dev/null +++ b/annotations_filtered/fhK8qpO-iD4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.33], [5.0, 5.91], [6.0, 9.39], [11.0, 10.86], [12.0, 12.63], [15.0, 16.23], [18.0, 18.23], [19.0, 42.72], [44.0, 47.46], [53.0, 53.65], [55.0, 60.59], [61.0, 64.23], [66.0, 66.21], [68.0, 70.44], [74.0, 74.78], [78.0, 80.7], [81.0, 83.29], [90.0, 90.27], [93.0, 94.9], [105.0, 105.51], [110.0, 113.17], [115.0, 116.21], [117.0, 116.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 68.28, 0.0, 0.0, 0.0, 0.0, 30.22, 60.51, 0.0, 99.99, 91.13, 0.0, 79.94, 0.0, 67.51, 47.43, 0.0, 0.0, 0.0, 32.03, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 77.44], ["throbbing", 4.87], ["hum", 2.27]], null, null, null, null, null, null, null, null, [["music", 65.39], ["musical instrument", 3.37], ["synthesizer", 3.24]], null, null, null, [["music", 60.98], ["throbbing", 15.01], ["hum", 4.98]], null, null], "duration": [1.33, 0.91, 3.39, -0.14, 0.63, 1.23, 0.23, 23.72, 3.46, 0.65, 5.59, 3.23, 0.21, 2.44, 0.78, 2.7, 2.29, 0.27, 1.9, 0.51, 3.17, 1.21, -0.01]} \ No newline at end of file diff --git a/annotations_filtered/fhO2QtGb8tY_filtered.json b/annotations_filtered/fhO2QtGb8tY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a7a50b7e085e3a807a1a2f6140b85a7b4e5423f --- /dev/null +++ b/annotations_filtered/fhO2QtGb8tY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.92], [14.0, 41.15], [43.0, 43.6], [46.0, 48.61], [55.0, 56.05], [58.0, 60.05], [62.0, 64.83], [65.0, 65.43]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.8, 0.0, 100.0, 0.0, 94.52, 53.47, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [1.92, 27.15, 0.6, 2.61, 1.05, 2.05, 2.83, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/fhUXu7x66BA_filtered.json b/annotations_filtered/fhUXu7x66BA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8be5c5cd631f5d70a89c17f7e623e12628f02757 --- /dev/null +++ b/annotations_filtered/fhUXu7x66BA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.26], [6.0, 6.0], [7.0, 9.96], [11.0, 11.1], [11.0, 11.69], [32.0, 33.94], [34.0, 36.19], [41.0, 41.44], [43.0, 43.5], [44.0, 44.52], [46.0, 46.47], [47.0, 47.63], [49.0, 49.32], [50.0, 51.06], [55.0, 57.35], [72.0, 95.45], [98.0, 99.39], [107.0, 109.04], [111.0, 111.82], [115.0, 115.77], [126.0, 126.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [98.86, 0.0, 99.98, 0.0, 0.0, 0.0, 72.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.78, 99.96, 0.0, 47.46, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 58.66], ["hum", 3.0], ["vehicle", 2.6]], null, null, null], "duration": [2.26, 0.0, 2.96, 0.1, 0.69, 1.94, 2.19, 0.44, 0.5, 0.52, 0.47, 0.63, 0.32, 1.06, 2.35, 23.45, 1.39, 2.04, 0.82, 0.77, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/fi7cppyGPPw_filtered.json b/annotations_filtered/fi7cppyGPPw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc6f9f2c73938b031d1fbdfc9bbc2ab83213dbca --- /dev/null +++ b/annotations_filtered/fi7cppyGPPw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.32], [19.0, 20.39], [21.0, 21.91], [28.0, 28.73], [34.0, 35.11], [38.0, 38.18], [39.0, 41.32], [45.0, 45.54], [48.0, 48.51], [51.0, 51.33], [53.0, 54.4], [55.0, 55.75], [56.0, 60.1], [61.0, 61.11], [64.0, 65.04], [66.0, 67.14], [71.0, 71.98], [75.0, 75.17], [76.0, 76.27], [79.0, 85.63], [91.0, 94.26], [102.0, 163.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.1, 0.0, 0.0, 0.0, 0.0, 0.0, 37.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.44, 47.7, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 74.93], ["fart", 9.46], ["inside, small room", 2.43]], null, null, null, null, null, null, [["speech", 92.89], ["burst, pop", 1.06], ["explosion", 1.0]], [["fart", 39.03], ["speech", 27.45], ["clip-clop", 5.89]], null], "duration": [1.32, 1.39, 0.91, 0.73, 1.11, 0.18, 2.32, 0.54, 0.51, 0.33, 1.4, 0.75, 4.1, 0.11, 1.04, 1.14, 0.98, 0.17, 0.27, 6.63, 3.26, 61.07]} \ No newline at end of file diff --git a/annotations_filtered/fiqJGHbv3ys_filtered.json b/annotations_filtered/fiqJGHbv3ys_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6cdba2996c145455ced88d84d7f4d570fe6405e --- /dev/null +++ b/annotations_filtered/fiqJGHbv3ys_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 36.36], [37.0, 44.25], [50.0, 57.6], [59.0, 60.79], [63.0, 63.24], [63.0, 63.27], [63.0, 63.31], [63.0, 63.41], [63.0, 63.58], [66.0, 65.84], [73.0, 72.71], [73.0, 72.74], [81.0, 81.99], [84.0, 85.31], [88.0, 89.41], [98.0, 105.83]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [33.93, 38.36, 34.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.74], "audiomae_on_audioset": [[["speech", 76.63], ["music", 1.87], ["animal", 1.42]], [["speech", 34.03], ["fart", 21.82], ["radio", 8.1]], [["speech", 27.17], ["sidetone", 19.51], ["throbbing", 5.48]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.61], ["hum", 17.57], ["mains hum", 7.77]]], "duration": [5.36, 7.25, 7.6, 1.79, 0.24, 0.27, 0.31, 0.41, 0.58, -0.16, -0.29, -0.26, 0.99, 1.31, 1.41, 7.83]} \ No newline at end of file diff --git a/annotations_filtered/fiziIJ6zTU8_filtered.json b/annotations_filtered/fiziIJ6zTU8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32aa5dfad35347dbcd276f576f6102e6fe72ea1e --- /dev/null +++ b/annotations_filtered/fiziIJ6zTU8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 42.85], [43.0, 66.95], [69.0, 123.3], [124.0, 124.44], [125.0, 125.32]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 31.18, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 58.55], ["speech", 9.37], ["electronic music", 4.25]], null, null, null], "duration": [0.85, 23.95, 54.3, 0.44, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/fjAnmRjjY3E_filtered.json b/annotations_filtered/fjAnmRjjY3E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..457f1d2ce170a1775c5dd7cde34edee74b7dcda8 --- /dev/null +++ b/annotations_filtered/fjAnmRjjY3E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.47], [11.0, 24.09], [26.0, 39.5], [40.0, 94.07]], "keep_status": [false, false, true, false], "silence_prob": [0.0, 28.63, 28.62, 0.0], "audiomae_on_audioset": [null, [["speech", 65.23], ["music", 18.87], ["whack, thwack", 3.94]], [["music", 35.79], ["throbbing", 17.37], ["hum", 7.58]], null], "duration": [1.47, 13.09, 13.5, 54.07]} \ No newline at end of file diff --git a/annotations_filtered/fjVyrWdUy0c_filtered.json b/annotations_filtered/fjVyrWdUy0c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63bfe2ea8102ab4fdcf4c4650880e0edb0ac2970 --- /dev/null +++ b/annotations_filtered/fjVyrWdUy0c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.07], [6.0, 6.91], [10.0, 11.33], [21.0, 21.12], [23.0, 23.43], [27.0, 26.82], [28.0, 30.0], [33.0, 33.2], [41.0, 42.09], [53.0, 59.14], [61.0, 61.52], [63.0, 63.59], [68.0, 72.33], [80.0, 80.55], [81.0, 86.43], [96.0, 103.42], [103.0, 103.5], [104.0, 107.84], [111.0, 111.06], [114.0, 114.12], [118.0, 118.44], [121.0, 122.3], [123.0, 123.92]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 47.74, 0.0, 0.0, 99.59, 0.0, 97.22, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 40.65], ["speech", 15.26], ["thunk", 4.41]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.07, 0.91, 1.33, 0.12, 0.43, -0.18, 2.0, 0.2, 1.09, 6.14, 0.52, 0.59, 4.33, 0.55, 5.43, 7.42, 0.5, 3.84, 0.06, 0.12, 0.44, 1.3, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/fjodt2JnWT8_filtered.json b/annotations_filtered/fjodt2JnWT8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2efd4f1fcd15bcbbe9aa6df45d9139a294201750 --- /dev/null +++ b/annotations_filtered/fjodt2JnWT8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.0], [18.0, 18.15], [19.0, 20.53], [22.0, 25.73], [28.0, 30.47], [32.0, 34.69], [36.0, 36.39], [37.0, 38.97], [40.0, 42.18], [49.0, 50.52], [55.0, 56.89], [70.0, 70.5], [75.0, 76.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 96.29, 90.6, 89.19, 0.0, 0.0, 54.3, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 0.15, 1.53, 3.73, 2.47, 2.69, 0.39, 1.97, 2.18, 1.52, 1.89, 0.5, 1.71]} \ No newline at end of file diff --git a/annotations_filtered/fjsZJkL1lB4_filtered.json b/annotations_filtered/fjsZJkL1lB4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad08d72aef8e56909216042603a827136f3137c8 --- /dev/null +++ b/annotations_filtered/fjsZJkL1lB4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.46], [29.0, 84.92], [86.0, 87.71], [90.0, 95.0], [97.0, 111.35], [115.0, 115.48], [119.0, 137.59], [139.0, 138.7], [141.0, 143.56], [146.0, 148.68], [150.0, 151.83], [152.0, 152.83]], "keep_status": [false, false, false, false, true, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 51.99, 31.55, 0.0, 33.2, 0.0, 34.48, 49.64, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 24.92], ["electric shaver, electric razor", 18.18], ["speech", 16.81]], null, [["music", 57.53], ["musical instrument", 10.81], ["didgeridoo", 8.04]], null, [["music", 40.98], ["speech", 18.2], ["croak", 6.64]], [["music", 20.06], ["whale vocalization", 19.78], ["speech", 15.47]], null, null], "duration": [0.46, 55.92, 1.71, 5.0, 14.35, 0.48, 18.59, -0.3, 2.56, 2.68, 1.83, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/fjzcBqz2Cpk_filtered.json b/annotations_filtered/fjzcBqz2Cpk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..782aa552139498c3905d8c56b57de7d69ea95db6 --- /dev/null +++ b/annotations_filtered/fjzcBqz2Cpk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 18.32], [23.0, 30.42], [37.0, 41.47], [43.0, 44.98], [46.0, 58.09], [61.0, 62.99], [65.0, 69.67], [72.0, 80.72], [82.0, 83.71], [84.0, 88.7], [89.0, 93.46], [95.0, 98.02], [99.0, 101.22], [103.0, 105.68], [108.0, 121.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [57.81, 55.18, 64.29, 0.0, 80.82, 0.0, 97.73, 88.83, 0.0, 77.87, 92.48, 89.19, 97.73, 91.98, 58.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.32, 7.42, 4.47, 1.98, 12.09, 1.99, 4.67, 8.72, 1.71, 4.7, 4.46, 3.02, 2.22, 2.68, 13.88]} \ No newline at end of file diff --git a/annotations_filtered/fk0O_cdBbMg_filtered.json b/annotations_filtered/fk0O_cdBbMg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9423c7c2a9dc3927ce7c29d05e3b303794c2fd60 --- /dev/null +++ b/annotations_filtered/fk0O_cdBbMg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.13], [10.0, 10.37], [15.0, 16.5], [17.0, 18.35], [19.0, 41.39], [52.0, 52.29], [57.0, 57.75], [61.0, 64.15], [65.0, 93.38], [94.0, 96.08], [106.0, 106.68], [108.0, 110.22], [111.0, 120.18], [125.0, 126.71], [131.0, 131.67], [132.0, 141.59], [143.0, 147.5], [156.0, 156.09], [159.0, 159.65], [160.0, 159.97], [167.0, 175.02], [185.0, 185.73]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.7, 0.0, 0.0, 55.53, 33.77, 33.74, 0.0, 77.87, 48.31, 0.0, 0.0, 36.46, 32.76, 0.0, 0.0, 0.0, 31.54, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 62.56], ["didgeridoo", 10.05], ["musical instrument", 5.06]], null, null, null, [["music", 29.54], ["speech", 23.55], ["livestock, farm animals, working animals", 10.6]], [["fly, housefly", 25.89], ["mosquito", 19.18], ["insect", 10.25]], null, null, [["music", 65.29], ["carnatic music", 3.9], ["livestock, farm animals, working animals", 3.25]], null, null, [["music", 63.16], ["speech", 16.9], ["didgeridoo", 6.51]], [["cattle, bovinae", 23.44], ["moo", 21.64], ["livestock, farm animals, working animals", 19.66]], null, null, null, [["sheep", 28.19], ["speech", 20.49], ["bleat", 10.14]], null], "duration": [1.13, 0.37, 1.5, 1.35, 22.39, 0.29, 0.75, 3.15, 28.38, 2.08, 0.68, 2.22, 9.18, 1.71, 0.67, 9.59, 4.5, 0.09, 0.65, -0.03, 8.02, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/fk2MU617-Bc_filtered.json b/annotations_filtered/fk2MU617-Bc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af17ce31a7c2b29300ffb5e57ce610fd3ec298f3 --- /dev/null +++ b/annotations_filtered/fk2MU617-Bc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 15.42], [17.0, 17.09], [18.0, 18.93], [20.0, 20.63], [23.0, 24.38], [28.0, 28.32], [31.0, 33.32], [34.0, 40.9], [41.0, 43.6], [44.0, 46.5], [47.0, 48.39], [49.0, 51.63], [57.0, 57.33], [61.0, 61.65], [62.0, 63.85], [65.0, 69.53]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [94.81, 0.0, 0.0, 0.0, 0.0, 0.0, 83.7, 34.49, 99.21, 99.48, 0.0, 84.98, 0.0, 0.0, 0.0, 97.33], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 17.92], ["speech", 14.83], ["explosion", 5.31]], null, null, null, null, null, null, null, null], "duration": [5.42, 0.09, 0.93, 0.63, 1.38, 0.32, 2.32, 6.9, 2.6, 2.5, 1.39, 2.63, 0.33, 0.65, 1.85, 4.53]} \ No newline at end of file diff --git a/annotations_filtered/fk7GWw7MagU_filtered.json b/annotations_filtered/fk7GWw7MagU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8b8c2eff0b0e6ee0615c04f43c1fefa1f3628de --- /dev/null +++ b/annotations_filtered/fk7GWw7MagU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.72], [8.0, 12.06], [13.0, 14.79], [16.0, 18.06], [21.0, 21.98], [23.0, 24.63], [27.0, 29.93], [31.0, 31.6], [32.0, 33.34], [34.0, 36.63], [41.0, 42.4], [47.0, 48.27], [49.0, 49.72], [50.0, 56.35], [57.0, 59.64], [61.0, 61.05], [62.0, 62.68], [65.0, 66.26], [73.0, 75.51], [78.0, 78.95], [83.0, 84.03], [87.0, 89.88], [94.0, 95.59], [96.0, 111.33], [114.0, 121.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 86.09, 0.0, 87.37, 0.0, 0.0, 89.72, 0.0, 0.0, 56.03, 0.0, 0.0, 0.0, 91.81, 72.31, 0.0, 0.0, 0.0, 91.98, 0.0, 0.0, 42.69, 0.0, 62.17, 43.93], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 54.6], ["sidetone", 15.98], ["tuning fork", 6.28]], null, null, [["music", 73.52], ["synthesizer", 5.19], ["ambient music", 2.7]]], "duration": [1.72, 4.06, 1.79, 2.06, 0.98, 1.63, 2.93, 0.6, 1.34, 2.63, 1.4, 1.27, 0.72, 6.35, 2.64, 0.05, 0.68, 1.26, 2.51, 0.95, 1.03, 2.88, 1.59, 15.33, 7.53]} \ No newline at end of file diff --git a/annotations_filtered/fkHlhiG0h70_filtered.json b/annotations_filtered/fkHlhiG0h70_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42d89d98d8c6e4e7b4100430998c7322c6e587fa --- /dev/null +++ b/annotations_filtered/fkHlhiG0h70_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[51.0, 50.95], [51.0, 51.49], [52.0, 59.0], [63.0, 71.49], [73.0, 77.7], [80.0, 84.28], [86.0, 86.44], [90.0, 92.53], [96.0, 97.61]], "keep_status": [false, false, true, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 36.8, 35.55, 38.7, 29.07, 0.0, 42.51, 0.0], "audiomae_on_audioset": [null, null, [["frog", 31.91], ["radio", 29.18], ["mosquito", 4.74]], [["mosquito", 16.46], ["whale vocalization", 15.36], ["hum", 12.74]], [["mains hum", 50.27], ["hum", 31.15], ["fly, housefly", 2.06]], [["mains hum", 35.3], ["hum", 28.01], ["fly, housefly", 15.42]], null, [["mains hum", 19.4], ["hum", 17.19], ["frog", 7.81]], null], "duration": [-0.05, 0.49, 7.0, 8.49, 4.7, 4.28, 0.44, 2.53, 1.61]} \ No newline at end of file diff --git a/annotations_filtered/fki-LTswICw_filtered.json b/annotations_filtered/fki-LTswICw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1919d7f1496682667b8ccae882914c2e296675c9 --- /dev/null +++ b/annotations_filtered/fki-LTswICw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.98], [8.0, 12.85], [16.0, 33.83], [37.0, 38.65], [44.0, 45.17], [49.0, 51.68], [52.0, 60.67], [61.0, 83.88], [84.0, 84.28], [90.0, 114.12], [129.0, 131.03], [133.0, 133.78], [139.0, 142.15], [144.0, 158.8], [159.0, 160.57]], "keep_status": [false, true, true, false, false, true, false, false, false, true, true, false, false, true, false], "silence_prob": [0.0, 43.74, 30.56, 0.0, 0.0, 38.72, 43.85, 31.24, 0.0, 30.16, 46.43, 0.0, 30.19, 30.15, 0.0], "audiomae_on_audioset": [null, [["music", 26.34], ["synthesizer", 9.79], ["hum", 8.51]], [["music", 39.24], ["boing", 18.46], ["speech", 4.45]], null, null, [["music", 30.29], ["speech", 18.84], ["sidetone", 9.58]], [["music", 65.65], ["speech", 3.65], ["hum", 3.04]], [["music", 70.6], ["throbbing", 6.65], ["electronic music", 4.53]], null, [["music", 50.11], ["synthesizer", 5.48], ["sampler", 4.64]], [["music", 38.97], ["synthesizer", 9.23], ["musical instrument", 6.72]], null, [["throbbing", 30.77], ["music", 28.09], ["hum", 26.39]], [["speech", 34.58], ["music", 26.99], ["throbbing", 7.15]], null], "duration": [0.98, 4.85, 17.83, 1.65, 1.17, 2.68, 8.67, 22.88, 0.28, 24.12, 2.03, 0.78, 3.15, 14.8, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/fkiY6TBT4mo_filtered.json b/annotations_filtered/fkiY6TBT4mo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..010e2910f1ff5e642da0b72deb4d7f7be711bca1 --- /dev/null +++ b/annotations_filtered/fkiY6TBT4mo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.59], [2.0, 2.88], [4.0, 4.7], [5.0, 6.67], [8.0, 13.9], [15.0, 15.3], [16.0, 29.73], [33.0, 33.0], [34.0, 35.26], [38.0, 38.8], [40.0, 40.95], [42.0, 42.85], [47.0, 48.02], [50.0, 49.98], [52.0, 52.83], [57.0, 58.16], [61.0, 62.41], [64.0, 66.24], [67.0, 73.6], [74.0, 76.82], [79.0, 81.46], [83.0, 82.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 57.72, 0.0, 50.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 72.46, 61.18, 85.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.41, 0.88, 0.7, 1.67, 5.9, 0.3, 13.73, 0.0, 1.26, 0.8, 0.95, 0.85, 1.02, -0.02, 0.83, 1.16, 1.41, 2.24, 6.6, 2.82, 2.46, -0.07]} \ No newline at end of file diff --git a/annotations_filtered/fls3z7Me2Dc_filtered.json b/annotations_filtered/fls3z7Me2Dc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..69c8e34d12a7c5f27ae2ca5ce19ab89289cc039a --- /dev/null +++ b/annotations_filtered/fls3z7Me2Dc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.62], [4.0, 5.16], [20.0, 20.98], [22.0, 22.65], [25.0, 26.3], [42.0, 42.43], [48.0, 51.22], [52.0, 61.11], [61.0, 61.23], [66.0, 68.86], [73.0, 73.99], [75.0, 77.21], [79.0, 80.16], [84.0, 86.07], [92.0, 92.99], [96.0, 97.01], [99.0, 99.08], [102.0, 103.32], [104.0, 105.31], [107.0, 109.53], [115.0, 115.89], [117.0, 119.1], [126.0, 126.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.47, 43.3, 0.0, 86.82, 0.0, 75.07, 0.0, 65.79, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 49.18, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 69.04], ["electric shaver, electric razor", 15.62], ["fart", 3.68]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.45], ["sidetone", 5.15], ["music", 4.77]], null], "duration": [0.62, 1.16, 0.98, 0.65, 1.3, 0.43, 3.22, 9.11, 0.23, 2.86, 0.99, 2.21, 1.16, 2.07, 0.99, 1.01, 0.08, 1.32, 1.31, 2.53, 0.89, 2.1, 0.35]} \ No newline at end of file diff --git a/annotations_filtered/fltSq_QHbbk_filtered.json b/annotations_filtered/fltSq_QHbbk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a077232cfcaf7576e2ea3de1f7af1e1860f88587 --- /dev/null +++ b/annotations_filtered/fltSq_QHbbk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 59.32], [61.0, 82.19]], "keep_status": [true, true], "silence_prob": [32.77, 37.27], "audiomae_on_audioset": [[["stomach rumble", 32.81], ["radio", 11.27], ["hum", 8.85]], [["music", 18.37], ["synthesizer", 10.91], ["didgeridoo", 8.23]]], "duration": [17.32, 21.19]} \ No newline at end of file diff --git a/annotations_filtered/fluJSCbNpDM_filtered.json b/annotations_filtered/fluJSCbNpDM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..157b39fad3dabad74713d5182f5284bc591653d2 --- /dev/null +++ b/annotations_filtered/fluJSCbNpDM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.16], [11.0, 11.97], [15.0, 18.96], [23.0, 25.39], [30.0, 31.06], [32.0, 33.79], [34.0, 46.97], [49.0, 51.66], [61.0, 61.45], [65.0, 67.26], [69.0, 76.92], [78.0, 79.46], [81.0, 82.73], [86.0, 86.39], [88.0, 92.2], [93.0, 103.25], [105.0, 116.04], [120.0, 120.68], [124.0, 124.73], [126.0, 127.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 75.88, 79.07, 0.0, 0.0, 51.94, 58.22, 0.0, 95.23, 76.04, 0.0, 0.0, 0.0, 73.82, 83.88, 89.01, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 0.97, 3.96, 2.39, 1.06, 1.79, 12.97, 2.66, 0.45, 2.26, 7.92, 1.46, 1.73, 0.39, 4.2, 10.25, 11.04, 0.68, 0.73, 1.63]} \ No newline at end of file diff --git a/annotations_filtered/flvyCwagnF0_filtered.json b/annotations_filtered/flvyCwagnF0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38fe78d7a3003f7640d4cf61aa15436356273032 --- /dev/null +++ b/annotations_filtered/flvyCwagnF0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.15], [4.0, 5.04], [6.0, 6.61], [10.0, 10.98], [13.0, 13.1], [13.0, 13.95], [14.0, 14.88], [17.0, 18.15], [19.0, 22.77], [24.0, 29.84], [33.0, 37.86], [44.0, 44.47], [51.0, 55.22], [56.0, 56.54], [58.0, 59.02], [65.0, 66.38], [68.0, 68.89], [72.0, 77.6], [78.0, 80.4], [86.0, 87.83], [89.0, 91.56], [94.0, 97.92], [99.0, 99.35], [101.0, 101.17], [103.0, 103.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.85, 87.55, 0.0, 96.66, 0.0, 0.0, 0.0, 0.0, 96.89, 99.1, 0.0, 98.99, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.15, 1.04, 0.61, 0.98, 0.1, 0.95, 0.88, 1.15, 3.77, 5.84, 4.86, 0.47, 4.22, 0.54, 1.02, 1.38, 0.89, 5.6, 2.4, 1.83, 2.56, 3.92, 0.35, 0.17, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/fmIaHAtabSU_filtered.json b/annotations_filtered/fmIaHAtabSU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0448ced7dbbdd26d1a7d8c862ef47d4e486b6af4 --- /dev/null +++ b/annotations_filtered/fmIaHAtabSU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 116.34]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [67.34]} \ No newline at end of file diff --git a/annotations_filtered/fmMPmWO6b4E_filtered.json b/annotations_filtered/fmMPmWO6b4E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da1001f034c14273c33524713e05854e1825f5c9 --- /dev/null +++ b/annotations_filtered/fmMPmWO6b4E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 101.33], [103.0, 127.48], [129.0, 151.29]], "keep_status": [false, true, true], "silence_prob": [0.0, 33.17, 31.71], "audiomae_on_audioset": [null, [["music", 44.09], ["throbbing", 10.47], ["whack, thwack", 8.66]], [["music", 29.21], ["whack, thwack", 23.64], ["mosquito", 8.59]]], "duration": [92.33, 24.48, 22.29]} \ No newline at end of file diff --git a/annotations_filtered/fmRWWrBqiJE_filtered.json b/annotations_filtered/fmRWWrBqiJE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..adfaf2292993cdd4caa7bcb438a4d3ca6a2ffc53 --- /dev/null +++ b/annotations_filtered/fmRWWrBqiJE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 12.36], [17.0, 26.5], [27.0, 28.49], [32.0, 38.45], [42.0, 66.56], [68.0, 85.11], [87.0, 86.95], [87.0, 87.4], [89.0, 89.77], [91.0, 161.03], [166.0, 166.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [70.44, 94.95, 0.0, 74.76, 91.81, 71.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [11.36, 9.5, 1.49, 6.45, 24.56, 17.11, -0.05, 0.4, 0.77, 70.03, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/fmT8JstRohg_filtered.json b/annotations_filtered/fmT8JstRohg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0ca4529d6a2af6dadbe06e2e22ea35ae993546d --- /dev/null +++ b/annotations_filtered/fmT8JstRohg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.25], [4.0, 4.75], [27.0, 27.99], [36.0, 36.64]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [1.25, 0.75, 0.99, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/fn5dXUu_qxM_filtered.json b/annotations_filtered/fn5dXUu_qxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c987772d9f4be6d4dd929ea39e052a2e3a2cabe --- /dev/null +++ b/annotations_filtered/fn5dXUu_qxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 43.87], [45.0, 46.52], [51.0, 52.1], [53.0, 54.01], [54.0, 61.37], [62.0, 62.33], [67.0, 68.79], [79.0, 82.09], [85.0, 84.57], [85.0, 85.06], [87.0, 89.38], [91.0, 94.69], [97.0, 97.46], [101.0, 104.11], [107.0, 107.64], [108.0, 109.49], [116.0, 116.8], [120.0, 120.21], [131.0, 132.49], [133.0, 134.7], [136.0, 138.91], [143.0, 144.68], [147.0, 150.13], [151.0, 152.19], [153.0, 154.6], [179.0, 180.64], [183.0, 184.38], [217.0, 217.54], [219.0, 219.6], [224.0, 224.46], [227.0, 227.65], [230.0, 229.78], [235.0, 235.74], [237.0, 239.8], [240.0, 240.58], [252.0, 252.0], [253.0, 253.84], [259.0, 261.32], [265.0, 265.4], [266.0, 266.72]], "keep_status": [true, false, false, false, true, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.31, 0.0, 0.0, 0.0, 43.98, 0.0, 0.0, 44.81, 0.0, 0.0, 95.09, 91.64, 0.0, 43.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.22, 0.0, 81.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.45, 0.0, 0.0, 0.0, 81.35, 0.0, 0.0], "audiomae_on_audioset": [[["insect", 26.21], ["fly, housefly", 22.97], ["mosquito", 15.69]], null, null, null, [["hum", 34.82], ["mains hum", 20.05], ["dishes, pots, and pans", 4.92]], null, null, [["speech", 39.63], ["whale vocalization", 13.57], ["chirp tone", 7.68]], null, null, null, null, null, [["speech", 24.16], ["hum", 20.31], ["mains hum", 14.24]], null, null, null, null, null, null, [["speech", 43.18], ["music", 13.03], ["electronic music", 3.76]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.87, 1.52, 1.1, 1.01, 7.37, 0.33, 1.79, 3.09, -0.43, 0.06, 2.38, 3.69, 0.46, 3.11, 0.64, 1.49, 0.8, 0.21, 1.49, 1.7, 2.91, 1.68, 3.13, 1.19, 1.6, 1.64, 1.38, 0.54, 0.6, 0.46, 0.65, -0.22, 0.74, 2.8, 0.58, 0.0, 0.84, 2.32, 0.4, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/fnF1_aVlIio_filtered.json b/annotations_filtered/fnF1_aVlIio_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..647c858980afa33a5deee43e6f287904d21c7be7 --- /dev/null +++ b/annotations_filtered/fnF1_aVlIio_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.76], [12.0, 12.88], [14.0, 15.97], [17.0, 18.99], [19.0, 21.15], [22.0, 23.79], [24.0, 28.51], [30.0, 35.95], [37.0, 37.84], [42.0, 43.68], [46.0, 46.55], [48.0, 48.36], [49.0, 49.35], [51.0, 51.49], [53.0, 53.62], [55.0, 55.63], [57.0, 58.48], [61.0, 62.53], [64.0, 66.09], [70.0, 84.79], [86.0, 132.0]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 59.86, 0.0, 40.7, 49.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.98, 68.15, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 60.68], ["busy signal", 15.35], ["sidetone", 3.92]], [["heart sounds, heartbeat", 14.8], ["throbbing", 13.32], ["hum", 12.47]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.24, 0.88, 1.97, 1.99, 2.15, 1.79, 4.51, 5.95, 0.84, 1.68, 0.55, 0.36, 0.35, 0.49, 0.62, 0.63, 1.48, 1.53, 2.09, 14.79, 46.0]} \ No newline at end of file diff --git a/annotations_filtered/fnH1ZtugoqU_filtered.json b/annotations_filtered/fnH1ZtugoqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..899375fabccffc65260e21b2a7eaa3f18d58b497 --- /dev/null +++ b/annotations_filtered/fnH1ZtugoqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[81.0, 86.81], [87.0, 90.53], [91.0, 91.44], [93.0, 97.56], [100.0, 108.14]], "keep_status": [false, true, false, false, false], "silence_prob": [40.11, 36.97, 0.0, 38.11, 37.85], "audiomae_on_audioset": [[["music", 55.02], ["theremin", 33.23], ["synthesizer", 2.64]], [["music", 34.18], ["theremin", 13.53], ["synthesizer", 9.27]], null, [["music", 70.32], ["synthesizer", 7.02], ["musical instrument", 4.2]], [["music", 60.12], ["theremin", 10.93], ["musical instrument", 7.72]]], "duration": [5.81, 3.53, 0.44, 4.56, 8.14]} \ No newline at end of file diff --git a/annotations_filtered/fnTckzsYgg0_filtered.json b/annotations_filtered/fnTckzsYgg0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c53a915c1e63700385acaa20b4bc211da47bba1 --- /dev/null +++ b/annotations_filtered/fnTckzsYgg0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 46.23], [53.0, 69.57], [70.0, 79.29]], "keep_status": [false, false, true], "silence_prob": [0.0, 36.61, 35.56], "audiomae_on_audioset": [null, [["music", 53.02], ["speech", 11.19], ["theremin", 8.34]], [["music", 27.08], ["civil defense siren", 8.13], ["hum", 6.88]]], "duration": [37.23, 16.57, 9.29]} \ No newline at end of file diff --git a/annotations_filtered/fniTZP_4V1M_filtered.json b/annotations_filtered/fniTZP_4V1M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22c7c05920e16e6817fa21852754e0447860b583 --- /dev/null +++ b/annotations_filtered/fniTZP_4V1M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.61], [27.0, 28.9], [35.0, 40.2], [41.0, 52.78], [54.0, 54.24], [55.0, 55.76], [57.0, 57.37], [59.0, 63.34], [66.0, 66.24], [67.0, 67.93], [69.0, 68.91], [74.0, 76.28], [77.0, 77.04], [77.0, 78.16], [80.0, 80.45], [82.0, 81.9], [84.0, 84.3], [93.0, 93.11], [95.0, 96.31], [101.0, 102.17], [105.0, 105.68]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 43.93, 85.72, 0.0, 0.0, 0.0, 47.98, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 24.83], ["moo", 22.81], ["speech", 18.42]], null, null, null, null, [["speech", 93.7], ["radio", 1.12], ["inside, small room", 0.54]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.61, 1.9, 5.2, 11.78, 0.24, 0.76, 0.37, 4.34, 0.24, 0.93, -0.09, 2.28, 0.04, 1.16, 0.45, -0.1, 0.3, 0.11, 1.31, 1.17, 0.68]} \ No newline at end of file diff --git a/annotations_filtered/fnpUxSXWy6I_filtered.json b/annotations_filtered/fnpUxSXWy6I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1c1fe33c38e6a080dbaa6b6faeb1aa0fee585c9 --- /dev/null +++ b/annotations_filtered/fnpUxSXWy6I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.75], [15.0, 15.03], [15.0, 15.99], [18.0, 18.1], [21.0, 21.12], [27.0, 27.53], [29.0, 28.93], [32.0, 32.66], [55.0, 55.58], [57.0, 57.69], [59.0, 59.49], [60.0, 64.59], [71.0, 71.83], [73.0, 72.94], [74.0, 74.98], [75.0, 77.31], [78.0, 78.98], [85.0, 84.99], [104.0, 104.41], [104.0, 105.9], [106.0, 107.81], [111.0, 111.4], [117.0, 118.18], [119.0, 120.9], [122.0, 123.67], [130.0, 141.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.41, 0.0, 0.0, 0.0, 61.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.75, 0.03, 0.99, 0.1, 0.12, 0.53, -0.07, 0.66, 0.58, 0.69, 0.49, 4.59, 0.83, -0.06, 0.98, 2.31, 0.98, -0.01, 0.41, 1.9, 1.81, 0.4, 1.18, 1.9, 1.67, 11.2]} \ No newline at end of file diff --git a/annotations_filtered/fo0KBFhChFU_filtered.json b/annotations_filtered/fo0KBFhChFU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..840163d9fba73610c449db64fbd5e40d611d97ea --- /dev/null +++ b/annotations_filtered/fo0KBFhChFU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.76], [13.0, 13.73], [17.0, 17.14], [19.0, 20.06], [21.0, 25.51], [27.0, 27.36], [31.0, 32.02], [33.0, 80.27], [82.0, 90.73]], "keep_status": [false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.24, 0.0, 0.0, 0.0, 32.6], "audiomae_on_audioset": [null, null, null, null, [["music", 29.42], ["hum", 16.5], ["throbbing", 11.04]], null, null, null, [["music", 47.85], ["speech", 22.97], ["throbbing", 4.47]]], "duration": [0.76, 0.73, 0.14, 1.06, 4.51, 0.36, 1.02, 47.27, 8.73]} \ No newline at end of file diff --git a/annotations_filtered/foPh0pXXq-A_filtered.json b/annotations_filtered/foPh0pXXq-A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a724a58cca52b1da0d10541a808b88bd8b9076f --- /dev/null +++ b/annotations_filtered/foPh0pXXq-A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.2], [10.0, 14.82], [20.0, 21.17], [42.0, 44.1]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 38.43, 0.0, 100.0], "audiomae_on_audioset": [null, [["speech", 64.47], ["music", 4.81], ["explosion", 4.4]], null, null], "duration": [1.2, 4.82, 1.17, 2.1]} \ No newline at end of file diff --git a/annotations_filtered/foQnR1eZO-Y_filtered.json b/annotations_filtered/foQnR1eZO-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dca8d6a91d2765959797122d525f7f15b732da2a --- /dev/null +++ b/annotations_filtered/foQnR1eZO-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.15], [4.0, 3.86], [12.0, 12.72], [15.0, 15.43], [17.0, 17.93], [20.0, 20.09], [21.0, 22.0], [25.0, 31.31], [33.0, 34.48], [37.0, 38.13], [38.0, 43.93], [45.0, 48.03], [49.0, 49.67], [50.0, 50.19], [61.0, 63.21], [64.0, 64.89], [68.0, 68.27], [69.0, 71.31], [77.0, 82.9], [85.0, 84.97], [92.0, 91.93], [95.0, 95.82], [105.0, 106.47], [110.0, 110.62], [112.0, 113.07], [117.0, 117.81], [128.0, 129.32], [133.0, 134.7], [138.0, 138.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.81, 0.0, 0.0, 42.79, 53.16, 0.0, 0.0, 70.3, 0.0, 0.0, 49.45, 33.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["cough", 19.87], ["speech", 18.83], ["music", 7.78]], null, null, null, null, null, null, [["whale vocalization", 23.58], ["speech", 23.39], ["hum", 7.98]], [["music", 84.67], ["musical instrument", 3.6], ["guitar", 1.98]], null, null, null, null, null, null, null, null, null, null], "duration": [0.15, -0.14, 0.72, 0.43, 0.93, 0.09, 1.0, 6.31, 1.48, 1.13, 5.93, 3.03, 0.67, 0.19, 2.21, 0.89, 0.27, 2.31, 5.9, -0.03, -0.07, 0.82, 1.47, 0.62, 1.07, 0.81, 1.32, 1.7, 0.86]} \ No newline at end of file diff --git a/annotations_filtered/foV6LGohzBI_filtered.json b/annotations_filtered/foV6LGohzBI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b12869198bddbf047e8a6aa503997a40e5dd6ebe --- /dev/null +++ b/annotations_filtered/foV6LGohzBI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 26.32], [28.0, 29.93], [31.0, 44.79], [50.0, 53.87], [61.0, 64.34], [72.0, 74.63], [81.0, 85.41], [106.0, 109.81], [115.0, 131.7], [133.0, 158.09], [159.0, 191.39], [193.0, 208.67]], "keep_status": [false, false, false, false, true, false, true, true, false, true, false, true], "silence_prob": [40.28, 0.0, 35.05, 38.12, 42.84, 38.04, 35.91, 28.85, 29.13, 28.99, 0.0, 28.77], "audiomae_on_audioset": [[["humming", 83.85], ["theremin", 7.14], ["music", 6.58]], null, [["music", 59.83], ["humming", 19.68], ["theremin", 5.13]], [["music", 71.04], ["theremin", 8.75], ["musical instrument", 2.86]], [["music", 50.8], ["guitar", 3.93], ["plucked string instrument", 3.8]], [["music", 48.73], ["carnatic music", 25.66], ["singing", 4.45]], [["music", 49.86], ["tabla", 11.09], ["carnatic music", 6.56]], [["music", 34.5], ["carnatic music", 20.01], ["tabla", 5.86]], [["music", 93.93], ["singing", 0.68], ["didgeridoo", 0.49]], [["music", 64.8], ["singing", 2.44], ["didgeridoo", 1.61]], null, [["music", 58.58], ["gospel music", 3.65], ["didgeridoo", 3.41]]], "duration": [16.32, 1.93, 13.79, 3.87, 3.34, 2.63, 4.41, 3.81, 16.7, 25.09, 32.39, 15.67]} \ No newline at end of file diff --git a/annotations_filtered/foll8sDGq4M_filtered.json b/annotations_filtered/foll8sDGq4M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..624dc20492fc82860ab440a975f659efbb3d667c --- /dev/null +++ b/annotations_filtered/foll8sDGq4M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 17.29], [20.0, 31.01], [34.0, 49.37], [49.0, 49.42], [50.0, 61.84]], "keep_status": [true, false, false, false, true], "silence_prob": [32.25, 32.3, 32.21, 0.0, 34.14], "audiomae_on_audioset": [[["music", 43.68], ["speech", 20.13], ["whack, thwack", 5.44]], [["music", 69.72], ["didgeridoo", 3.93], ["speech", 3.2]], [["music", 52.27], ["speech", 22.43], ["fart", 3.61]], null, [["music", 34.02], ["boing", 16.69], ["whack, thwack", 9.33]]], "duration": [13.29, 11.01, 15.37, 0.42, 11.84]} \ No newline at end of file diff --git a/annotations_filtered/fp86WZ7Jn5g_filtered.json b/annotations_filtered/fp86WZ7Jn5g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e956815234d54f445cb3c18bd6ac9907d255257d --- /dev/null +++ b/annotations_filtered/fp86WZ7Jn5g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.06], [8.0, 9.63], [10.0, 12.23], [13.0, 16.19], [17.0, 18.62], [22.0, 23.4], [25.0, 28.78], [33.0, 33.42], [35.0, 34.89], [39.0, 40.85], [42.0, 43.61], [44.0, 44.42], [47.0, 47.33], [48.0, 49.99], [52.0, 55.09], [56.0, 58.45], [60.0, 61.18], [63.0, 63.34], [64.0, 67.15], [69.0, 70.01], [70.0, 72.23], [73.0, 75.2], [78.0, 80.35], [82.0, 83.83], [89.0, 90.26], [93.0, 93.19], [95.0, 94.95], [96.0, 101.16], [102.0, 102.47], [104.0, 104.85], [109.0, 109.43], [112.0, 111.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.37, 0.0, 99.21, 99.99, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.9, 0.0, 0.0, 99.56, 0.0, 98.99, 99.93, 96.77, 0.0, 0.0, 0.0, 0.0, 74.29, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.06, 1.63, 2.23, 3.19, 1.62, 1.4, 3.78, 0.42, -0.11, 1.85, 1.61, 0.42, 0.33, 1.99, 3.09, 2.45, 1.18, 0.34, 3.15, 1.01, 2.23, 2.2, 2.35, 1.83, 1.26, 0.19, -0.05, 5.16, 0.47, 0.85, 0.43, -0.21]} \ No newline at end of file diff --git a/annotations_filtered/fpE3kI1HOWQ_filtered.json b/annotations_filtered/fpE3kI1HOWQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60550349d70647888459064644c2151e31a89523 --- /dev/null +++ b/annotations_filtered/fpE3kI1HOWQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.78], [5.0, 5.64], [7.0, 8.65], [10.0, 11.03], [13.0, 14.13], [31.0, 31.38], [33.0, 33.84], [35.0, 35.53], [55.0, 55.22], [57.0, 57.2], [60.0, 62.29], [77.0, 77.08], [79.0, 80.01], [81.0, 81.7], [83.0, 83.51], [85.0, 85.04], [98.0, 97.8], [98.0, 99.5], [103.0, 103.08], [107.0, 107.6], [110.0, 110.46], [113.0, 113.97], [116.0, 117.14], [118.0, 118.81], [120.0, 120.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.78, 0.64, 1.65, 1.03, 1.13, 0.38, 0.84, 0.53, 0.22, 0.2, 2.29, 0.08, 1.01, 0.7, 0.51, 0.04, -0.2, 1.5, 0.08, 0.6, 0.46, 0.97, 1.14, 0.81, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/fpK36FZmTFY_filtered.json b/annotations_filtered/fpK36FZmTFY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1ce36b899971538e8cca21b348ce58ff0f49ab8 --- /dev/null +++ b/annotations_filtered/fpK36FZmTFY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.21], [25.0, 25.19], [26.0, 27.19], [28.0, 28.8], [29.0, 33.44], [79.0, 80.57], [81.0, 82.41], [95.0, 99.59], [100.0, 100.33], [101.0, 131.31], [132.0, 141.1], [143.0, 147.38], [148.0, 152.44], [154.0, 154.04], [159.0, 159.09], [167.0, 167.02], [171.0, 171.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.82, 0.0, 0.0, 99.99, 0.0, 0.0, 83.52, 98.1, 99.93, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 79.36], ["sidetone", 3.72], ["radio", 3.43]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.21, 0.19, 1.19, 0.8, 4.44, 1.57, 1.41, 4.59, 0.33, 30.31, 9.1, 4.38, 4.44, 0.04, 0.09, 0.02, 0.14]} \ No newline at end of file diff --git a/annotations_filtered/fpKl9lrLfx0_filtered.json b/annotations_filtered/fpKl9lrLfx0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1c4a6b1a28fa2c59da2da0981ee1f77ba63ff08 --- /dev/null +++ b/annotations_filtered/fpKl9lrLfx0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.34], [8.0, 9.15], [16.0, 22.03], [29.0, 30.42], [49.0, 60.42], [64.0, 68.52], [70.0, 91.37], [93.0, 106.35], [109.0, 124.51], [125.0, 128.87]], "keep_status": [false, false, true, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 35.1, 0.0, 30.85, 40.11, 34.2, 32.33, 33.48, 35.37], "audiomae_on_audioset": [null, null, [["fly, housefly", 18.59], ["speech", 13.28], ["mosquito", 9.27]], null, [["music", 40.53], ["livestock, farm animals, working animals", 14.9], ["fly, housefly", 7.1]], [["music", 53.46], ["theremin", 20.86], ["synthesizer", 8.44]], [["music", 63.28], ["musical instrument", 6.47], ["throbbing", 4.25]], [["fly, housefly", 27.38], ["hum", 14.17], ["music", 11.88]], [["speech", 53.01], ["music", 26.38], ["whack, thwack", 2.55]], [["music", 43.11], ["theremin", 39.42], ["musical instrument", 3.22]]], "duration": [1.34, 1.15, 6.03, 1.42, 11.42, 4.52, 21.37, 13.35, 15.51, 3.87]} \ No newline at end of file diff --git a/annotations_filtered/fpLdP56W3do_filtered.json b/annotations_filtered/fpLdP56W3do_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd9c587d20a1e7a5eed8b764de598468c4b621f8 --- /dev/null +++ b/annotations_filtered/fpLdP56W3do_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.8], [11.0, 21.86], [23.0, 31.87], [32.0, 32.44], [37.0, 38.21], [39.0, 38.8], [41.0, 45.86], [47.0, 49.05], [50.0, 50.82], [51.0, 51.0], [51.0, 51.33], [51.0, 52.62], [53.0, 52.66], [53.0, 53.81], [55.0, 60.39], [62.0, 63.15], [64.0, 65.08], [72.0, 72.42], [86.0, 102.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.99, 99.16, 0.0, 0.0, 0.0, 86.64, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.3, 0.0, 0.0, 0.0, 71.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.8, 10.86, 8.87, 0.44, 1.21, -0.2, 4.86, 2.05, 0.82, 0.0, 0.33, 1.62, -0.34, 0.81, 5.39, 1.15, 1.08, 0.42, 16.03]} \ No newline at end of file diff --git a/annotations_filtered/fpXngRB-VTw_filtered.json b/annotations_filtered/fpXngRB-VTw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9fc243a6f72ae2d3eecf8e3a5b1992a3b2528539 --- /dev/null +++ b/annotations_filtered/fpXngRB-VTw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.72], [8.0, 7.94], [10.0, 11.16], [20.0, 21.0], [22.0, 23.13], [30.0, 31.56], [36.0, 36.58], [40.0, 43.02], [45.0, 44.96], [47.0, 50.43]], "keep_status": [false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.95, 0.0, 30.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 24.18], ["music", 10.76], ["throbbing", 8.78]], null, [["whale vocalization", 20.87], ["mains hum", 14.06], ["hum", 12.6]]], "duration": [0.72, -0.06, 1.16, 1.0, 1.13, 1.56, 0.58, 3.02, -0.04, 3.43]} \ No newline at end of file diff --git a/annotations_filtered/fpiyrd28vfA_filtered.json b/annotations_filtered/fpiyrd28vfA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26c86c9f8d96468d57a925cc8f83938177b1d58d --- /dev/null +++ b/annotations_filtered/fpiyrd28vfA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 29.88], [85.0, 96.25], [99.0, 101.58], [103.0, 105.54], [107.0, 108.35], [109.0, 112.13], [115.0, 115.91], [117.0, 118.29], [119.0, 120.66], [123.0, 127.16], [129.0, 129.64], [130.0, 130.6], [133.0, 133.61], [134.0, 134.69], [140.0, 140.91], [159.0, 159.34], [162.0, 162.7], [166.0, 165.96], [167.0, 166.99], [173.0, 175.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.35, 38.59, 71.57, 50.46, 0.0, 98.36, 0.0, 0.0, 0.0, 40.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.1], "audiomae_on_audioset": [[["throbbing", 33.04], ["music", 30.98], ["hum", 19.11]], [["speech", 87.12], ["fart", 7.81], ["stomach rumble", 1.91]], null, null, null, null, null, null, null, [["grunt", 84.7], ["speech", 7.95], ["groan", 0.92]], null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 39.09], ["moo", 29.45], ["cattle, bovinae", 29.29]]], "duration": [3.88, 11.25, 2.58, 2.54, 1.35, 3.13, 0.91, 1.29, 1.66, 4.16, 0.64, 0.6, 0.61, 0.69, 0.91, 0.34, 0.7, -0.04, -0.01, 2.73]} \ No newline at end of file diff --git a/annotations_filtered/fpnoVKmulZM_filtered.json b/annotations_filtered/fpnoVKmulZM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07854c4a9084fa82dd217aaf539cca95177b22f0 --- /dev/null +++ b/annotations_filtered/fpnoVKmulZM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.63], [24.0, 30.81], [32.0, 31.63], [33.0, 37.17], [45.0, 45.17], [46.0, 48.25], [90.0, 92.62], [95.0, 100.2], [101.0, 100.99], [104.0, 105.04], [105.0, 110.84], [111.0, 111.54], [113.0, 114.0], [115.0, 119.4], [122.0, 128.26], [129.0, 129.36]], "keep_status": [false, false, false, true, false, true, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 33.94, 0.0, 33.51, 0.0, 33.22, 32.8, 33.37, 0.0, 0.0, 33.79, 0.0, 0.0, 34.01, 35.54, 0.0], "audiomae_on_audioset": [null, [["music", 57.54], ["drum machine", 6.61], ["speech", 6.44]], null, [["music", 49.68], ["speech", 8.88], ["electronic music", 4.96]], null, [["music", 42.04], ["speech", 22.9], ["throbbing", 4.58]], [["music", 25.68], ["speech", 20.27], ["boing", 17.81]], [["music", 66.88], ["quack", 10.43], ["sampler", 1.67]], null, null, [["music", 57.29], ["synthesizer", 6.3], ["drum machine", 4.38]], null, null, [["music", 67.46], ["speech", 4.8], ["drum machine", 3.58]], [["music", 59.33], ["drum machine", 8.76], ["sampler", 4.44]], null], "duration": [1.63, 6.81, -0.37, 4.17, 0.17, 2.25, 2.62, 5.2, -0.01, 1.04, 5.84, 0.54, 1.0, 4.4, 6.26, 0.36]} \ No newline at end of file diff --git a/annotations_filtered/fpwM2-jDwQU_filtered.json b/annotations_filtered/fpwM2-jDwQU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa7cc2edacd01fc3236fc3d041d2266d2bda6579 --- /dev/null +++ b/annotations_filtered/fpwM2-jDwQU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 37.42], [44.0, 44.85], [50.0, 50.38], [51.0, 52.86], [59.0, 65.69], [66.0, 65.94], [66.0, 66.01], [67.0, 68.4], [76.0, 76.94], [88.0, 87.83], [96.0, 96.7], [100.0, 103.44], [112.0, 114.91], [117.0, 119.79], [125.0, 126.62], [129.0, 132.0], [135.0, 134.96], [139.0, 151.71], [153.0, 154.97], [156.0, 155.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [31.79, 0.0, 0.0, 0.0, 32.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.57, 31.32, 37.85, 0.0, 51.77, 0.0, 36.05, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 77.6], ["beatboxing", 5.53], ["boing", 2.56]], null, null, null, [["speech", 76.83], ["mains hum", 4.4], ["electric shaver, electric razor", 3.54]], null, null, null, null, null, null, [["whack, thwack", 50.74], ["breaking", 18.13], ["smash, crash", 7.32]], [["speech", 29.62], ["music", 28.26], ["boing", 10.88]], [["music", 26.87], ["hum", 24.04], ["mains hum", 15.14]], null, null, null, [["music", 33.68], ["hum", 22.64], ["mains hum", 13.88]], null, null], "duration": [2.42, 0.85, 0.38, 1.86, 6.69, -0.06, 0.01, 1.4, 0.94, -0.17, 0.7, 3.44, 2.91, 2.79, 1.62, 3.0, -0.04, 12.71, 1.97, -0.13]} \ No newline at end of file diff --git a/annotations_filtered/fpxPstb2DAU_filtered.json b/annotations_filtered/fpxPstb2DAU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0939028c66e8a08475d877662cf40c0e625456dc --- /dev/null +++ b/annotations_filtered/fpxPstb2DAU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.48], [5.0, 6.81], [7.0, 9.19], [11.0, 10.96], [54.0, 54.8], [59.0, 59.34], [63.0, 65.69], [68.0, 69.38], [71.0, 71.61], [72.0, 73.2], [74.0, 75.47], [78.0, 77.8], [79.0, 80.03], [81.0, 81.03], [83.0, 84.74], [90.0, 91.72], [94.0, 95.99], [96.0, 97.41], [103.0, 103.37], [105.0, 105.92], [107.0, 107.65], [109.0, 110.4], [111.0, 134.62], [135.0, 135.28], [135.0, 145.88], [151.0, 169.72], [174.0, 176.69], [177.0, 177.62], [178.0, 178.56], [180.0, 180.17], [183.0, 183.39], [184.0, 185.13], [186.0, 194.0], [196.0, 196.4], [203.0, 217.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, true, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 51.77, 0.0, 0.0, 0.0, 37.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.17, 0.0, 30.62, 31.43, 33.81, 0.0, 0.0, 0.0, 0.0, 0.0, 33.45, 0.0, 30.17], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 78.68], ["throbbing", 6.39], ["techno", 1.74]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 49.36], ["music", 15.58], ["horse", 4.31]], null, [["music", 53.89], ["brass instrument", 8.52], ["trombone", 6.36]], [["livestock, farm animals, working animals", 41.0], ["music", 17.04], ["moo", 13.82]], [["cattle, bovinae", 23.9], ["livestock, farm animals, working animals", 21.74], ["cowbell", 21.65]], null, null, null, null, null, [["music", 40.63], ["speech", 16.24], ["livestock, farm animals, working animals", 10.03]], null, [["music", 37.63], ["fart", 6.59], ["speech", 4.67]]], "duration": [0.48, 1.81, 2.19, -0.04, 0.8, 0.34, 2.69, 1.38, 0.61, 1.2, 1.47, -0.2, 1.03, 0.03, 1.74, 1.72, 1.99, 1.41, 0.37, 0.92, 0.65, 1.4, 23.62, 0.28, 10.88, 18.72, 2.69, 0.62, 0.56, 0.17, 0.39, 1.13, 8.0, 0.4, 14.7]} \ No newline at end of file diff --git a/annotations_filtered/fq5JFon-LOs_filtered.json b/annotations_filtered/fq5JFon-LOs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..15fb2dda16d91627722bdaab10e551cb38725c33 --- /dev/null +++ b/annotations_filtered/fq5JFon-LOs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.51], [2.0, 2.62], [4.0, 4.85], [7.0, 7.26], [8.0, 8.56], [9.0, 9.66], [11.0, 12.82], [27.0, 27.43], [29.0, 30.1], [31.0, 31.85], [34.0, 34.3], [45.0, 45.08], [46.0, 45.76], [48.0, 48.86], [55.0, 55.02], [56.0, 56.27], [58.0, 59.12], [60.0, 60.62], [79.0, 79.32], [82.0, 82.58], [87.0, 87.67], [89.0, 89.36], [90.0, 90.34], [92.0, 97.46], [98.0, 98.88], [100.0, 100.97], [105.0, 105.17], [107.0, 108.89], [113.0, 114.2], [119.0, 119.15], [120.0, 119.99], [121.0, 121.12], [125.0, 125.37], [127.0, 127.16], [128.0, 129.14], [130.0, 130.5], [134.0, 134.82], [135.0, 135.53], [140.0, 140.16], [141.0, 140.91], [142.0, 141.69], [148.0, 147.83], [149.0, 148.93], [153.0, 153.06], [160.0, 161.03], [168.0, 170.28], [173.0, 173.25], [176.0, 176.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.65, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 56.08], ["music", 30.73], ["thunk", 4.13]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 17.74], ["speech", 12.15], ["animal", 7.43]], null, null], "duration": [0.51, 0.62, 0.85, 0.26, 0.56, 0.66, 1.82, 0.43, 1.1, 0.85, 0.3, 0.08, -0.24, 0.86, 0.02, 0.27, 1.12, 0.62, 0.32, 0.58, 0.67, 0.36, 0.34, 5.46, 0.88, 0.97, 0.17, 1.89, 1.2, 0.15, -0.01, 0.12, 0.37, 0.16, 1.14, 0.5, 0.82, 0.53, 0.16, -0.09, -0.31, -0.17, -0.07, 0.06, 1.03, 2.28, 0.25, 0.13]} \ No newline at end of file diff --git a/annotations_filtered/fqKdFZ1jKMY_filtered.json b/annotations_filtered/fqKdFZ1jKMY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3050ff85e2e6cd13bfb0506e86e79ded70adeb20 --- /dev/null +++ b/annotations_filtered/fqKdFZ1jKMY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 12.36], [13.0, 14.93], [16.0, 20.76], [24.0, 24.09], [26.0, 26.3], [29.0, 29.17], [41.0, 42.33], [48.0, 49.49], [51.0, 53.84], [57.0, 59.86], [64.0, 65.31], [69.0, 71.39], [75.0, 75.76], [77.0, 81.72], [84.0, 92.21], [95.0, 96.67], [98.0, 111.21], [115.0, 118.83], [120.0, 123.16], [125.0, 128.24], [129.0, 132.16], [136.0, 136.17], [140.0, 141.03], [144.0, 153.35], [154.0, 154.85], [155.0, 159.76], [160.0, 159.97]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [34.07, 0.0, 33.02, 0.0, 0.0, 0.0, 0.0, 0.0, 66.39, 33.38, 0.0, 31.39, 0.0, 31.46, 30.18, 0.0, 29.78, 31.91, 35.78, 30.08, 32.85, 0.0, 0.0, 29.7, 0.0, 28.76, 0.0], "audiomae_on_audioset": [[["music", 49.91], ["throbbing", 20.36], ["frog", 4.3]], null, [["music", 47.04], ["speech", 21.13], ["propeller, airscrew", 2.33]], null, null, null, null, null, null, [["music", 26.96], ["speech", 20.65], ["throbbing", 6.4]], null, [["speech", 64.37], ["music", 10.0], ["vehicle", 4.44]], null, [["fly, housefly", 45.33], ["insect", 39.59], ["mosquito", 10.77]], [["music", 81.21], ["didgeridoo", 5.36], ["musical instrument", 3.4]], null, [["music", 36.96], ["speech", 11.21], ["groan", 6.96]], [["music", 64.42], ["speech", 19.44], ["throbbing", 1.14]], [["music", 63.62], ["throbbing", 2.79], ["sampler", 2.64]], [["speech", 43.16], ["music", 24.47], ["whack, thwack", 6.41]], [["music", 78.63], ["creak", 4.52], ["grunt", 4.27]], null, null, [["music", 73.84], ["speech", 16.62], ["electronic music", 1.43]], null, [["music", 33.03], ["speech", 22.94], ["hum", 15.15]], null], "duration": [9.36, 1.93, 4.76, 0.09, 0.3, 0.17, 1.33, 1.49, 2.84, 2.86, 1.31, 2.39, 0.76, 4.72, 8.21, 1.67, 13.21, 3.83, 3.16, 3.24, 3.16, 0.17, 1.03, 9.35, 0.85, 4.76, -0.03]} \ No newline at end of file diff --git a/annotations_filtered/fqM1ttqNA9k_filtered.json b/annotations_filtered/fqM1ttqNA9k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d666b2c9532dd4adfa39b97302ff9914981d65c7 --- /dev/null +++ b/annotations_filtered/fqM1ttqNA9k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.63], [9.0, 9.81], [12.0, 12.78], [15.0, 28.97], [33.0, 33.59], [47.0, 68.2], [70.0, 69.87], [70.0, 70.78], [73.0, 73.67], [76.0, 76.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.35, 0.0, 32.85, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 70.67], ["crying, sobbing", 8.14], ["groan", 3.47]], null, [["speech", 57.89], ["wail, moan", 17.95], ["whimper", 3.71]], null, null, null, null], "duration": [1.63, 0.81, 0.78, 13.97, 0.59, 21.2, -0.13, 0.78, 0.67, 0.27]} \ No newline at end of file diff --git a/annotations_filtered/fq_QSi29iGQ_filtered.json b/annotations_filtered/fq_QSi29iGQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9313365b72730e8ba1d308a0088078f6f1ca3c93 --- /dev/null +++ b/annotations_filtered/fq_QSi29iGQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.63], [19.0, 19.9], [21.0, 26.05], [26.0, 26.35], [26.0, 28.14], [30.0, 31.16], [33.0, 34.11], [35.0, 34.94], [38.0, 43.87], [48.0, 48.49], [49.0, 49.44], [56.0, 56.66], [57.0, 56.73], [57.0, 61.21], [65.0, 64.89], [67.0, 67.61], [69.0, 70.23], [71.0, 72.17], [79.0, 79.81], [86.0, 88.91], [91.0, 93.66], [95.0, 95.61], [97.0, 97.73], [100.0, 104.84], [110.0, 110.2], [111.0, 112.38], [115.0, 127.94]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 47.39, 0.0, 41.07, 0.0, 0.0, 0.0, 46.83, 0.0, 0.0, 0.0, 0.0, 33.24, 0.0, 0.0, 0.0, 0.0, 0.0, 41.78, 31.8, 0.0, 0.0, 30.27, 0.0, 0.0, 32.33], "audiomae_on_audioset": [null, null, [["music", 48.6], ["clarinet", 19.02], ["synthesizer", 6.4]], null, [["speech", 24.57], ["music", 23.77], ["theremin", 17.18]], null, null, null, [["music", 40.23], ["musical instrument", 6.98], ["organ", 6.53]], null, null, null, null, [["speech", 73.95], ["whack, thwack", 1.44], ["vehicle", 1.29]], null, null, null, null, null, [["music", 37.74], ["speech", 26.97], ["synthesizer", 7.15]], [["music", 59.7], ["theremin", 12.97], ["musical instrument", 6.18]], null, null, [["music", 33.43], ["throbbing", 22.42], ["hum", 15.39]], null, null, [["music", 62.19], ["scary music", 6.73], ["electronic music", 4.3]]], "duration": [0.63, 0.9, 5.05, 0.35, 2.14, 1.16, 1.11, -0.06, 5.87, 0.49, 0.44, 0.66, -0.27, 4.21, -0.11, 0.61, 1.23, 1.17, 0.81, 2.91, 2.66, 0.61, 0.73, 4.84, 0.2, 1.38, 12.94]} \ No newline at end of file diff --git a/annotations_filtered/fqnhqkXclUk_filtered.json b/annotations_filtered/fqnhqkXclUk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5087727e2b2475d4efbe7585a9af22a9c2f70917 --- /dev/null +++ b/annotations_filtered/fqnhqkXclUk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 48.91], [52.0, 51.98], [52.0, 52.02], [53.0, 66.51], [67.0, 67.31], [67.0, 67.37], [69.0, 108.57], [109.0, 112.67], [113.0, 113.48], [115.0, 119.42], [120.0, 121.2], [122.0, 122.47], [125.0, 141.66], [144.0, 170.8], [171.0, 172.44], [174.0, 174.8]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.2, 0.0, 0.0, 0.0, 37.12, 0.0, 57.48, 0.0, 0.0, 35.64, 33.68, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 54.42], ["speech", 20.04], ["didgeridoo", 4.03]], null, null, null, [["speech", 21.21], ["mosquito", 18.37], ["fly, housefly", 14.96]], null, null, null, null, [["music", 30.88], ["fireworks", 11.78], ["speech", 11.57]], [["music", 35.28], ["fly, housefly", 5.39], ["vehicle", 4.32]], null, null], "duration": [31.91, -0.02, 0.02, 13.51, 0.31, 0.37, 39.57, 3.67, 0.48, 4.42, 1.2, 0.47, 16.66, 26.8, 1.44, 0.8]} \ No newline at end of file diff --git a/annotations_filtered/fqtFUIQ7oWA_filtered.json b/annotations_filtered/fqtFUIQ7oWA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcbbec5a33df753735121bfd7a731d42f393322d --- /dev/null +++ b/annotations_filtered/fqtFUIQ7oWA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 37.61], [38.0, 40.51], [42.0, 44.36], [50.0, 50.6], [53.0, 63.86], [65.0, 64.96], [67.0, 69.18], [70.0, 70.28], [73.0, 81.5], [83.0, 83.37]], "keep_status": [true, true, true, false, true, false, false, false, false, false], "silence_prob": [31.15, 34.46, 31.22, 0.0, 29.99, 0.0, 32.44, 0.0, 31.17, 0.0], "audiomae_on_audioset": [[["music", 54.74], ["theremin", 6.53], ["cacophony", 4.14]], [["music", 62.29], ["screaming", 2.56], ["musical instrument", 2.45]], [["livestock, farm animals, working animals", 14.18], ["groan", 10.82], ["music", 9.54]], null, [["grunt", 15.08], ["speech", 11.54], ["music", 11.18]], null, [["fly, housefly", 35.97], ["mosquito", 21.11], ["insect", 19.86]], null, [["speech", 33.63], ["music", 28.08], ["boing", 12.94]], null], "duration": [4.61, 2.51, 2.36, 0.6, 10.86, -0.04, 2.18, 0.28, 8.5, 0.37]} \ No newline at end of file diff --git a/annotations_filtered/fr5rDEInWQA_filtered.json b/annotations_filtered/fr5rDEInWQA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9436bf5a401575b725ffd8999a41890dc19fd226 --- /dev/null +++ b/annotations_filtered/fr5rDEInWQA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.69], [31.0, 35.18], [37.0, 37.27], [39.0, 41.0], [44.0, 45.12], [46.0, 47.8], [49.0, 52.96], [53.0, 54.5], [55.0, 56.13], [57.0, 56.84], [58.0, 59.07], [61.0, 61.35], [68.0, 68.99], [69.0, 70.28], [72.0, 72.99], [73.0, 77.99], [83.0, 84.47], [86.0, 86.8], [87.0, 88.16], [89.0, 90.02], [92.0, 92.67], [94.0, 94.47], [95.0, 95.47], [97.0, 97.21], [98.0, 99.79], [104.0, 104.16], [105.0, 107.4], [108.0, 109.04], [110.0, 111.11], [112.0, 113.75], [115.0, 116.07], [121.0, 121.37], [123.0, 129.93], [133.0, 133.49], [135.0, 135.8], [139.0, 138.72], [148.0, 149.76]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 36.84, 0.0, 50.21, 0.0, 0.0, 37.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.63, 0.0, 0.0, 0.0, 0.0, 0.0, 35.29, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 29.09], ["brass instrument", 5.63], ["walk, footsteps", 5.41]], null, null, null, null, [["speech", 76.67], ["radio", 3.01], ["inside, small room", 1.83]], null, null, null, null, null, null, null, null, [["speech", 92.76], ["telephone", 0.64], ["beatboxing", 0.54]], null, null, null, null, null, null, null, null, null, null, [["burping, eructation", 75.96], ["speech", 6.12], ["sound effect", 2.26]], null, null, null, null, null, [["speech", 28.26], ["dishes, pots, and pans", 10.06], ["coin (dropping)", 8.51]], null, null, null, null], "duration": [0.69, 4.18, 0.27, 2.0, 1.12, 1.8, 3.96, 1.5, 1.13, -0.16, 1.07, 0.35, 0.99, 1.28, 0.99, 4.99, 1.47, 0.8, 1.16, 1.02, 0.67, 0.47, 0.47, 0.21, 1.79, 0.16, 2.4, 1.04, 1.11, 1.75, 1.07, 0.37, 6.93, 0.49, 0.8, -0.28, 1.76]} \ No newline at end of file diff --git a/annotations_filtered/fr93wwtiKQM_filtered.json b/annotations_filtered/fr93wwtiKQM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..888a60bd2623c06bb2acb67cd2d45c9889aba7c9 --- /dev/null +++ b/annotations_filtered/fr93wwtiKQM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.99], [5.0, 6.32], [7.0, 7.91], [11.0, 11.47], [14.0, 15.35], [17.0, 18.47], [21.0, 22.54], [24.0, 24.56], [26.0, 28.04], [29.0, 33.17], [34.0, 35.51], [37.0, 39.56], [41.0, 52.57], [53.0, 62.56], [66.0, 92.85], [95.0, 106.29], [108.0, 136.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 99.99, 63.31, 65.91, 56.63, 61.67, 31.31], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.96], ["hum", 8.39], ["mains hum", 7.65]]], "duration": [-0.01, 1.32, 0.91, 0.47, 1.35, 1.47, 1.54, 0.56, 2.04, 4.17, 1.51, 2.56, 11.57, 9.56, 26.85, 11.29, 28.24]} \ No newline at end of file diff --git a/annotations_filtered/frE9rXnaHpE_filtered.json b/annotations_filtered/frE9rXnaHpE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/frE9rXnaHpE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/frIi1u8PAlc_filtered.json b/annotations_filtered/frIi1u8PAlc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42c9e9262683327defae3b3ad5fc2b21fd9ed71e --- /dev/null +++ b/annotations_filtered/frIi1u8PAlc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.86], [5.0, 6.12], [8.0, 9.14], [10.0, 11.35], [12.0, 12.5], [14.0, 15.92], [18.0, 24.26], [25.0, 27.35], [27.0, 28.36], [30.0, 31.65], [33.0, 34.79], [37.0, 40.44], [41.0, 44.27], [45.0, 49.2], [50.0, 52.81], [54.0, 57.38], [60.0, 60.54], [61.0, 64.54], [65.0, 65.37], [66.0, 67.15], [67.0, 71.19], [74.0, 94.76], [96.0, 97.65], [98.0, 99.6], [101.0, 107.92], [109.0, 115.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 89.9, 99.94, 99.96, 98.73, 99.85, 0.0, 99.97, 0.0, 0.0, 98.8, 99.99, 0.0, 0.0, 99.97, 99.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.86, 1.12, 1.14, 1.35, 0.5, 1.92, 6.26, 2.35, 1.36, 1.65, 1.79, 3.44, 3.27, 4.2, 2.81, 3.38, 0.54, 3.54, 0.37, 1.15, 4.19, 20.76, 1.65, 1.6, 6.92, 6.65]} \ No newline at end of file diff --git a/annotations_filtered/frTBOhJ0XHU_filtered.json b/annotations_filtered/frTBOhJ0XHU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5d8246f1091415c50e2d5518117987007a7bbc7 --- /dev/null +++ b/annotations_filtered/frTBOhJ0XHU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 24.43], [25.0, 25.46], [26.0, 27.63], [28.0, 33.3], [34.0, 50.79], [51.0, 64.74], [73.0, 78.78], [84.0, 84.23], [86.0, 86.39], [87.0, 88.53], [89.0, 91.12], [92.0, 93.01], [94.0, 95.0], [96.0, 100.35], [101.0, 101.29], [102.0, 102.14], [103.0, 107.43], [108.0, 109.11], [111.0, 114.88]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [79.24, 0.0, 0.0, 63.74, 43.74, 40.68, 34.93, 0.0, 0.0, 0.0, 60.6, 0.0, 0.0, 76.04, 0.0, 0.0, 81.71, 0.0, 88.64], "audiomae_on_audioset": [null, null, null, null, [["music", 54.88], ["theremin", 21.46], ["didgeridoo", 3.08]], [["music", 74.59], ["musical instrument", 4.95], ["drum", 3.9]], [["speech", 14.78], ["radio", 11.37], ["music", 9.48]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.43, 0.46, 1.63, 5.3, 16.79, 13.74, 5.78, 0.23, 0.39, 1.53, 2.12, 1.01, 1.0, 4.35, 0.29, 0.14, 4.43, 1.11, 3.88]} \ No newline at end of file diff --git a/annotations_filtered/frV4tvni8H0_filtered.json b/annotations_filtered/frV4tvni8H0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a17d3838378b6e5167c4dd6387782f23954c9d3 --- /dev/null +++ b/annotations_filtered/frV4tvni8H0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.59], [16.0, 16.41], [18.0, 18.1], [23.0, 23.23], [24.0, 24.87], [27.0, 27.41], [29.0, 33.34], [36.0, 43.6], [44.0, 44.44], [45.0, 46.01], [48.0, 57.05], [63.0, 64.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.83, 0.0, 0.0, 0.0, 0.0, 0.0, 29.39, 28.83, 0.0, 0.0, 29.38, 0.0], "audiomae_on_audioset": [[["music", 61.69], ["speech", 6.77], ["sheep", 6.73]], null, null, null, null, null, [["music", 74.47], ["static", 1.93], ["didgeridoo", 1.91]], [["music", 79.03], ["static", 1.7], ["hum", 1.54]], null, null, [["music", 77.62], ["singing", 4.23], ["rhythm and blues", 1.41]], null], "duration": [3.59, 0.41, 0.1, 0.23, 0.87, 0.41, 4.34, 7.6, 0.44, 1.01, 9.05, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/frZrAIZrOI8_filtered.json b/annotations_filtered/frZrAIZrOI8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c70f2e3cbe1e969c2ac72d9de33f686a499b0104 --- /dev/null +++ b/annotations_filtered/frZrAIZrOI8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.66], [8.0, 8.07], [16.0, 22.45], [23.0, 24.36], [31.0, 31.41], [43.0, 42.75], [49.0, 49.28], [52.0, 52.68], [55.0, 55.51], [62.0, 62.11], [64.0, 65.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 44.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 36.38], ["speech", 35.03], ["musical instrument", 3.5]], null, null, null, null, null, null, null, null], "duration": [-0.34, 0.07, 6.45, 1.36, 0.41, -0.25, 0.28, 0.68, 0.51, 0.11, 1.7]} \ No newline at end of file diff --git a/annotations_filtered/frgfTkjkcxo_filtered.json b/annotations_filtered/frgfTkjkcxo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db91d2a201f4441aaf345f8c64714f039e72a248 --- /dev/null +++ b/annotations_filtered/frgfTkjkcxo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 21.15], [21.0, 21.44], [24.0, 29.86], [82.0, 83.37], [93.0, 96.52], [101.0, 101.83]], "keep_status": [false, false, false, false, true, false], "silence_prob": [41.01, 0.0, 37.4, 0.0, 41.91, 0.0], "audiomae_on_audioset": [[["throbbing", 50.49], ["hum", 25.07], ["music", 11.12]], null, [["speech", 29.01], ["music", 23.63], ["throbbing", 23.11]], null, [["baby laughter", 20.33], ["snicker", 16.64], ["boing", 15.61]], null], "duration": [6.15, 0.44, 5.86, 1.37, 3.52, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/frqy8o30rv8_filtered.json b/annotations_filtered/frqy8o30rv8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9dcfd88587ee4b3c32ad523e6c89e37987a447f --- /dev/null +++ b/annotations_filtered/frqy8o30rv8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.04], [18.0, 18.5], [19.0, 18.54], [45.0, 46.92], [71.0, 73.01], [82.0, 84.38], [103.0, 107.1], [110.0, 114.44]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.64, 32.04, 33.67, 32.25], "audiomae_on_audioset": [null, null, null, null, [["music", 63.41], ["synthesizer", 5.74], ["speech", 4.28]], [["music", 63.86], ["boing", 8.47], ["sidetone", 4.58]], [["music", 60.03], ["scratching (performance technique)", 11.68], ["beatboxing", 8.09]], [["music", 59.27], ["sidetone", 7.06], ["scratching (performance technique)", 3.92]]], "duration": [0.04, 0.5, -0.46, 1.92, 2.01, 2.38, 4.1, 4.44]} \ No newline at end of file diff --git a/annotations_filtered/fsMC6d8DeMo_filtered.json b/annotations_filtered/fsMC6d8DeMo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04e2539fd70fdf2bcff6dc7eb6002b08314b0838 --- /dev/null +++ b/annotations_filtered/fsMC6d8DeMo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.0], [1.0, 9.05], [9.0, 15.67], [17.0, 19.89], [21.0, 33.24], [34.0, 34.26], [38.0, 49.32], [50.0, 52.34], [53.0, 56.59], [58.0, 58.75], [60.0, 60.91], [62.0, 65.2], [66.0, 70.36], [71.0, 83.13], [84.0, 84.86], [85.0, 86.71], [87.0, 98.69], [99.0, 112.68], [113.0, 116.88], [117.0, 128.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 99.99, 99.95, 100.0, 100.0, 0.0, 99.99, 99.82, 55.39, 0.0, 0.0, 100.0, 100.0, 40.22, 0.0, 0.0, 40.68, 100.0, 100.0, 37.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["explosion", 25.87], ["gunshot, gunfire", 17.37], ["burst, pop", 17.28]], null, null, [["speech", 50.35], ["sine wave", 7.1], ["explosion", 5.5]], null, null, [["music", 64.36], ["didgeridoo", 7.57], ["guitar", 7.48]]], "duration": [0.0, 8.05, 6.67, 2.89, 12.24, 0.26, 11.32, 2.34, 3.59, 0.75, 0.91, 3.2, 4.36, 12.13, 0.86, 1.71, 11.69, 13.68, 3.88, 11.97]} \ No newline at end of file diff --git a/annotations_filtered/fsUKVpvzMHk_filtered.json b/annotations_filtered/fsUKVpvzMHk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b0a2adbfb49312e7bf41fb9ada7d722e3be22ae --- /dev/null +++ b/annotations_filtered/fsUKVpvzMHk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.64], [8.0, 8.55], [9.0, 30.67], [32.0, 32.36], [33.0, 38.21], [39.0, 44.19], [47.0, 48.3], [50.0, 52.12], [56.0, 61.74], [65.0, 65.21], [67.0, 67.91], [70.0, 70.12], [71.0, 72.42], [75.0, 75.96], [78.0, 79.02], [86.0, 87.12], [97.0, 98.04], [99.0, 100.3], [103.0, 104.14], [105.0, 105.66], [107.0, 107.94], [111.0, 111.67], [115.0, 121.05], [122.0, 122.69], [124.0, 123.82], [125.0, 125.61], [127.0, 128.83], [130.0, 131.67], [133.0, 135.4], [137.0, 138.32], [141.0, 141.69], [145.0, 168.91], [170.0, 170.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 72.75, 0.0, 100.0, 68.54, 0.0, 89.36, 94.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.16, 0.0, 0.0, 0.0, 0.0, 0.0, 87.37, 0.0, 0.0, 46.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 28.52], ["music", 19.54], ["foghorn", 14.95]], null], "duration": [0.64, 0.55, 21.67, 0.36, 5.21, 5.19, 1.3, 2.12, 5.74, 0.21, 0.91, 0.12, 1.42, 0.96, 1.02, 1.12, 1.04, 1.3, 1.14, 0.66, 0.94, 0.67, 6.05, 0.69, -0.18, 0.61, 1.83, 1.67, 2.4, 1.32, 0.69, 23.91, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/fsWhDcon8aQ_filtered.json b/annotations_filtered/fsWhDcon8aQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82565f5ecedfc500dddbfc1cf116862f5b522d52 --- /dev/null +++ b/annotations_filtered/fsWhDcon8aQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.52], [21.0, 22.76]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.52, 1.76]} \ No newline at end of file diff --git a/annotations_filtered/fsaidN93VnA_filtered.json b/annotations_filtered/fsaidN93VnA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8699e89b79d9d51506045079d9b74a8f90192d4 --- /dev/null +++ b/annotations_filtered/fsaidN93VnA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.58], [14.0, 16.26], [17.0, 18.18], [19.0, 19.84], [21.0, 21.93], [23.0, 23.04], [26.0, 26.38], [37.0, 37.05], [39.0, 39.46], [41.0, 41.54], [43.0, 43.73], [45.0, 45.62], [51.0, 51.44], [53.0, 52.69], [58.0, 58.75], [59.0, 60.0], [61.0, 61.87], [63.0, 63.26], [64.0, 65.16], [67.0, 67.26], [72.0, 73.16], [89.0, 90.34], [92.0, 94.19], [97.0, 98.73], [100.0, 100.2], [106.0, 105.87], [107.0, 108.92], [109.0, 109.9], [111.0, 111.86], [113.0, 114.35], [118.0, 118.15], [119.0, 119.57], [121.0, 125.07], [127.0, 127.68], [143.0, 143.88], [145.0, 146.31], [147.0, 150.47], [152.0, 156.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 85.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.72, 0.0, 0.0, 0.0, 33.87, 36.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 71.48], ["music", 8.97], ["sidetone", 4.53]], null, null, null, [["speech", 28.72], ["boing", 18.76], ["stomach rumble", 14.6]], [["speech", 72.67], ["radio", 3.99], ["fart", 3.39]]], "duration": [1.58, 2.26, 1.18, 0.84, 0.93, 0.04, 0.38, 0.05, 0.46, 0.54, 0.73, 0.62, 0.44, -0.31, 0.75, 1.0, 0.87, 0.26, 1.16, 0.26, 1.16, 1.34, 2.19, 1.73, 0.2, -0.13, 1.92, 0.9, 0.86, 1.35, 0.15, 0.57, 4.07, 0.68, 0.88, 1.31, 3.47, 4.56]} \ No newline at end of file diff --git a/annotations_filtered/ft9XnHcLYiI_filtered.json b/annotations_filtered/ft9XnHcLYiI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5db03b39d688464b0cfef8615afcbaacff5df5f --- /dev/null +++ b/annotations_filtered/ft9XnHcLYiI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.65], [28.0, 28.97], [39.0, 38.91], [49.0, 49.44], [52.0, 52.47], [56.0, 58.02], [60.0, 64.32], [81.0, 90.24], [97.0, 99.3], [100.0, 101.48], [104.0, 105.85], [107.0, 107.0], [110.0, 109.88], [112.0, 112.16], [114.0, 114.76], [127.0, 127.97], [138.0, 138.1], [139.0, 140.36], [143.0, 143.87]], "keep_status": [false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 34.18, 37.71, 37.66, 53.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["croak", 23.43], ["frog", 10.67], ["hum", 9.29]], [["moo", 27.56], ["cattle, bovinae", 22.29], ["music", 10.65]], [["music", 25.43], ["noise", 6.96], ["scratching (performance technique)", 6.8]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.65, 0.97, -0.09, 0.44, 0.47, 2.02, 4.32, 9.24, 2.3, 1.48, 1.85, 0.0, -0.12, 0.16, 0.76, 0.97, 0.1, 1.36, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/ftAorMqqjy8_filtered.json b/annotations_filtered/ftAorMqqjy8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44b84d797de61bd35ded9bd123ac11dea2ce8707 --- /dev/null +++ b/annotations_filtered/ftAorMqqjy8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.38], [4.0, 4.41], [5.0, 5.07], [6.0, 6.34], [10.0, 10.54], [14.0, 14.05], [18.0, 18.05], [20.0, 20.11], [20.0, 20.97], [22.0, 21.84], [27.0, 26.79], [31.0, 30.87], [32.0, 33.79], [39.0, 46.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.71], ["guitar", 24.51], ["plucked string instrument", 11.08]]], "duration": [0.38, 0.41, 0.07, 0.34, 0.54, 0.05, 0.05, 0.11, 0.97, -0.16, -0.21, -0.13, 1.79, 7.72]} \ No newline at end of file diff --git a/annotations_filtered/ftDkeswkEYU_filtered.json b/annotations_filtered/ftDkeswkEYU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d9f957ca80d83362615dd9e7726941717cbb2b2 --- /dev/null +++ b/annotations_filtered/ftDkeswkEYU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.16], [10.0, 13.2], [15.0, 18.12], [20.0, 22.84], [27.0, 29.76], [38.0, 38.67], [39.0, 40.98], [45.0, 56.56], [59.0, 58.99], [60.0, 61.13], [62.0, 75.14], [80.0, 83.59], [86.0, 92.13], [98.0, 126.86], [127.0, 130.5], [135.0, 134.96], [135.0, 135.06], [135.0, 135.19], [135.0, 136.85], [138.0, 139.77], [141.0, 166.5], [172.0, 172.98], [177.0, 177.45], [178.0, 191.51], [194.0, 197.24], [198.0, 200.97], [201.0, 201.04], [201.0, 203.54], [204.0, 211.96], [214.0, 219.87], [222.0, 223.26], [224.0, 237.84], [240.0, 245.86], [246.0, 249.4], [250.0, 250.87], [253.0, 256.07]], "keep_status": [true, false, true, true, false, false, false, true, false, false, false, true, false, true, true, false, false, false, false, false, true, false, false, false, true, true, false, true, true, true, false, true, false, false, false, false], "silence_prob": [44.6, 44.96, 40.92, 30.19, 32.03, 0.0, 0.0, 33.0, 0.0, 0.0, 33.34, 46.19, 31.8, 31.34, 32.46, 0.0, 0.0, 0.0, 0.0, 0.0, 35.28, 0.0, 0.0, 33.56, 30.68, 31.63, 0.0, 29.45, 29.22, 29.23, 0.0, 30.5, 30.68, 58.05, 0.0, 54.56], "audiomae_on_audioset": [[["music", 24.75], ["frog", 16.1], ["animal", 6.72]], [["music", 32.44], ["speech", 28.51], ["quack", 11.4]], [["music", 29.52], ["whale vocalization", 14.82], ["frog", 3.21]], [["music", 34.27], ["speech", 28.81], ["throbbing", 5.67]], [["speech", 51.09], ["music", 18.41], ["throbbing", 5.38]], null, null, [["hum", 31.54], ["music", 15.24], ["throbbing", 14.35]], null, null, [["fly, housefly", 56.22], ["insect", 18.12], ["mosquito", 9.71]], [["music", 30.45], ["frog", 11.77], ["animal", 10.78]], [["speech", 47.73], ["music", 18.0], ["explosion", 4.73]], [["throbbing", 28.1], ["speech", 22.35], ["hum", 18.2]], [["music", 29.13], ["speech", 24.43], ["throbbing", 5.72]], null, null, null, null, null, [["throbbing", 24.93], ["music", 13.39], ["quack", 12.16]], null, null, [["music", 55.21], ["speech", 13.7], ["hum", 7.25]], [["speech", 25.04], ["music", 14.97], ["fly, housefly", 5.39]], [["music", 26.15], ["hum", 13.2], ["throbbing", 6.34]], null, [["music", 36.58], ["whale vocalization", 8.79], ["didgeridoo", 5.36]], [["vehicle", 22.98], ["hum", 17.39], ["car", 13.78]], [["music", 31.58], ["vehicle", 15.07], ["car", 6.38]], null, [["hum", 29.72], ["mains hum", 18.48], ["throbbing", 15.49]], [["speech", 60.99], ["music", 6.44], ["explosion", 4.55]], null, null, null], "duration": [2.16, 3.2, 3.12, 2.84, 2.76, 0.67, 1.98, 11.56, -0.01, 1.13, 13.14, 3.59, 6.13, 28.86, 3.5, -0.04, 0.06, 0.19, 1.85, 1.77, 25.5, 0.98, 0.45, 13.51, 3.24, 2.97, 0.04, 2.54, 7.96, 5.87, 1.26, 13.84, 5.86, 3.4, 0.87, 3.07]} \ No newline at end of file diff --git a/annotations_filtered/ftNK4JPSoto_filtered.json b/annotations_filtered/ftNK4JPSoto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84e2a9d9ef16e00ac2e322dd6dbcdf32771ca0a2 --- /dev/null +++ b/annotations_filtered/ftNK4JPSoto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.62], [4.0, 4.43], [5.0, 6.07], [8.0, 9.46], [12.0, 12.61], [13.0, 19.13], [20.0, 26.52], [32.0, 32.34], [34.0, 35.87], [42.0, 43.04], [46.0, 46.36], [48.0, 48.27], [49.0, 49.79], [57.0, 58.29], [63.0, 63.21], [64.0, 64.88], [65.0, 65.89], [76.0, 76.0], [78.0, 78.0], [82.0, 82.65], [85.0, 85.28], [91.0, 91.91], [94.0, 95.18], [96.0, 99.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 81.89, 64.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 0.43, 1.07, 1.46, 0.61, 6.13, 6.52, 0.34, 1.87, 1.04, 0.36, 0.27, 0.79, 1.29, 0.21, 0.88, 0.89, 0.0, 0.0, 0.65, 0.28, 0.91, 1.18, 3.3]} \ No newline at end of file diff --git a/annotations_filtered/ftmRf0AY8Co_filtered.json b/annotations_filtered/ftmRf0AY8Co_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4bb4da04203ba7946ed9dc835258eec7b5448407 --- /dev/null +++ b/annotations_filtered/ftmRf0AY8Co_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.45], [21.0, 21.76], [22.0, 34.32], [36.0, 42.35], [47.0, 64.08], [66.0, 71.29], [72.0, 73.94], [75.0, 82.68], [83.0, 87.61], [90.0, 90.48], [90.0, 92.04], [94.0, 104.48], [107.0, 113.41], [116.0, 117.12], [119.0, 124.82], [127.0, 128.88]], "keep_status": [false, false, true, true, false, false, false, true, false, false, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 31.53, 32.77, 33.92, 35.36, 0.0, 34.01, 33.14, 0.0, 31.93, 40.93, 39.86, 0.0, 39.14, 0.0], "audiomae_on_audioset": [null, null, [["music", 55.86], ["theremin", 6.61], ["musical instrument", 5.98]], [["music", 34.74], ["gong", 7.87], ["singing bowl", 7.7]], [["music", 69.27], ["musical instrument", 5.4], ["didgeridoo", 4.81]], [["music", 44.62], ["theremin", 28.85], ["musical instrument", 5.25]], null, [["theremin", 27.23], ["whale vocalization", 16.57], ["music", 15.47]], [["music", 46.9], ["theremin", 14.4], ["musical instrument", 14.34]], null, [["theremin", 48.62], ["music", 23.27], ["speech", 15.13]], [["music", 37.44], ["theremin", 14.47], ["speech", 12.36]], [["music", 26.09], ["wind instrument, woodwind instrument", 17.53], ["theremin", 16.29]], null, [["music", 26.37], ["theremin", 18.01], ["speech", 13.62]], null], "duration": [0.45, 0.76, 12.32, 6.35, 17.08, 5.29, 1.94, 7.68, 4.61, 0.48, 2.04, 10.48, 6.41, 1.12, 5.82, 1.88]} \ No newline at end of file diff --git a/annotations_filtered/ftst7XzK21Q_filtered.json b/annotations_filtered/ftst7XzK21Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c020b01116035969086e33141ca16eb79fb927d4 --- /dev/null +++ b/annotations_filtered/ftst7XzK21Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.93], [13.0, 13.78], [17.0, 17.56], [19.0, 20.53], [39.0, 39.29], [47.0, 48.0]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.93, 0.78, 0.56, 1.53, 0.29, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/fuCEfNfuoiM_filtered.json b/annotations_filtered/fuCEfNfuoiM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e672b3ff2e84557674a7d0b061d9d7687bb0025 --- /dev/null +++ b/annotations_filtered/fuCEfNfuoiM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.42], [12.0, 22.37], [25.0, 25.69], [29.0, 29.35], [30.0, 38.47], [39.0, 41.64], [43.0, 46.16], [49.0, 51.87], [57.0, 60.56], [61.0, 62.38], [63.0, 73.5], [74.0, 112.21], [113.0, 118.05], [119.0, 118.94], [119.0, 132.63], [133.0, 142.03], [146.0, 153.66], [154.0, 157.84], [159.0, 160.98], [176.0, 178.83], [179.0, 179.0], [196.0, 197.07]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [38.67, 58.38, 0.0, 0.0, 80.46, 98.1, 92.64, 92.15, 86.82, 0.0, 53.84, 0.0, 49.27, 0.0, 50.66, 48.74, 47.31, 68.54, 0.0, 32.72, 0.0, 0.0], "audiomae_on_audioset": [[["music", 34.76], ["hum", 22.95], ["throbbing", 11.17]], null, null, null, null, null, null, null, null, null, null, null, [["music", 34.84], ["hum", 11.65], ["throbbing", 8.62]], null, null, [["hum", 48.58], ["throbbing", 28.26], ["mains hum", 10.18]], [["hum", 28.62], ["music", 28.27], ["throbbing", 7.31]], null, null, [["speech", 52.03], ["music", 30.92], ["boing", 2.82]], null, null], "duration": [7.42, 10.37, 0.69, 0.35, 8.47, 2.64, 3.16, 2.87, 3.56, 1.38, 10.5, 38.21, 5.05, -0.06, 13.63, 9.03, 7.66, 3.84, 1.98, 2.83, 0.0, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/fuCe9uaRx_0_filtered.json b/annotations_filtered/fuCe9uaRx_0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ab8abaeb6661cf581e8ffd8c186f005f1c04742 --- /dev/null +++ b/annotations_filtered/fuCe9uaRx_0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 31.65], [32.0, 86.68], [88.0, 91.27], [92.0, 96.03], [96.0, 96.92], [98.0, 98.36], [101.0, 106.46]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 62.99, 34.26, 0.0, 0.0, 44.52], "audiomae_on_audioset": [null, null, null, [["speech", 82.08], ["inside, small room", 1.65], ["sidetone", 1.48]], null, null, [["throbbing", 49.51], ["hum", 26.68], ["heart sounds, heartbeat", 5.74]]], "duration": [0.65, 54.68, 3.27, 4.03, 0.92, 0.36, 5.46]} \ No newline at end of file diff --git a/annotations_filtered/fuEG_PSb_Ts_filtered.json b/annotations_filtered/fuEG_PSb_Ts_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89e6cb706c516eeb2a6bb6e162d18eb1f9709972 --- /dev/null +++ b/annotations_filtered/fuEG_PSb_Ts_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 14.99], [16.0, 16.24], [21.0, 34.21], [35.0, 36.34], [39.0, 39.68], [44.0, 44.98], [48.0, 54.84], [55.0, 63.32], [64.0, 68.61], [69.0, 70.36], [70.0, 71.9], [73.0, 73.47], [76.0, 80.27], [81.0, 128.22], [135.0, 135.35], [138.0, 138.01], [142.0, 141.99]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [35.02, 0.0, 30.01, 0.0, 0.0, 0.0, 30.55, 30.8, 32.29, 0.0, 0.0, 0.0, 32.38, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 41.98], ["hum", 23.92], ["mains hum", 11.91]], null, [["music", 51.99], ["hum", 13.77], ["throbbing", 8.57]], null, null, null, [["music", 35.93], ["throbbing", 32.59], ["hum", 17.27]], [["music", 56.89], ["throbbing", 16.56], ["hum", 7.08]], [["moo", 20.76], ["cattle, bovinae", 14.97], ["livestock, farm animals, working animals", 10.74]], null, null, null, [["music", 59.7], ["throbbing", 11.01], ["synthesizer", 4.34]], null, null, null, null], "duration": [10.99, 0.24, 13.21, 1.34, 0.68, 0.98, 6.84, 8.32, 4.61, 1.36, 1.9, 0.47, 4.27, 47.22, 0.35, 0.01, -0.01]} \ No newline at end of file diff --git a/annotations_filtered/fuOY4W9QFNI_filtered.json b/annotations_filtered/fuOY4W9QFNI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb1d0a8aa1480e0f0d22a4539ce53cfabdb90254 --- /dev/null +++ b/annotations_filtered/fuOY4W9QFNI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.02], [16.0, 16.93], [18.0, 18.54], [20.0, 20.26], [22.0, 22.4], [30.0, 34.05], [36.0, 36.95], [41.0, 41.82], [43.0, 45.39], [46.0, 48.79], [55.0, 55.56], [56.0, 56.96]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [38.12, 0.0, 0.0, 0.0, 0.0, 52.1, 0.0, 0.0, 50.06, 39.52, 0.0, 0.0], "audiomae_on_audioset": [[["music", 33.19], ["speech", 19.74], ["moo", 4.43]], null, null, null, null, null, null, null, null, [["music", 36.8], ["speech", 21.31], ["synthesizer", 3.81]], null, null], "duration": [4.02, 0.93, 0.54, 0.26, 0.4, 4.05, 0.95, 0.82, 2.39, 2.79, 0.56, 0.96]} \ No newline at end of file diff --git a/annotations_filtered/futultLrWms_filtered.json b/annotations_filtered/futultLrWms_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6021c4d9ae3e3a844865e11966615026e62d89ce --- /dev/null +++ b/annotations_filtered/futultLrWms_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.51], [5.0, 9.26], [14.0, 26.11], [28.0, 30.72], [32.0, 35.51], [41.0, 43.43], [45.0, 47.93], [50.0, 50.84], [51.0, 52.37], [55.0, 54.82], [58.0, 60.79], [63.0, 63.41], [68.0, 68.5], [72.0, 72.82], [74.0, 79.96], [84.0, 90.68], [94.0, 98.0], [102.0, 107.92], [109.0, 109.65], [112.0, 115.01], [117.0, 118.13], [122.0, 123.33], [130.0, 131.08], [134.0, 134.74], [138.0, 140.53], [143.0, 148.95], [150.0, 150.52], [152.0, 153.93], [157.0, 157.32], [159.0, 182.55], [186.0, 187.39], [195.0, 196.18], [199.0, 207.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 86.82, 70.44, 72.31, 84.98, 82.79, 70.72, 0.0, 0.0, 0.0, 90.08, 0.0, 0.0, 0.0, 52.92, 39.67, 40.54, 41.66, 0.0, 47.82, 0.0, 0.0, 0.0, 0.0, 33.24, 32.51, 0.0, 0.0, 0.0, 34.61, 0.0, 0.0, 32.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 81.58], ["synthesizer", 3.43], ["ambient music", 1.6]], [["music", 70.96], ["synthesizer", 4.39], ["didgeridoo", 4.16]], [["hum", 49.33], ["throbbing", 13.65], ["music", 13.54]], null, [["music", 64.82], ["singing bowl", 4.39], ["synthesizer", 4.09]], null, null, null, null, [["music", 68.04], ["speech", 2.02], ["didgeridoo", 1.79]], [["music", 78.92], ["hum", 2.08], ["throbbing", 1.5]], null, null, null, [["music", 70.83], ["throbbing", 4.99], ["hum", 4.52]], null, null, [["hum", 39.37], ["music", 18.19], ["mains hum", 12.68]]], "duration": [0.51, 4.26, 12.11, 2.72, 3.51, 2.43, 2.93, 0.84, 1.37, -0.18, 2.79, 0.41, 0.5, 0.82, 5.96, 6.68, 4.0, 5.92, 0.65, 3.01, 1.13, 1.33, 1.08, 0.74, 2.53, 5.95, 0.52, 1.93, 0.32, 23.55, 1.39, 1.18, 8.99]} \ No newline at end of file diff --git a/annotations_filtered/fuwfQJrMgLI_filtered.json b/annotations_filtered/fuwfQJrMgLI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f488a288de783335325be26454d739f95edc1c8f --- /dev/null +++ b/annotations_filtered/fuwfQJrMgLI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.13], [2.0, 3.67], [6.0, 11.7], [12.0, 13.34], [22.0, 25.08], [47.0, 47.26], [57.0, 61.15], [79.0, 79.27], [80.0, 80.74], [83.0, 83.73], [90.0, 91.08], [91.0, 93.53], [96.0, 96.9], [98.0, 102.32], [106.0, 107.23], [110.0, 116.33], [122.0, 123.58], [125.0, 125.56]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 32.3, 0.0, 31.38, 0.0, 31.19, 0.0, 0.0, 0.0, 0.0, 50.02, 0.0, 45.27, 0.0, 54.56, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 18.89], ["speech", 14.7], ["sheep", 14.03]], null, [["moo", 40.97], ["cattle, bovinae", 39.28], ["livestock, farm animals, working animals", 19.24]], null, [["livestock, farm animals, working animals", 70.77], ["cattle, bovinae", 17.31], ["moo", 9.0]], null, null, null, null, null, null, [["music", 31.39], ["speech", 13.09], ["glass", 9.82]], null, null, null, null], "duration": [0.13, 1.67, 5.7, 1.34, 3.08, 0.26, 4.15, 0.27, 0.74, 0.73, 1.08, 2.53, 0.9, 4.32, 1.23, 6.33, 1.58, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/fvHgXzOY12Y_filtered.json b/annotations_filtered/fvHgXzOY12Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3e82862e94038892bd54a05ccfa9edf48090429 --- /dev/null +++ b/annotations_filtered/fvHgXzOY12Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 14.59], [15.0, 16.31], [18.0, 23.41], [29.0, 29.79], [31.0, 47.33], [51.0, 51.24], [53.0, 72.81], [85.0, 100.4]], "keep_status": [false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 44.34, 0.0, 35.95, 0.0, 31.47, 33.91], "audiomae_on_audioset": [null, null, [["music", 74.09], ["musical instrument", 5.19], ["synthesizer", 4.15]], null, [["music", 51.29], ["synthesizer", 12.0], ["musical instrument", 4.73]], null, [["music", 69.83], ["speech", 7.19], ["didgeridoo", 2.31]], [["music", 73.02], ["beatboxing", 5.32], ["singing", 2.86]]], "duration": [-0.41, 1.31, 5.41, 0.79, 16.33, 0.24, 19.81, 15.4]} \ No newline at end of file diff --git a/annotations_filtered/fvNfhUZ-5z8_filtered.json b/annotations_filtered/fvNfhUZ-5z8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e78c3cfd357394e204ea52ee2d948119c1843789 --- /dev/null +++ b/annotations_filtered/fvNfhUZ-5z8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 47.26], [49.0, 54.01], [55.0, 57.18], [63.0, 64.47], [66.0, 68.2], [69.0, 69.74], [75.0, 76.52], [77.0, 79.74], [81.0, 81.35], [82.0, 83.07], [86.0, 86.04], [88.0, 96.28], [97.0, 99.2], [103.0, 104.26], [106.0, 107.3], [108.0, 109.56], [114.0, 114.29], [116.0, 117.09], [123.0, 124.38], [125.0, 125.83], [128.0, 130.64], [138.0, 155.46]], "keep_status": [true, true, true, false, true, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [32.92, 34.82, 46.09, 0.0, 49.36, 0.0, 0.0, 49.22, 0.0, 0.0, 0.0, 53.47, 41.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.19, 31.96], "audiomae_on_audioset": [[["hum", 24.94], ["mains hum", 24.57], ["music", 19.84]], [["music", 31.89], ["knock", 24.02], ["speech", 7.45]], [["hum", 15.1], ["speech", 12.63], ["hiccup", 9.13]], null, [["speech", 43.65], ["music", 9.24], ["hum", 8.99]], null, null, [["speech", 28.14], ["music", 8.28], ["didgeridoo", 7.28]], null, null, null, null, [["speech", 29.02], ["music", 24.47], ["synthesizer", 5.49]], null, null, null, null, null, null, null, [["music", 25.9], ["hum", 12.16], ["mains hum", 9.01]], [["fly, housefly", 49.23], ["insect", 22.31], ["buzz", 10.27]]], "duration": [16.26, 5.01, 2.18, 1.47, 2.2, 0.74, 1.52, 2.74, 0.35, 1.07, 0.04, 8.28, 2.2, 1.26, 1.3, 1.56, 0.29, 1.09, 1.38, 0.83, 2.64, 17.46]} \ No newline at end of file diff --git a/annotations_filtered/fvVBKWMTSRM_filtered.json b/annotations_filtered/fvVBKWMTSRM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9ea3f0eed1d2e06b3f143862bf9642bf6d57101 --- /dev/null +++ b/annotations_filtered/fvVBKWMTSRM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.17], [3.0, 5.63], [7.0, 9.05], [10.0, 10.47], [17.0, 17.37], [19.0, 23.23], [25.0, 26.27], [31.0, 31.23], [36.0, 38.16], [42.0, 44.58], [47.0, 49.27], [52.0, 54.06], [54.0, 54.87], [57.0, 57.21], [58.0, 58.75], [61.0, 70.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 99.99, 99.94, 0.0, 0.0, 55.11, 0.0, 0.0, 80.11, 90.25, 99.95, 100.0, 0.0, 0.0, 0.0, 42.39], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["thunk", 45.72], ["music", 14.63], ["noise", 4.45]]], "duration": [1.17, 2.63, 2.05, 0.47, 0.37, 4.23, 1.27, 0.23, 2.16, 2.58, 2.27, 2.06, 0.87, 0.21, 0.75, 9.33]} \ No newline at end of file diff --git a/annotations_filtered/fvYD-2ggmcc_filtered.json b/annotations_filtered/fvYD-2ggmcc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65a5e9c58c5ed37fa121e4323ad10baec1b267cb --- /dev/null +++ b/annotations_filtered/fvYD-2ggmcc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.59], [9.0, 10.5], [15.0, 14.79], [18.0, 18.37], [29.0, 30.11], [31.0, 33.35], [35.0, 42.06], [43.0, 42.97], [48.0, 48.86], [49.0, 49.84], [51.0, 51.87], [57.0, 57.27], [60.0, 61.82], [65.0, 66.04], [67.0, 67.9], [69.0, 91.3], [93.0, 93.07], [94.0, 94.96], [97.0, 97.29], [98.0, 101.22], [102.0, 107.3], [108.0, 108.67], [124.0, 127.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 69.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.39, 0.0, 0.0, 0.0, 89.36, 100.0, 0.0, 99.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.59, 1.5, -0.21, 0.37, 1.11, 2.35, 7.06, -0.03, 0.86, 0.84, 0.87, 0.27, 1.82, 1.04, 0.9, 22.3, 0.07, 0.96, 0.29, 3.22, 5.3, 0.67, 3.74]} \ No newline at end of file diff --git a/annotations_filtered/fvoNncvOHfc_filtered.json b/annotations_filtered/fvoNncvOHfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b963d0692d9e2efb69f2872674124226a0d856d --- /dev/null +++ b/annotations_filtered/fvoNncvOHfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[51.0, 106.22]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [55.22]} \ No newline at end of file diff --git a/annotations_filtered/fvptWDiYrIk_filtered.json b/annotations_filtered/fvptWDiYrIk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..982d66de2ec857daaf98bddc6fdf60ec147965c0 --- /dev/null +++ b/annotations_filtered/fvptWDiYrIk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.31], [35.0, 35.77], [52.0, 53.38], [55.0, 55.0]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [1.31, 0.77, 1.38, 0.0]} \ No newline at end of file diff --git a/annotations_filtered/fvuqUVSwpPY_filtered.json b/annotations_filtered/fvuqUVSwpPY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6fb143768805595e68b750789bd86e551391db96 --- /dev/null +++ b/annotations_filtered/fvuqUVSwpPY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.35], [4.0, 6.29], [7.0, 8.28], [9.0, 14.57], [16.0, 17.63], [23.0, 24.9], [31.0, 30.94], [33.0, 33.99], [35.0, 34.69], [36.0, 37.72], [42.0, 43.97], [46.0, 49.25], [50.0, 51.85], [53.0, 59.19], [61.0, 62.82], [68.0, 68.62], [71.0, 74.04]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.96, 0.0, 51.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.56, 0.0, 60.89, 0.0, 0.0, 83.7], "audiomae_on_audioset": [null, [["sidetone", 44.47], ["whale vocalization", 12.87], ["speech", 12.63]], null, null, null, null, null, null, null, null, null, [["music", 45.08], ["sidetone", 29.18], ["busy signal", 6.87]], null, null, null, null, null], "duration": [1.35, 2.29, 1.28, 5.57, 1.63, 1.9, -0.06, 0.99, -0.31, 1.72, 1.97, 3.25, 1.85, 6.19, 1.82, 0.62, 3.04]} \ No newline at end of file diff --git a/annotations_filtered/fw5N8DF4js8_filtered.json b/annotations_filtered/fw5N8DF4js8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18dfe2ab1d11f671dfe2782a088089f4bd68702f --- /dev/null +++ b/annotations_filtered/fw5N8DF4js8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.14], [7.0, 10.03], [11.0, 15.33], [18.0, 18.66], [27.0, 26.84], [29.0, 30.0], [31.0, 31.72], [38.0, 37.86], [42.0, 42.21], [49.0, 49.74], [51.0, 51.51], [56.0, 56.27], [57.0, 57.38], [61.0, 62.34], [66.0, 66.12], [71.0, 72.15], [76.0, 77.03], [84.0, 85.35], [89.0, 90.54], [91.0, 92.79], [104.0, 104.36], [106.0, 105.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.37, 97.33, 86.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.14, 3.03, 4.33, 0.66, -0.16, 1.0, 0.72, -0.14, 0.21, 0.74, 0.51, 0.27, 0.38, 1.34, 0.12, 1.15, 1.03, 1.35, 1.54, 1.79, 0.36, -0.19]} \ No newline at end of file diff --git a/annotations_filtered/fwI7COVTitQ_filtered.json b/annotations_filtered/fwI7COVTitQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d3211f290b8d0dd65345f96ffff9b34ba33e936 --- /dev/null +++ b/annotations_filtered/fwI7COVTitQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.95], [15.0, 15.97], [18.0, 18.15], [19.0, 31.33], [40.0, 48.15]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 30.99, 30.7], "audiomae_on_audioset": [null, null, null, [["music", 35.18], ["fly, housefly", 8.9], ["throbbing", 8.36]], [["speech", 47.92], ["music", 27.92], ["buzz", 4.33]]], "duration": [1.95, 0.97, 0.15, 12.33, 8.15]} \ No newline at end of file diff --git a/annotations_filtered/fwITaMQj7S8_filtered.json b/annotations_filtered/fwITaMQj7S8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f57cb0bbb1fdc0328b1fc25de2b8b8dafea09f9a --- /dev/null +++ b/annotations_filtered/fwITaMQj7S8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[54.0, 55.31]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [1.31]} \ No newline at end of file diff --git a/annotations_filtered/fwZw8vujVMU_filtered.json b/annotations_filtered/fwZw8vujVMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38585f18734427c4c849a256883dcdc951296869 --- /dev/null +++ b/annotations_filtered/fwZw8vujVMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.78], [30.0, 31.62], [42.0, 47.29], [59.0, 59.14], [70.0, 72.32], [75.0, 78.44], [79.0, 105.04], [107.0, 107.97], [112.0, 113.88], [117.0, 130.74], [131.0, 132.0], [142.0, 145.88], [151.0, 155.58], [156.0, 156.74], [158.0, 163.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 33.97, 0.0, 34.78, 34.43, 38.63, 0.0, 0.0, 33.81, 0.0, 31.74, 39.25, 0.0, 30.55], "audiomae_on_audioset": [null, null, [["music", 64.33], ["throbbing", 4.65], ["hum", 3.76]], null, [["music", 42.03], ["didgeridoo", 29.36], ["hum", 5.57]], [["music", 58.39], ["hum", 7.72], ["throbbing", 4.81]], [["music", 53.79], ["hum", 18.2], ["throbbing", 6.45]], null, null, [["music", 83.09], ["electronic music", 3.55], ["throbbing", 2.9]], null, [["music", 20.09], ["boing", 18.5], ["groan", 9.56]], [["music", 34.98], ["throbbing", 20.55], ["hum", 9.5]], null, [["music", 73.62], ["speech", 8.53], ["electronic music", 3.7]]], "duration": [0.78, 1.62, 5.29, 0.14, 2.32, 3.44, 26.04, 0.97, 1.88, 13.74, 1.0, 3.88, 4.58, 0.74, 5.92]} \ No newline at end of file diff --git a/annotations_filtered/fwkB6wAxNVM_filtered.json b/annotations_filtered/fwkB6wAxNVM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..942acc6b9a0dd777b829b763d65e917fd71be354 --- /dev/null +++ b/annotations_filtered/fwkB6wAxNVM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.05], [3.0, 7.38], [8.0, 9.66], [11.0, 18.08], [18.0, 24.11], [24.0, 44.44], [45.0, 94.36], [97.0, 113.44], [115.0, 115.57]], "keep_status": [false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 66.88, 0.0, 34.29, 32.66, 33.62, 0.0, 34.7, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 42.6], ["didgeridoo", 18.33], ["timpani", 6.03]], [["didgeridoo", 60.86], ["music", 21.6], ["speech", 7.05]], [["music", 84.89], ["trombone", 3.17], ["brass instrument", 1.77]], null, [["music", 78.98], ["video game music", 1.82], ["vibraphone", 1.73]], null], "duration": [1.05, 4.38, 1.66, 7.08, 6.11, 20.44, 49.36, 16.44, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/fwkzz6A_Qv4_filtered.json b/annotations_filtered/fwkzz6A_Qv4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e62288284e8d9b58a89e906a7dc03c8775f052eb --- /dev/null +++ b/annotations_filtered/fwkzz6A_Qv4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.46], [9.0, 12.43], [13.0, 14.61], [15.0, 16.71], [18.0, 18.87], [20.0, 20.93], [26.0, 26.59], [29.0, 28.66], [29.0, 29.94], [34.0, 33.67], [36.0, 35.72], [37.0, 37.08], [38.0, 38.38], [43.0, 44.19], [52.0, 53.05], [54.0, 54.33], [55.0, 55.85], [59.0, 59.24], [62.0, 62.18], [63.0, 64.4], [72.0, 72.86], [76.0, 77.09], [79.0, 79.93], [81.0, 82.19], [83.0, 83.94], [85.0, 89.04], [93.0, 93.6], [95.0, 94.69], [95.0, 96.69], [99.0, 99.94], [101.0, 101.66], [104.0, 104.6], [109.0, 115.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.03], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.46, 3.43, 1.61, 1.71, 0.87, 0.93, 0.59, -0.34, 0.94, -0.33, -0.28, 0.08, 0.38, 1.19, 1.05, 0.33, 0.85, 0.24, 0.18, 1.4, 0.86, 1.09, 0.93, 1.19, 0.94, 4.04, 0.6, -0.31, 1.69, 0.94, 0.66, 0.6, 6.55]} \ No newline at end of file diff --git a/annotations_filtered/fxBoqr7OicA_filtered.json b/annotations_filtered/fxBoqr7OicA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1548813a403242d1e6d9c70468866f185bdce5d1 --- /dev/null +++ b/annotations_filtered/fxBoqr7OicA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 13.66], [16.0, 20.87], [26.0, 26.38], [34.0, 34.15], [35.0, 34.62], [35.0, 37.15], [38.0, 39.95], [41.0, 42.77], [46.0, 51.9], [58.0, 57.82], [62.0, 62.92], [64.0, 71.73], [72.0, 74.48], [85.0, 86.85], [88.0, 88.23], [91.0, 91.45], [94.0, 98.07], [101.0, 101.75], [114.0, 114.84], [117.0, 119.11], [126.0, 127.38], [130.0, 131.53]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.98, 0.0, 0.0, 0.0, 57.17, 0.0, 0.0, 39.67, 0.0, 0.0, 52.39, 33.43, 0.0, 0.0, 0.0, 39.83, 0.0, 0.0, 54.83, 0.0, 0.0], "audiomae_on_audioset": [null, [["thunk", 39.97], ["telephone", 14.26], ["door", 7.84]], null, null, null, null, null, null, [["speech", 44.74], ["music", 34.48], ["didgeridoo", 6.07]], null, null, null, [["cowbell", 38.94], ["speech", 17.07], ["animal", 14.44]], null, null, null, [["speech", 43.25], ["beatboxing", 18.84], ["music", 10.46]], null, null, null, null, null], "duration": [-0.34, 4.87, 0.38, 0.15, -0.38, 2.15, 1.95, 1.77, 5.9, -0.18, 0.92, 7.73, 2.48, 1.85, 0.23, 0.45, 4.07, 0.75, 0.84, 2.11, 1.38, 1.53]} \ No newline at end of file diff --git a/annotations_filtered/fxVsGcxK1nc_filtered.json b/annotations_filtered/fxVsGcxK1nc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3af05747bf10bcb69168b7e5244c4fd1caa9620 --- /dev/null +++ b/annotations_filtered/fxVsGcxK1nc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 11.75], [14.0, 76.59], [78.0, 83.07], [84.0, 85.33], [86.0, 89.73], [91.0, 92.38], [95.0, 102.39]], "keep_status": [true, false, true, false, true, false, true], "silence_prob": [30.65, 0.0, 31.38, 0.0, 40.33, 0.0, 29.32], "audiomae_on_audioset": [[["explosion", 29.51], ["eruption", 14.48], ["hum", 13.42]], null, [["vehicle", 15.13], ["rumble", 11.65], ["creak", 10.69]], null, [["hum", 13.26], ["rumble", 9.79], ["creak", 8.91]], null, [["explosion", 27.86], ["speech", 13.72], ["music", 12.73]]], "duration": [6.75, 62.59, 5.07, 1.33, 3.73, 1.38, 7.39]} \ No newline at end of file diff --git a/annotations_filtered/fxWE6pnuPzo_filtered.json b/annotations_filtered/fxWE6pnuPzo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3ca572727fcca9a5cf9b805e6513d8cec442440 --- /dev/null +++ b/annotations_filtered/fxWE6pnuPzo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.09], [25.0, 27.95], [28.0, 28.02], [62.0, 62.43], [66.0, 68.45], [71.0, 73.53], [78.0, 80.47], [95.0, 96.21], [97.0, 97.85], [114.0, 114.62], [116.0, 116.53], [118.0, 122.15], [131.0, 131.41]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.21, 0.0, 0.0, 65.44, 31.46, 31.8, 0.0, 0.0, 0.0, 0.0, 34.2, 0.0], "audiomae_on_audioset": [null, [["speech", 87.94], ["sidetone", 2.07], ["music", 1.35]], null, null, null, [["speech", 28.27], ["animal", 12.86], ["roaring cats (lions, tigers)", 6.7]], [["baby cry, infant cry", 62.96], ["speech", 14.11], ["crying, sobbing", 4.2]], null, null, null, null, [["speech", 77.95], ["radio", 2.4], ["pant", 1.74]], null], "duration": [0.09, 2.95, 0.02, 0.43, 2.45, 2.53, 2.47, 1.21, 0.85, 0.62, 0.53, 4.15, 0.41]} \ No newline at end of file diff --git a/annotations_filtered/fxriLTLhyyY_filtered.json b/annotations_filtered/fxriLTLhyyY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..520da08c9d06d4baebdab82ed29a7d754dd1cc52 --- /dev/null +++ b/annotations_filtered/fxriLTLhyyY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.89], [8.0, 10.03], [13.0, 15.84], [17.0, 18.77], [20.0, 21.88], [23.0, 24.58], [25.0, 26.0], [26.0, 26.08], [27.0, 28.73], [30.0, 31.35], [34.0, 34.43], [36.0, 37.07], [37.0, 39.07], [40.0, 50.72], [52.0, 52.86], [55.0, 55.48], [58.0, 58.09], [59.0, 65.45], [72.0, 72.76], [75.0, 74.95], [79.0, 79.34], [80.0, 81.18], [82.0, 84.2], [85.0, 90.1], [92.0, 93.68], [94.0, 97.65], [101.0, 102.36], [114.0, 115.03], [117.0, 118.74], [122.0, 122.89], [124.0, 124.93], [130.0, 130.6], [131.0, 131.53], [133.0, 134.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 88.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.54, 91.64, 0.0, 0.0, 0.0, 30.33, 0.0, 0.0, 0.0, 0.0, 31.77, 33.25, 0.0, 42.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 76.88], ["explosion", 7.49], ["burst, pop", 3.45]], null, null, null, null, [["speech", 36.0], ["boing", 14.85], ["music", 5.91]], [["speech", 54.65], ["boing", 21.12], ["music", 4.32]], null, [["speech", 38.26], ["music", 8.43], ["mains hum", 8.36]], null, null, null, null, null, null, null, null], "duration": [0.89, 2.03, 2.84, 1.77, 1.88, 1.58, 1.0, 0.08, 1.73, 1.35, 0.43, 1.07, 2.07, 10.72, 0.86, 0.48, 0.09, 6.45, 0.76, -0.05, 0.34, 1.18, 2.2, 5.1, 1.68, 3.65, 1.36, 1.03, 1.74, 0.89, 0.93, 0.6, 0.53, 1.25]} \ No newline at end of file diff --git a/annotations_filtered/fy-Ocaxlk1Y_filtered.json b/annotations_filtered/fy-Ocaxlk1Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08e7fe00c3033cf41d95c94bfa1160cdc63aad08 --- /dev/null +++ b/annotations_filtered/fy-Ocaxlk1Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 20.55], [29.0, 35.16], [40.0, 43.58], [51.0, 51.8], [53.0, 54.57], [56.0, 59.76], [71.0, 73.3], [78.0, 79.42], [83.0, 85.23], [89.0, 89.8], [91.0, 91.07], [97.0, 99.33], [108.0, 111.91]], "keep_status": [true, true, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [32.7, 31.98, 31.4, 0.0, 0.0, 33.03, 35.84, 0.0, 81.17, 0.0, 0.0, 32.2, 54.56], "audiomae_on_audioset": [[["speech", 18.45], ["explosion", 12.52], ["groan", 8.29]], [["groan", 10.63], ["speech", 9.41], ["fart", 7.41]], [["speech", 66.93], ["sidetone", 6.68], ["music", 5.37]], null, null, [["fly, housefly", 21.56], ["music", 20.83], ["mosquito", 12.86]], [["music", 39.55], ["speech", 8.47], ["musical instrument", 3.12]], null, null, null, null, [["speech", 61.96], ["music", 11.39], ["fly, housefly", 2.73]], null], "duration": [6.55, 6.16, 3.58, 0.8, 1.57, 3.76, 2.3, 1.42, 2.23, 0.8, 0.07, 2.33, 3.91]} \ No newline at end of file diff --git a/annotations_filtered/fy-PoYl4bQI_filtered.json b/annotations_filtered/fy-PoYl4bQI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81b749e0efe3e47ab3c6100fec25d123ca3dac0c --- /dev/null +++ b/annotations_filtered/fy-PoYl4bQI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.67], [24.0, 26.7], [30.0, 30.92], [32.0, 32.51], [37.0, 42.38], [43.0, 44.66], [48.0, 48.24], [49.0, 50.87], [54.0, 54.53], [61.0, 63.32], [68.0, 67.9], [70.0, 70.65], [75.0, 76.08], [77.0, 77.5], [79.0, 86.05], [87.0, 87.67], [89.0, 89.41], [90.0, 90.51], [91.0, 91.17], [92.0, 93.28], [97.0, 97.87], [100.0, 100.01], [101.0, 101.21], [114.0, 114.4], [121.0, 122.44], [126.0, 127.2], [131.0, 131.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 53.22, 0.0, 0.0, 38.84, 0.0, 0.0, 0.0, 0.0, 42.55, 0.0, 0.0, 0.0, 0.0, 39.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["crushing", 95.56], ["crack", 1.94], ["music", 0.84]], null, null, null, null, [["speech", 62.01], ["radio", 4.96], ["hum", 3.16]], null, null, null, null, [["speech", 51.07], ["sidetone", 38.48], ["music", 1.98]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.67, 2.7, 0.92, 0.51, 5.38, 1.66, 0.24, 1.87, 0.53, 2.32, -0.1, 0.65, 1.08, 0.5, 7.05, 0.67, 0.41, 0.51, 0.17, 1.28, 0.87, 0.01, 0.21, 0.4, 1.44, 1.2, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/fyI46_cfTW4_filtered.json b/annotations_filtered/fyI46_cfTW4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..304613b2496b00151d80315c1a63ce3f3a6d6d61 --- /dev/null +++ b/annotations_filtered/fyI46_cfTW4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.02], [9.0, 9.34], [23.0, 23.73], [27.0, 28.48], [33.0, 33.34], [36.0, 36.09], [39.0, 40.85], [42.0, 42.55], [46.0, 47.36]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.02, 0.34, 0.73, 1.48, 0.34, 0.09, 1.85, 0.55, 1.36]} \ No newline at end of file diff --git a/annotations_filtered/fyOv0TB4lXU_filtered.json b/annotations_filtered/fyOv0TB4lXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7e797cedb2ba4d81079311cff9ac6f294e0120c --- /dev/null +++ b/annotations_filtered/fyOv0TB4lXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.48], [2.0, 2.0], [5.0, 5.36], [12.0, 12.9], [14.0, 14.13], [27.0, 38.33], [39.0, 39.87], [45.0, 45.67], [46.0, 49.79], [54.0, 58.01], [58.0, 58.72], [60.0, 63.09], [65.0, 65.65], [67.0, 67.9], [69.0, 69.47], [71.0, 72.0], [73.0, 74.09], [75.0, 75.74], [83.0, 83.34], [84.0, 84.86], [86.0, 91.1], [91.0, 93.99], [95.0, 95.44], [113.0, 114.24], [117.0, 117.1], [135.0, 135.57], [139.0, 142.43], [143.0, 146.13], [149.0, 153.64], [157.0, 157.74], [159.0, 159.09], [176.0, 176.49], [183.0, 184.69], [188.0, 190.16]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.17, 0.0, 0.0, 32.38, 34.72, 0.0, 32.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.03, 31.41, 0.0, 0.0, 0.0, 0.0, 29.91, 32.36, 32.0, 0.0, 0.0, 0.0, 0.0, 31.32], "audiomae_on_audioset": [null, null, null, null, null, [["music", 36.49], ["speech", 35.62], ["boing", 9.05]], null, null, [["cattle, bovinae", 47.85], ["moo", 33.61], ["livestock, farm animals, working animals", 13.35]], [["frog", 26.23], ["animal", 12.25], ["chirp, tweet", 9.65]], null, [["animal", 32.95], ["wild animals", 9.68], ["whale vocalization", 8.84]], null, null, null, null, null, null, null, null, [["boing", 70.37], ["moo", 7.13], ["cattle, bovinae", 5.39]], [["boing", 23.31], ["speech", 14.65], ["cattle, bovinae", 9.66]], null, null, null, null, [["music", 27.24], ["carnatic music", 7.13], ["musical instrument", 5.76]], [["boing", 21.88], ["music", 18.55], ["music for children", 9.33]], [["boing", 45.07], ["sheep", 8.97], ["music", 8.25]], null, null, null, null, [["music", 54.49], ["speech", 8.37], ["musical instrument", 1.97]]], "duration": [0.48, 0.0, 0.36, 0.9, 0.13, 11.33, 0.87, 0.67, 3.79, 4.01, 0.72, 3.09, 0.65, 0.9, 0.47, 1.0, 1.09, 0.74, 0.34, 0.86, 5.1, 2.99, 0.44, 1.24, 0.1, 0.57, 3.43, 3.13, 4.64, 0.74, 0.09, 0.49, 1.69, 2.16]} \ No newline at end of file diff --git a/annotations_filtered/fygiSfJjTLc_filtered.json b/annotations_filtered/fygiSfJjTLc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48fa7fbdf72415179cd2f2343bc63ec47a8f7455 --- /dev/null +++ b/annotations_filtered/fygiSfJjTLc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 33.96], [36.0, 36.54], [43.0, 62.78], [66.0, 69.25], [78.0, 83.62], [84.0, 85.16], [86.0, 96.42], [98.0, 99.72], [102.0, 103.91], [104.0, 107.74], [108.0, 108.9], [115.0, 115.48], [116.0, 117.17], [120.0, 120.04], [121.0, 128.19], [128.0, 128.24], [128.0, 131.21], [139.0, 148.83], [155.0, 157.57], [159.0, 159.36], [161.0, 161.25]], "keep_status": [true, false, true, true, false, false, true, false, false, true, false, false, false, false, true, false, true, true, true, false, false], "silence_prob": [35.21, 0.0, 32.11, 30.16, 30.74, 0.0, 30.58, 0.0, 0.0, 36.9, 0.0, 0.0, 0.0, 0.0, 30.48, 0.0, 31.06, 30.59, 40.84, 0.0, 0.0], "audiomae_on_audioset": [[["rumble", 24.33], ["music", 13.49], ["field recording", 6.38]], null, [["hum", 34.71], ["rumble", 14.85], ["mains hum", 10.59]], [["vehicle", 26.92], ["race car, auto racing", 11.81], ["buzz", 11.22]], [["sidetone", 39.9], ["speech", 37.86], ["radio", 2.95]], null, [["speech", 29.98], ["music", 15.7], ["hum", 12.69]], null, null, [["speech", 24.22], ["throbbing", 10.17], ["cheering", 9.73]], null, null, null, null, [["civil defense siren", 11.7], ["speech", 8.42], ["music", 6.34]], null, [["moo", 34.0], ["cattle, bovinae", 28.59], ["livestock, farm animals, working animals", 6.94]], [["music", 35.9], ["didgeridoo", 11.79], ["speech", 9.58]], [["hum", 31.66], ["mains hum", 21.65], ["music", 5.79]], null, null], "duration": [25.96, 0.54, 19.78, 3.25, 5.62, 1.16, 10.42, 1.72, 1.91, 3.74, 0.9, 0.48, 1.17, 0.04, 7.19, 0.24, 3.21, 9.83, 2.57, 0.36, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/fz19xrc_99o_filtered.json b/annotations_filtered/fz19xrc_99o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fe9b1c636b4ce316c96eed7bcdc44d7f1925ef3 --- /dev/null +++ b/annotations_filtered/fz19xrc_99o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.18], [15.0, 18.13], [20.0, 20.9], [21.0, 25.02], [27.0, 48.19], [49.0, 59.95], [60.0, 60.94], [64.0, 67.41], [72.0, 71.86], [73.0, 72.99], [74.0, 76.84], [80.0, 89.83]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [44.75, 99.21, 0.0, 57.81, 70.3, 66.39, 0.0, 80.29, 0.0, 0.0, 81.89, 81.17], "audiomae_on_audioset": [[["speech", 38.1], ["sidetone", 20.11], ["fly, housefly", 6.23]], null, null, null, null, null, null, null, null, null, null, null], "duration": [2.18, 3.13, 0.9, 4.02, 21.19, 10.95, 0.94, 3.41, -0.14, -0.01, 2.84, 9.83]} \ No newline at end of file diff --git a/annotations_filtered/fzAKSbtYBMU_filtered.json b/annotations_filtered/fzAKSbtYBMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f14f9e35867055eab1b227320fb8db0543fdfcf --- /dev/null +++ b/annotations_filtered/fzAKSbtYBMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.13], [5.0, 5.46], [5.0, 5.51], [7.0, 8.45], [8.0, 8.48], [9.0, 8.61], [9.0, 117.58], [119.0, 120.24], [121.0, 121.44]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.13, 0.46, 0.51, 1.45, 0.48, -0.39, 108.58, 1.24, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/fzXK1hDkqYc_filtered.json b/annotations_filtered/fzXK1hDkqYc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7df49870934dc4bd1a066288a6dd20b04be392d6 --- /dev/null +++ b/annotations_filtered/fzXK1hDkqYc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 45.25], [46.0, 47.38], [49.0, 49.65], [52.0, 52.64], [55.0, 55.31], [56.0, 57.06], [60.0, 60.64], [62.0, 62.06], [63.0, 63.02], [64.0, 65.48], [68.0, 68.76], [79.0, 78.88], [83.0, 84.11], [86.0, 86.59], [87.0, 87.54], [88.0, 88.23], [101.0, 102.39], [103.0, 102.78], [106.0, 106.81], [108.0, 108.28], [109.0, 109.0], [121.0, 120.88], [125.0, 125.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [30.25, 1.38, 0.65, 0.64, 0.31, 1.06, 0.64, 0.06, 0.02, 1.48, 0.76, -0.12, 1.11, 0.59, 0.54, 0.23, 1.39, -0.22, 0.81, 0.28, 0.0, -0.12, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/fz_9uPJnGEQ_filtered.json b/annotations_filtered/fz_9uPJnGEQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3643de0711122e2eb8c6d27d383ccfb0dc83d0e8 --- /dev/null +++ b/annotations_filtered/fz_9uPJnGEQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.36], [6.0, 7.64], [9.0, 11.48], [12.0, 23.06], [24.0, 24.39], [25.0, 29.05], [29.0, 29.62], [30.0, 30.32], [31.0, 32.56], [34.0, 39.7], [40.0, 41.86], [42.0, 43.66], [44.0, 45.64], [47.0, 49.87], [51.0, 55.86], [58.0, 58.77], [59.0, 60.35], [61.0, 62.46], [64.0, 65.06], [67.0, 66.93], [68.0, 70.09], [73.0, 74.28], [75.0, 75.44], [76.0, 76.3], [78.0, 78.09], [79.0, 78.68], [79.0, 79.83], [82.0, 82.38], [83.0, 83.88], [84.0, 85.23], [87.0, 87.17], [88.0, 88.84], [89.0, 89.33], [90.0, 90.63], [91.0, 92.96], [94.0, 95.62], [96.0, 99.22], [102.0, 103.98], [105.0, 108.11], [110.0, 110.62], [111.0, 112.01], [112.0, 112.87], [113.0, 115.7], [116.0, 123.18], [124.0, 125.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [91.13, 0.0, 97.92, 96.89, 0.0, 78.72, 0.0, 0.0, 0.0, 98.1, 0.0, 0.0, 0.0, 80.82, 49.82, 0.0, 0.0, 0.0, 0.0, 0.0, 41.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.89, 0.0, 73.82, 0.0, 0.0, 0.0, 81.71, 46.19, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 40.27], ["cattle, bovinae", 18.98], ["moo", 15.45]], null, null, null, null, null, [["music", 45.31], ["speech", 18.81], ["theremin", 3.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.9], ["crow", 15.76], ["caw", 8.57]], null], "duration": [2.36, 1.64, 2.48, 11.06, 0.39, 4.05, 0.62, 0.32, 1.56, 5.7, 1.86, 1.66, 1.64, 2.87, 4.86, 0.77, 1.35, 1.46, 1.06, -0.07, 2.09, 1.28, 0.44, 0.3, 0.09, -0.32, 0.83, 0.38, 0.88, 1.23, 0.17, 0.84, 0.33, 0.63, 1.96, 1.62, 3.22, 1.98, 3.11, 0.62, 1.01, 0.87, 2.7, 7.18, 1.25]} \ No newline at end of file