diff --git a/annotations_filtered/i-2kXcQgs_w_filtered.json b/annotations_filtered/i-2kXcQgs_w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6800b234e211ce713747d1ed25f7a95c685de8ac --- /dev/null +++ b/annotations_filtered/i-2kXcQgs_w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.78], [5.0, 5.75], [10.0, 13.36], [14.0, 15.01], [16.0, 16.77], [18.0, 20.82], [21.0, 21.03], [21.0, 21.07], [21.0, 21.44], [22.0, 22.6], [25.0, 30.13], [33.0, 34.37], [35.0, 36.96], [38.0, 44.36], [45.0, 49.72], [53.0, 53.11], [55.0, 55.92], [60.0, 64.03], [67.0, 68.57], [70.0, 71.25], [73.0, 74.63], [76.0, 85.65], [90.0, 91.76]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 37.81, 0.0, 0.0, 76.37, 0.0, 0.0, 0.0, 0.0, 29.86, 0.0, 0.0, 100.0, 99.85, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 49.05], ["sidetone", 14.96], ["crackle", 3.11]], null, null, null, null, null, null, null, [["speech", 48.12], ["whack, thwack", 13.41], ["music", 5.62]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.78, 0.75, 3.36, 1.01, 0.77, 2.82, 0.03, 0.07, 0.44, 0.6, 5.13, 1.37, 1.96, 6.36, 4.72, 0.11, 0.92, 4.03, 1.57, 1.25, 1.63, 9.65, 1.76]} \ No newline at end of file diff --git a/annotations_filtered/i-9K5-x7_so_filtered.json b/annotations_filtered/i-9K5-x7_so_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7e46fd4ad1298f72aa772d7714d7bb88cd09152 --- /dev/null +++ b/annotations_filtered/i-9K5-x7_so_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[67.0, 69.01], [70.0, 70.48], [71.0, 71.52], [77.0, 80.33], [84.0, 84.99], [91.0, 92.55], [96.0, 100.8], [102.0, 121.17], [124.0, 124.82], [126.0, 126.93], [130.0, 131.21], [132.0, 132.56], [135.0, 136.07], [141.0, 141.29], [145.0, 146.23], [150.0, 150.89], [154.0, 153.87]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [40.59, 0.0, 0.0, 37.42, 0.0, 0.0, 35.94, 32.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 32.97], ["speech", 13.75], ["synthesizer", 11.25]], null, null, [["music", 62.4], ["speech", 13.3], ["musical instrument", 4.67]], null, null, [["music", 56.29], ["speech", 12.83], ["drum machine", 9.63]], [["music", 91.99], ["synthesizer", 1.46], ["musical instrument", 1.26]], null, null, null, null, null, null, null, null, null], "duration": [2.01, 0.48, 0.52, 3.33, 0.99, 1.55, 4.8, 19.17, 0.82, 0.93, 1.21, 0.56, 1.07, 0.29, 1.23, 0.89, -0.13]} \ No newline at end of file diff --git a/annotations_filtered/i-VM7_DJlkQ_filtered.json b/annotations_filtered/i-VM7_DJlkQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9581c3b788f66cf5fa74cdb53f5bba670a0ae780 --- /dev/null +++ b/annotations_filtered/i-VM7_DJlkQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[51.0, 78.49], [81.0, 81.48]], "keep_status": [true, false], "silence_prob": [33.35, 0.0], "audiomae_on_audioset": [[["music", 14.52], ["moo", 11.24], ["fly, housefly", 10.63]], null], "duration": [27.49, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/i-VeLFEMeko_filtered.json b/annotations_filtered/i-VeLFEMeko_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16f1d3195cc26d7f5bc61160eade1f1803063788 --- /dev/null +++ b/annotations_filtered/i-VeLFEMeko_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 28.7], [38.0, 38.89], [40.0, 41.01], [44.0, 44.86], [46.0, 46.74], [51.0, 55.32], [57.0, 57.91], [59.0, 64.89], [77.0, 78.21], [78.0, 79.89], [90.0, 94.85], [100.0, 101.06], [102.0, 103.81], [105.0, 105.92], [108.0, 108.3], [111.0, 112.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.43, 0.0, 0.0, 0.0, 0.0, 72.75, 0.0, 98.8, 0.0, 0.0, 30.87, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 44.12], ["crack", 16.66], ["thunk", 10.3]], null, null, null, null, null], "duration": [2.7, 0.89, 1.01, 0.86, 0.74, 4.32, 0.91, 5.89, 1.21, 1.89, 4.85, 1.06, 1.81, 0.92, 0.3, 1.23]} \ No newline at end of file diff --git a/annotations_filtered/i-bRuSNSvcU_filtered.json b/annotations_filtered/i-bRuSNSvcU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbeb376b5dd9860b7e35e5242f31ee6a632aaf79 --- /dev/null +++ b/annotations_filtered/i-bRuSNSvcU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 57.84], [59.0, 61.23], [61.0, 61.62], [62.0, 61.86], [63.0, 67.04], [68.0, 67.88], [72.0, 73.67], [75.0, 77.68], [80.0, 80.05], [92.0, 91.89], [93.0, 93.72], [94.0, 96.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 79.94, 0.0, 0.0, 83.16, 0.0, 0.0, 99.94, 0.0, 0.0, 0.0, 97.73], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [30.84, 2.23, 0.62, -0.14, 4.04, -0.12, 1.67, 2.68, 0.05, -0.11, 0.72, 2.18]} \ No newline at end of file diff --git a/annotations_filtered/i-f0M5TqmsY_filtered.json b/annotations_filtered/i-f0M5TqmsY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1392981c538bf5221cf62517310aa4885645e33 --- /dev/null +++ b/annotations_filtered/i-f0M5TqmsY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.1], [4.0, 4.92], [20.0, 19.9], [27.0, 27.67], [37.0, 37.99], [44.0, 44.59], [48.0, 47.9], [50.0, 49.91], [53.0, 52.89], [54.0, 53.94], [55.0, 55.49], [68.0, 67.9], [69.0, 68.77], [80.0, 81.55], [82.0, 83.12], [101.0, 101.31], [103.0, 103.23], [105.0, 104.92], [113.0, 114.47], [116.0, 116.72], [122.0, 122.0], [123.0, 126.76], [129.0, 131.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.1, 0.92, -0.1, 0.67, 0.99, 0.59, -0.1, -0.09, -0.11, -0.06, 0.49, -0.1, -0.23, 1.55, 1.12, 0.31, 0.23, -0.08, 1.47, 0.72, 0.0, 3.76, 2.68]} \ No newline at end of file diff --git a/annotations_filtered/i07yEczcujQ_filtered.json b/annotations_filtered/i07yEczcujQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fef55c8bd8975f654568b00e668849d0e4a18e9a --- /dev/null +++ b/annotations_filtered/i07yEczcujQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.65], [13.0, 15.03], [16.0, 16.73], [18.0, 18.17], [19.0, 19.8], [21.0, 21.84], [27.0, 27.11], [29.0, 30.05], [34.0, 37.25], [42.0, 42.9], [44.0, 45.25], [49.0, 50.06], [55.0, 55.12], [57.0, 57.72], [65.0, 65.06], [77.0, 78.24], [80.0, 80.76], [85.0, 86.91], [88.0, 88.69], [90.0, 90.53], [91.0, 92.33], [93.0, 93.99], [97.0, 97.46], [100.0, 100.62], [104.0, 104.33], [107.0, 107.43], [108.0, 108.99]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 49.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 30.49], ["whale vocalization", 15.65], ["hum", 7.21]], null, null, null, null, null, null, [["music", 58.09], ["theremin", 13.29], ["musical instrument", 6.95]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.65, 2.03, 0.73, 0.17, 0.8, 0.84, 0.11, 1.05, 3.25, 0.9, 1.25, 1.06, 0.12, 0.72, 0.06, 1.24, 0.76, 1.91, 0.69, 0.53, 1.33, 0.99, 0.46, 0.62, 0.33, 0.43, 0.99]} \ No newline at end of file diff --git a/annotations_filtered/i0p2X2rQ6Ag_filtered.json b/annotations_filtered/i0p2X2rQ6Ag_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb4acd7818eded6cf1de2f98e268df2e72421ba9 --- /dev/null +++ b/annotations_filtered/i0p2X2rQ6Ag_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 18.5], [19.0, 20.11], [22.0, 23.08], [27.0, 27.21], [31.0, 32.17], [37.0, 37.59], [41.0, 41.49], [43.0, 52.29], [53.0, 53.54], [71.0, 78.58], [80.0, 81.06], [81.0, 81.14], [81.0, 81.55], [86.0, 86.78], [93.0, 94.47], [96.0, 97.31], [99.0, 101.04], [103.0, 104.43], [106.0, 108.33], [110.0, 112.11], [115.0, 116.4], [117.0, 124.33], [127.0, 127.84]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [44.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.0, 0.0, 60.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.71, 0.0, 49.4, 90.95, 0.0, 71.57, 0.0], "audiomae_on_audioset": [[["speech", 22.59], ["mosquito", 20.25], ["fly, housefly", 12.66]], null, null, null, null, null, null, [["music", 68.21], ["musical instrument", 10.08], ["plucked string instrument", 3.78]], null, null, null, null, null, null, null, null, null, null, [["music", 49.12], ["synthesizer", 13.21], ["effects unit", 6.37]], null, null, null, null], "duration": [5.5, 1.11, 1.08, 0.21, 1.17, 0.59, 0.49, 9.29, 0.54, 7.58, 1.06, 0.14, 0.55, 0.78, 1.47, 1.31, 2.04, 1.43, 2.33, 2.11, 1.4, 7.33, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/i1Nh_3JCFj8_filtered.json b/annotations_filtered/i1Nh_3JCFj8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29bbd923d85d3ed7df5077a39611e09c0a51416d --- /dev/null +++ b/annotations_filtered/i1Nh_3JCFj8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.97], [20.0, 21.05], [29.0, 30.43], [32.0, 32.54], [46.0, 47.85], [52.0, 52.59], [65.0, 66.06], [67.0, 67.81], [79.0, 79.41], [80.0, 80.91], [83.0, 82.95], [85.0, 85.9], [87.0, 87.67], [88.0, 88.48], [100.0, 101.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.97, 1.05, 1.43, 0.54, 1.85, 0.59, 1.06, 0.81, 0.41, 0.91, -0.05, 0.9, 0.67, 0.48, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/i1ZUVkU_XK4_filtered.json b/annotations_filtered/i1ZUVkU_XK4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c92ffc61e0058596b37e68ef27ab808bdc2c18a --- /dev/null +++ b/annotations_filtered/i1ZUVkU_XK4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.37], [4.0, 4.75], [6.0, 7.42], [8.0, 9.63], [10.0, 10.79], [18.0, 18.89], [20.0, 21.0], [25.0, 25.08], [26.0, 43.21], [45.0, 45.62], [46.0, 48.51], [51.0, 57.64], [85.0, 85.55], [90.0, 89.78], [94.0, 101.95], [106.0, 113.73], [114.0, 114.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.89, 0.0, 46.29, 50.16, 0.0, 0.0, 52.92, 58.38, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 30.73], ["electric shaver, electric razor", 29.48], ["hum", 17.69]], null, [["music", 31.51], ["speech", 14.19], ["fireworks", 4.47]], null, null, null, null, null, null], "duration": [0.37, 0.75, 1.42, 1.63, 0.79, 0.89, 1.0, 0.08, 17.21, 0.62, 2.51, 6.64, 0.55, -0.22, 7.95, 7.73, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/i1igdJh44yU_filtered.json b/annotations_filtered/i1igdJh44yU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ed6adcd8b04ea7423a8761403bbf52a47ce90ff --- /dev/null +++ b/annotations_filtered/i1igdJh44yU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 34.18], [70.0, 71.42], [74.0, 96.31], [97.0, 97.78], [98.0, 99.49], [101.0, 102.41], [109.0, 111.42], [116.0, 117.12], [123.0, 124.95], [130.0, 131.48], [141.0, 143.45], [148.0, 148.09], [156.0, 158.3]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false, true], "silence_prob": [28.51, 0.0, 28.83, 0.0, 0.0, 0.0, 32.82, 0.0, 0.0, 0.0, 37.04, 0.0, 34.88], "audiomae_on_audioset": [[["music", 62.8], ["electronic music", 11.65], ["speech", 4.74]], null, [["music", 92.84], ["techno", 1.69], ["electronic music", 1.42]], null, null, null, [["livestock, farm animals, working animals", 18.75], ["moo", 16.55], ["sheep", 15.99]], null, null, null, [["speech", 26.5], ["fly, housefly", 15.29], ["insect", 10.15]], null, [["sheep", 13.73], ["bleat", 11.43], ["fly, housefly", 10.85]]], "duration": [25.18, 1.42, 22.31, 0.78, 1.49, 1.41, 2.42, 1.12, 1.95, 1.48, 2.45, 0.09, 2.3]} \ No newline at end of file diff --git a/annotations_filtered/i1lkrSFlpss_filtered.json b/annotations_filtered/i1lkrSFlpss_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6543ffb7539dca277095960d9b81b2bb1ee828c8 --- /dev/null +++ b/annotations_filtered/i1lkrSFlpss_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.27], [5.0, 8.55], [12.0, 14.57], [21.0, 21.71], [23.0, 26.76], [29.0, 29.15], [31.0, 36.66], [37.0, 38.65], [45.0, 50.8], [54.0, 54.11], [56.0, 56.76], [61.0, 64.54], [66.0, 67.88], [68.0, 69.67], [77.0, 80.82], [82.0, 83.93]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.93, 96.66, 0.0, 94.37, 0.0, 97.33, 0.0, 82.97, 0.0, 0.0, 98.8, 0.0, 0.0, 89.54, 0.0], "audiomae_on_audioset": [null, [["hum", 35.82], ["music", 14.8], ["mains hum", 11.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.27, 3.55, 2.57, 0.71, 3.76, 0.15, 5.66, 1.65, 5.8, 0.11, 0.76, 3.54, 1.88, 1.67, 3.82, 1.93]} \ No newline at end of file diff --git a/annotations_filtered/i1n8bNgTUTw_filtered.json b/annotations_filtered/i1n8bNgTUTw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3cde7fd25a3561fe08b2e41d6e36ffa48204a7c --- /dev/null +++ b/annotations_filtered/i1n8bNgTUTw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.99], [5.0, 6.03], [8.0, 13.39], [15.0, 15.26], [16.0, 16.46], [19.0, 20.66], [23.0, 26.99], [41.0, 42.65], [47.0, 49.69], [54.0, 55.75], [58.0, 61.28], [64.0, 65.53], [68.0, 70.34], [71.0, 72.96], [75.0, 75.91], [78.0, 79.51], [83.0, 83.98], [86.0, 87.84], [91.0, 94.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 61.67, 0.0, 0.0, 0.0, 76.86, 0.0, 51.07, 0.0, 56.78, 0.0, 59.33, 0.0, 0.0, 0.0, 0.0, 0.0, 77.03], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.99, 1.03, 5.39, 0.26, 0.46, 1.66, 3.99, 1.65, 2.69, 1.75, 3.28, 1.53, 2.34, 1.96, 0.91, 1.51, 0.98, 1.84, 3.76]} \ No newline at end of file diff --git a/annotations_filtered/i2gVXd7FzhQ_filtered.json b/annotations_filtered/i2gVXd7FzhQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66ecc66fc8ec715cfc476e961b49439ad7d8a6a2 --- /dev/null +++ b/annotations_filtered/i2gVXd7FzhQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.82], [14.0, 15.21], [18.0, 20.06], [24.0, 26.45], [32.0, 33.05], [37.0, 37.23], [38.0, 39.07], [40.0, 41.12], [42.0, 43.33], [46.0, 45.96], [47.0, 49.32], [51.0, 52.22], [56.0, 56.05], [57.0, 61.11], [63.0, 63.37], [64.0, 68.59], [70.0, 71.66], [73.0, 73.58], [77.0, 118.62], [119.0, 127.26], [131.0, 132.58], [134.0, 133.98], [135.0, 135.13], [136.0, 137.49], [139.0, 139.68], [144.0, 150.87], [152.0, 152.41], [155.0, 169.45], [195.0, 199.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 99.48, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.97, 0.0, 0.0, 61.97, 0.0, 51.07, 0.0, 0.0, 0.0, 37.24, 0.0, 0.0, 0.0, 0.0, 0.0, 33.14, 0.0, 34.18, 61.67], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["animal", 21.42], ["sheep", 21.21], ["speech", 12.34]], null, null, null, null, null, [["music", 32.66], ["sonar", 8.38], ["cattle, bovinae", 8.12]], null, [["music", 66.64], ["didgeridoo", 23.64], ["throbbing", 2.27]], null], "duration": [0.82, 1.21, 2.06, 2.45, 1.05, 0.23, 1.07, 1.12, 1.33, -0.04, 2.32, 1.22, 0.05, 4.11, 0.37, 4.59, 1.66, 0.58, 41.62, 8.26, 1.58, -0.02, 0.13, 1.49, 0.68, 6.87, 0.41, 14.45, 4.94]} \ No newline at end of file diff --git a/annotations_filtered/i2xyQnF1kro_filtered.json b/annotations_filtered/i2xyQnF1kro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b73a6af2d0bdcc62c443e4636d02d5550b367abf --- /dev/null +++ b/annotations_filtered/i2xyQnF1kro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.04], [5.0, 21.29], [25.0, 26.33], [27.0, 28.92], [30.0, 30.52], [39.0, 43.39], [44.0, 44.09], [45.0, 45.74], [47.0, 47.51], [53.0, 54.41], [55.0, 56.69], [61.0, 61.26], [62.0, 67.83], [83.0, 84.32], [86.0, 87.13], [88.0, 89.18], [91.0, 93.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 73.21, 0.0, 0.0, 0.0, 78.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.02, 0.0, 0.0, 0.0, 98.27], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 39.01], ["fly, housefly", 17.05], ["insect", 9.94]], null, null, null, null], "duration": [0.04, 16.29, 1.33, 1.92, 0.52, 4.39, 0.09, 0.74, 0.51, 1.41, 1.69, 0.26, 5.83, 1.32, 1.13, 1.18, 2.23]} \ No newline at end of file diff --git a/annotations_filtered/i31XFSORRfc_filtered.json b/annotations_filtered/i31XFSORRfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3bdf27a1003d57e9ad5141a1c68aa02e02bce97 --- /dev/null +++ b/annotations_filtered/i31XFSORRfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 35.72], [37.0, 45.1], [46.0, 51.04], [58.0, 64.05], [66.0, 66.5], [68.0, 95.77], [96.0, 106.76], [108.0, 111.96], [113.0, 123.42], [125.0, 125.27], [126.0, 131.52], [133.0, 135.58], [139.0, 159.33]], "keep_status": [true, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [28.83, 29.49, 29.61, 34.56, 0.0, 32.56, 30.6, 42.58, 30.03, 0.0, 61.18, 29.71, 29.77], "audiomae_on_audioset": [[["music", 31.67], ["hum", 21.22], ["rumble", 10.66]], [["hum", 30.48], ["mains hum", 24.58], ["rumble", 15.42]], [["music", 60.87], ["hum", 5.59], ["mains hum", 4.6]], [["hum", 29.71], ["music", 24.93], ["mains hum", 21.21]], null, [["music", 43.6], ["hum", 29.88], ["mains hum", 12.04]], [["hum", 41.93], ["mains hum", 14.03], ["music", 14.03]], [["music", 67.71], ["sonar", 4.39], ["synthesizer", 3.43]], [["music", 57.83], ["scary music", 16.85], ["speech", 9.69]], null, null, [["music", 51.76], ["speech", 23.55], ["mains hum", 6.43]], [["music", 44.19], ["buzz", 9.36], ["mains hum", 5.14]]], "duration": [8.72, 8.1, 5.04, 6.05, 0.5, 27.77, 10.76, 3.96, 10.42, 0.27, 5.52, 2.58, 20.33]} \ No newline at end of file diff --git a/annotations_filtered/i3EF63p3v-I_filtered.json b/annotations_filtered/i3EF63p3v-I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4af2b8e9d64011ca57c509b880928bedbbea64cb --- /dev/null +++ b/annotations_filtered/i3EF63p3v-I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.1], [10.0, 11.82], [13.0, 16.02], [17.0, 23.95], [29.0, 35.56], [42.0, 43.44], [45.0, 47.19], [48.0, 48.74], [50.0, 50.6], [51.0, 52.05], [56.0, 56.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 68.54, 67.0, 64.18, 0.0, 90.08, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.1, 1.82, 3.02, 6.95, 6.56, 1.44, 2.19, 0.74, 0.6, 1.05, 0.35]} \ No newline at end of file diff --git a/annotations_filtered/i3JbGwGNRI8_filtered.json b/annotations_filtered/i3JbGwGNRI8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7b12c861f81bcb7d9b975068275831c5fb8a47c --- /dev/null +++ b/annotations_filtered/i3JbGwGNRI8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.52], [9.0, 8.87], [11.0, 11.94], [19.0, 19.06], [20.0, 21.96], [23.0, 31.6]], "keep_status": [false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.68], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 24.86], ["music", 12.08], ["mains hum", 10.71]]], "duration": [0.52, -0.13, 0.94, 0.06, 1.96, 8.6]} \ No newline at end of file diff --git a/annotations_filtered/i3VNgECX8Ko_filtered.json b/annotations_filtered/i3VNgECX8Ko_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e335a6d1b95ca7e954f444259faf8b305b3c0b5 --- /dev/null +++ b/annotations_filtered/i3VNgECX8Ko_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.49], [24.0, 26.49], [29.0, 61.16], [63.0, 70.71], [71.0, 71.0], [72.0, 72.13], [76.0, 111.48], [112.0, 111.52]], "keep_status": [false, true, false, true, false, false, false, false], "silence_prob": [0.0, 36.41, 0.0, 34.15, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 42.58], ["hum", 8.19], ["vehicle", 6.54]], null, [["music", 45.39], ["speech", 14.19], ["throbbing", 6.81]], null, null, null, null], "duration": [1.49, 2.49, 32.16, 7.71, 0.0, 0.13, 35.48, -0.48]} \ No newline at end of file diff --git a/annotations_filtered/i3xjZomB1s0_filtered.json b/annotations_filtered/i3xjZomB1s0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a54e4bd8be4de7c5cb0e263535ada8f089eda905 --- /dev/null +++ b/annotations_filtered/i3xjZomB1s0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.38], [6.0, 18.35], [20.0, 19.7], [33.0, 40.29], [41.0, 41.76], [43.0, 43.6], [44.0, 45.06], [64.0, 66.68], [68.0, 69.01], [70.0, 70.56], [71.0, 72.35], [74.0, 74.58], [79.0, 79.66], [82.0, 82.46], [88.0, 89.01], [92.0, 92.52], [93.0, 94.14], [96.0, 96.47], [99.0, 100.01], [102.0, 107.74], [114.0, 114.39], [115.0, 115.94], [118.0, 118.2], [128.0, 129.9]], "keep_status": [false, true, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.31, 0.0, 32.8, 0.0, 0.0, 0.0, 34.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.67, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["sound effect", 12.61], ["vehicle", 12.56], ["buzz", 10.13]], null, [["music", 32.49], ["hum", 19.25], ["mains hum", 13.73]], null, null, null, [["music", 29.43], ["didgeridoo", 10.86], ["foghorn", 9.1]], null, null, null, null, null, null, null, null, null, null, null, [["music", 52.53], ["theremin", 19.7], ["brass instrument", 5.91]], null, null, null, null], "duration": [1.38, 12.35, -0.3, 7.29, 0.76, 0.6, 1.06, 2.68, 1.01, 0.56, 1.35, 0.58, 0.66, 0.46, 1.01, 0.52, 1.14, 0.47, 1.01, 5.74, 0.39, 0.94, 0.2, 1.9]} \ No newline at end of file diff --git a/annotations_filtered/i3yO0OagpNY_filtered.json b/annotations_filtered/i3yO0OagpNY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6df3013821b5a1252ee6035f000eb7c97479aeb0 --- /dev/null +++ b/annotations_filtered/i3yO0OagpNY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 23.45], [24.0, 33.45], [34.0, 34.2], [37.0, 37.77], [41.0, 41.76], [42.0, 59.95], [61.0, 83.2], [83.0, 86.21], [91.0, 116.95], [118.0, 123.75], [124.0, 124.88], [128.0, 154.95]], "keep_status": [true, true, false, false, false, true, true, true, true, true, false, true], "silence_prob": [30.42, 33.9, 0.0, 0.0, 0.0, 35.73, 42.13, 33.85, 30.39, 28.88, 0.0, 28.82], "audiomae_on_audioset": [[["music", 34.23], ["brass instrument", 16.41], ["foghorn", 7.97]], [["music", 50.74], ["brass instrument", 8.72], ["didgeridoo", 8.42]], null, null, null, [["music", 47.46], ["effects unit", 10.6], ["musical instrument", 7.21]], [["music", 51.33], ["synthesizer", 11.76], ["theremin", 5.42]], [["music", 47.53], ["musical instrument", 6.59], ["foghorn", 2.95]], [["music", 26.82], ["theremin", 10.71], ["trombone", 7.77]], [["machine gun", 16.76], ["synthesizer", 13.69], ["music", 11.99]], null, [["music", 62.02], ["electronic music", 3.5], ["eruption", 2.69]]], "duration": [6.45, 9.45, 0.2, 0.77, 0.76, 17.95, 22.2, 3.21, 25.95, 5.75, 0.88, 26.95]} \ No newline at end of file diff --git a/annotations_filtered/i4GeD9FWdG4_filtered.json b/annotations_filtered/i4GeD9FWdG4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71cc3f4bda65f191d935a828576ec6d837cf5628 --- /dev/null +++ b/annotations_filtered/i4GeD9FWdG4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.86], [9.0, 9.93], [14.0, 15.18], [17.0, 18.6], [20.0, 20.6], [27.0, 28.46], [32.0, 33.05], [35.0, 39.46], [42.0, 41.81], [44.0, 44.42], [45.0, 45.08], [49.0, 49.38], [53.0, 55.19], [57.0, 58.06], [60.0, 60.64], [64.0, 64.2], [66.0, 69.69], [70.0, 74.17], [77.0, 80.52], [82.0, 84.16], [84.0, 84.72], [86.0, 86.14], [86.0, 87.05]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.65, 0.0, 0.0, 0.0, 0.0, 85.9, 0.0, 0.0, 0.0, 69.47, 88.1, 80.64, 88.46, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["rumble", 6.95], ["stomach rumble", 6.94], ["speech", 6.47]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.86, 0.93, 1.18, 1.6, 0.6, 1.46, 1.05, 4.46, -0.19, 0.42, 0.08, 0.38, 2.19, 1.06, 0.64, 0.2, 3.69, 4.17, 3.52, 2.16, 0.72, 0.14, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/i4M2tehIejI_filtered.json b/annotations_filtered/i4M2tehIejI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6523949fd751962a76f454160821e91bfa645164 --- /dev/null +++ b/annotations_filtered/i4M2tehIejI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 33.22], [34.0, 41.0], [43.0, 45.18], [48.0, 57.35], [58.0, 97.63]], "keep_status": [false, false, false, false, false], "silence_prob": [72.6, 96.77, 99.76, 58.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [4.22, 7.0, 2.18, 9.35, 39.63]} \ No newline at end of file diff --git a/annotations_filtered/i4NIiCSEiTg_filtered.json b/annotations_filtered/i4NIiCSEiTg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c72f7d29f5f10340fb025a7a62dc6e56307ccbcd --- /dev/null +++ b/annotations_filtered/i4NIiCSEiTg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.48], [6.0, 6.08], [11.0, 11.65], [20.0, 20.83], [21.0, 30.48], [32.0, 32.44], [35.0, 41.69], [44.0, 45.0], [46.0, 47.71], [48.0, 48.86], [49.0, 52.07], [53.0, 54.09], [54.0, 54.67], [55.0, 56.13], [57.0, 57.82], [59.0, 61.33], [64.0, 65.67], [68.0, 73.84], [79.0, 87.59], [88.0, 91.74], [93.0, 96.15], [97.0, 98.54], [100.0, 111.79], [113.0, 114.12], [115.0, 123.87], [126.0, 126.1], [129.0, 130.77]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 66.15, 0.0, 49.87, 0.0, 0.0, 0.0, 58.98, 0.0, 0.0, 0.0, 0.0, 73.97, 0.0, 84.07, 61.97, 76.53, 83.7, 0.0, 38.72, 0.0, 40.59, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 46.88], ["guitar", 9.8], ["singing bowl", 6.34]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.5], ["hum", 7.69], ["cello", 4.24]], null, [["music", 45.64], ["hum", 4.52], ["musical instrument", 3.6]], null, null], "duration": [0.48, 0.08, 0.65, 0.83, 9.48, 0.44, 6.69, 1.0, 1.71, 0.86, 3.07, 1.09, 0.67, 1.13, 0.82, 2.33, 1.67, 5.84, 8.59, 3.74, 3.15, 1.54, 11.79, 1.12, 8.87, 0.1, 1.77]} \ No newline at end of file diff --git a/annotations_filtered/i4NRgUeziqA_filtered.json b/annotations_filtered/i4NRgUeziqA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..733c6ec958d40182a22a7fc9a3baaade45095a32 --- /dev/null +++ b/annotations_filtered/i4NRgUeziqA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 79.54], [84.0, 116.07], [117.0, 120.28], [121.0, 121.54], [124.0, 125.05]], "keep_status": [false, false, true, false, false], "silence_prob": [0.0, 0.0, 29.3, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 46.52], ["eruption", 11.52], ["explosion", 5.15]], null, null], "duration": [75.54, 32.07, 3.28, 0.54, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/i4h9xcdtyrE_filtered.json b/annotations_filtered/i4h9xcdtyrE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58ca485ddd0c0c21870594dfbf99643991b653c8 --- /dev/null +++ b/annotations_filtered/i4h9xcdtyrE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.88], [16.0, 16.34], [17.0, 18.42], [25.0, 25.29], [33.0, 33.89], [36.0, 36.27], [39.0, 44.73], [45.0, 45.5], [46.0, 45.93], [50.0, 51.11], [52.0, 52.0], [52.0, 52.32], [53.0, 53.3], [61.0, 61.05], [81.0, 81.72], [83.0, 83.44], [84.0, 84.27], [111.0, 111.27], [111.0, 116.19], [118.0, 119.18], [120.0, 120.34], [123.0, 123.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.12, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 79.2], ["sidetone", 2.38], ["inside, small room", 1.45]], null, null, null], "duration": [0.88, 0.34, 1.42, 0.29, 0.89, 0.27, 5.73, 0.5, -0.07, 1.11, 0.0, 0.32, 0.3, 0.05, 0.72, 0.44, 0.27, 0.27, 5.19, 1.18, 0.34, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/i5Y6BTlx37s_filtered.json b/annotations_filtered/i5Y6BTlx37s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f55dfd1a74c2a03146798eaf0dcbeab88b582e55 --- /dev/null +++ b/annotations_filtered/i5Y6BTlx37s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 15.33], [16.0, 17.05], [19.0, 19.63], [26.0, 37.83], [39.0, 40.58], [46.0, 50.5], [53.0, 58.45], [60.0, 60.42]], "keep_status": [false, false, false, true, false, true, false, false], "silence_prob": [76.7, 0.0, 0.0, 37.62, 0.0, 35.89, 35.22, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 26.19], ["hum", 14.35], ["gong", 11.92]], null, [["cattle, bovinae", 23.37], ["moo", 17.69], ["livestock, farm animals, working animals", 14.29]], [["music", 58.48], ["theremin", 9.94], ["speech", 6.05]], null], "duration": [7.33, 1.05, 0.63, 11.83, 1.58, 4.5, 5.45, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/i5dTE5dgWOw_filtered.json b/annotations_filtered/i5dTE5dgWOw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b96b967e4703cc639dc5bdded1beaee811e3bbe --- /dev/null +++ b/annotations_filtered/i5dTE5dgWOw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[84.0, 93.66], [95.0, 179.34], [184.0, 184.5], [187.0, 188.03], [189.0, 190.38], [191.0, 208.95]], "keep_status": [false, false, false, false, false, false], "silence_prob": [29.22, 0.0, 0.0, 0.0, 0.0, 30.58], "audiomae_on_audioset": [[["music", 40.22], ["hum", 24.9], ["throbbing", 9.57]], null, null, null, null, [["speech", 63.8], ["hum", 11.05], ["music", 7.46]]], "duration": [9.66, 84.34, 0.5, 1.03, 1.38, 17.95]} \ No newline at end of file diff --git a/annotations_filtered/i5j1wWY-qus_filtered.json b/annotations_filtered/i5j1wWY-qus_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c759519e7d54cd7874b4f58e2520a5b3736bbb4c --- /dev/null +++ b/annotations_filtered/i5j1wWY-qus_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.5], [12.0, 11.67], [12.0, 13.49], [16.0, 16.28], [17.0, 19.3], [23.0, 23.55], [28.0, 33.47], [36.0, 37.54], [39.0, 40.12], [43.0, 44.66], [48.0, 49.52], [50.0, 52.0], [56.0, 57.1], [65.0, 65.11]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, true, false, false], "silence_prob": [34.88, 0.0, 0.0, 0.0, 34.23, 0.0, 42.15, 0.0, 0.0, 0.0, 0.0, 48.56, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 44.91], ["hum", 7.62], ["mains hum", 4.51]], null, null, null, [["cattle, bovinae", 24.86], ["livestock, farm animals, working animals", 16.11], ["moo", 15.28]], null, [["livestock, farm animals, working animals", 35.7], ["cattle, bovinae", 24.48], ["moo", 15.94]], null, null, null, null, [["livestock, farm animals, working animals", 20.39], ["cattle, bovinae", 9.35], ["sidetone", 6.12]], null, null], "duration": [2.5, -0.33, 1.49, 0.28, 2.3, 0.55, 5.47, 1.54, 1.12, 1.66, 1.52, 2.0, 1.1, 0.11]} \ No newline at end of file diff --git a/annotations_filtered/i5jTH89HjTA_filtered.json b/annotations_filtered/i5jTH89HjTA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c74cc7c37ed488683997d88675159271b6e5cfb --- /dev/null +++ b/annotations_filtered/i5jTH89HjTA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.1], [21.0, 22.17], [23.0, 26.42], [28.0, 28.59], [31.0, 31.46], [43.0, 44.19], [45.0, 49.94], [53.0, 53.2], [59.0, 79.95], [81.0, 90.19], [92.0, 94.1], [117.0, 118.37], [119.0, 123.16], [124.0, 126.18], [127.0, 128.39], [132.0, 132.88], [136.0, 136.88]], "keep_status": [false, false, false, false, false, false, true, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.4, 0.0, 0.0, 0.0, 43.77, 0.0, 31.21, 42.42, 53.78, 0.0, 64.86, 65.91, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 32.88], ["mains hum", 29.34], ["throbbing", 8.61]], null, null, null, [["fly, housefly", 29.01], ["frog", 25.17], ["insect", 12.64]], null, [["music", 49.38], ["theremin", 8.11], ["brass instrument", 5.95]], [["bee, wasp, etc.", 40.04], ["fly, housefly", 14.39], ["speech", 13.82]], null, null, null, null, null, null, null], "duration": [0.1, 1.17, 3.42, 0.59, 0.46, 1.19, 4.94, 0.2, 20.95, 9.19, 2.1, 1.37, 4.16, 2.18, 1.39, 0.88, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/i5mSHPKEbas_filtered.json b/annotations_filtered/i5mSHPKEbas_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52ee024c25bc08edc47fcbe394a48506d56f7ac4 --- /dev/null +++ b/annotations_filtered/i5mSHPKEbas_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [10.0, 13.12], [16.0, 16.58], [17.0, 17.79], [19.0, 19.87], [21.0, 21.02], [23.0, 48.68], [50.0, 50.43], [51.0, 51.6], [52.0, 54.14], [55.0, 56.07], [57.0, 58.4], [59.0, 62.13], [64.0, 67.0], [68.0, 69.48], [70.0, 70.26], [78.0, 78.7], [80.0, 81.18], [85.0, 84.97], [86.0, 87.61], [88.0, 88.92], [90.0, 91.5], [93.0, 94.15], [94.0, 94.69], [98.0, 98.79], [100.0, 101.01], [102.0, 105.63], [106.0, 108.18], [109.0, 109.83], [111.0, 112.51], [114.0, 117.75], [118.0, 119.89], [121.0, 122.72], [124.0, 125.95]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 44.29, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 40.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.31, 98.36, 0.0, 0.0, 92.8, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["sidetone", 25.59], ["fly, housefly", 11.73], ["radio", 7.79]], null, null, null, null, null, null, null, null, null, null, null, [["radio", 22.56], ["moo", 11.1], ["cattle, bovinae", 9.85]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 3.12, 0.58, 0.79, 0.87, 0.02, 25.68, 0.43, 0.6, 2.14, 1.07, 1.4, 3.13, 3.0, 1.48, 0.26, 0.7, 1.18, -0.03, 1.61, 0.92, 1.5, 1.15, 0.69, 0.79, 1.01, 3.63, 2.18, 0.83, 1.51, 3.75, 1.89, 1.72, 1.95]} \ No newline at end of file diff --git a/annotations_filtered/i6OCtSqrOQ0_filtered.json b/annotations_filtered/i6OCtSqrOQ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e7ff120828c9cf0ff7b37667fe0072f1a4b99b8 --- /dev/null +++ b/annotations_filtered/i6OCtSqrOQ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.94], [18.0, 18.49], [20.0, 21.79], [23.0, 25.96], [29.0, 51.12], [53.0, 55.93], [63.0, 64.05], [65.0, 65.11], [67.0, 67.29], [68.0, 69.77], [71.0, 71.09], [72.0, 77.6], [80.0, 80.77], [83.0, 84.18], [85.0, 85.62], [88.0, 89.9], [90.0, 90.1], [95.0, 100.95], [105.0, 106.17], [107.0, 107.77], [116.0, 116.88], [118.0, 118.37], [121.0, 123.42], [124.0, 125.27], [127.0, 137.35], [138.0, 142.57], [144.0, 144.17], [152.0, 160.19]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.32, 41.91, 99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 94.22, 0.0, 0.0, 0.0, 0.0, 0.0, 44.6, 0.0, 0.0, 0.0, 0.0, 55.31, 0.0, 36.25, 33.75, 0.0, 33.26], "audiomae_on_audioset": [null, null, null, [["hum", 21.47], ["creak", 16.66], ["throbbing", 10.75]], [["synthesizer", 23.99], ["music", 16.39], ["effects unit", 7.47]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 28.97], ["beatboxing", 28.26], ["vocal music", 7.02]], null, null, null, null, null, null, [["dial tone", 42.47], ["speech", 33.27], ["burping, eructation", 6.19]], [["speech", 50.23], ["moo", 8.31], ["cattle, bovinae", 8.28]], null, [["speech", 66.96], ["sidetone", 6.69], ["radio", 4.21]]], "duration": [1.94, 0.49, 1.79, 2.96, 22.12, 2.93, 1.05, 0.11, 0.29, 1.77, 0.09, 5.6, 0.77, 1.18, 0.62, 1.9, 0.1, 5.95, 1.17, 0.77, 0.88, 0.37, 2.42, 1.27, 10.35, 4.57, 0.17, 8.19]} \ No newline at end of file diff --git a/annotations_filtered/i6klSHVWbrk_filtered.json b/annotations_filtered/i6klSHVWbrk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b271be3660b92ca6623f89513ff7c9ad84e7d54e --- /dev/null +++ b/annotations_filtered/i6klSHVWbrk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 16.95], [23.0, 31.94], [42.0, 75.17]], "keep_status": [false, true, false], "silence_prob": [30.62, 31.85, 0.0], "audiomae_on_audioset": [[["whale vocalization", 79.55], ["noise", 3.06], ["stomach rumble", 2.88]], [["hum", 31.95], ["speech", 12.99], ["music", 12.65]], null], "duration": [4.95, 8.94, 33.17]} \ No newline at end of file diff --git a/annotations_filtered/i6n8VyqaCQ4_filtered.json b/annotations_filtered/i6n8VyqaCQ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ac75bb1afe0cc0200e11086b2b6e6ac84895d52 --- /dev/null +++ b/annotations_filtered/i6n8VyqaCQ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.29], [6.0, 6.64], [9.0, 8.94], [17.0, 16.95], [18.0, 18.93], [20.0, 21.25], [23.0, 24.7], [26.0, 27.41], [34.0, 34.72], [37.0, 37.66], [38.0, 38.64], [40.0, 40.76], [42.0, 42.04], [45.0, 49.71], [51.0, 52.03], [55.0, 55.75], [64.0, 75.1], [78.0, 79.69], [82.0, 83.02], [84.0, 92.08], [93.0, 94.29], [95.0, 105.44], [106.0, 107.92], [110.0, 115.52], [117.0, 117.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92, 0.0, 0.0, 52.98, 0.0, 0.0, 90.08, 0.0, 66.63, 0.0, 91.81, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.29, 0.64, -0.06, -0.05, 0.93, 1.25, 1.7, 1.41, 0.72, 0.66, 0.64, 0.76, 0.04, 4.71, 1.03, 0.75, 11.1, 1.69, 1.02, 8.08, 1.29, 10.44, 1.92, 5.52, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/i6oNzS6kCR8_filtered.json b/annotations_filtered/i6oNzS6kCR8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..938ec32a033bc4a9e36482ad1105607487383dd4 --- /dev/null +++ b/annotations_filtered/i6oNzS6kCR8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.41], [9.0, 11.57], [14.0, 13.88], [15.0, 16.01], [19.0, 20.78], [23.0, 23.7], [25.0, 28.71], [31.0, 31.97], [33.0, 33.52], [34.0, 100.47], [102.0, 101.83]], "keep_status": [true, true, false, false, false, false, true, false, false, false, false], "silence_prob": [35.46, 42.74, 0.0, 0.0, 0.0, 0.0, 44.26, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["fly, housefly", 24.62], ["insect", 16.06], ["mains hum", 9.96]], [["speech", 14.46], ["music", 12.95], ["electric shaver, electric razor", 12.1]], null, null, null, null, [["music", 29.52], ["speech", 18.63], ["ding", 4.24]], null, null, null, null], "duration": [5.41, 2.57, -0.12, 1.01, 1.78, 0.7, 3.71, 0.97, 0.52, 66.47, -0.17]} \ No newline at end of file diff --git a/annotations_filtered/i6ymVjU5hno_filtered.json b/annotations_filtered/i6ymVjU5hno_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc2f47efbbc82a462ae1cc1d4e0e6c6069998929 --- /dev/null +++ b/annotations_filtered/i6ymVjU5hno_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.72], [9.0, 9.0], [10.0, 11.5], [13.0, 14.62], [16.0, 19.23], [21.0, 22.65], [24.0, 26.92], [28.0, 30.47], [31.0, 43.11], [45.0, 45.25], [48.0, 48.74], [50.0, 50.57], [52.0, 52.29], [53.0, 54.41], [55.0, 56.71], [59.0, 61.48], [64.0, 66.56], [69.0, 70.44], [72.0, 72.72], [74.0, 76.3], [79.0, 81.33], [84.0, 85.43], [89.0, 89.51], [90.0, 93.31], [95.0, 96.3], [97.0, 98.47], [101.0, 102.64], [104.0, 105.36], [107.0, 107.43], [109.0, 109.48], [110.0, 111.65], [113.0, 113.8], [116.0, 115.67], [118.0, 119.74], [121.0, 123.6], [127.0, 129.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [64.52, 0.0, 0.0, 0.0, 92.48, 0.0, 73.36, 85.9, 44.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.12, 55.89, 0.0, 0.0, 59.42, 83.88, 0.0, 0.0, 79.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.95, 37.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 44.59], ["effects unit", 24.91], ["guitar", 8.76]], null, null, null, null, null, null, [["mains hum", 32.97], ["sidetone", 22.37], ["hum", 21.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 30.55], ["speech", 16.95], ["hum", 13.4]], [["speech", 62.34], ["mains hum", 5.85], ["noise", 4.55]]], "duration": [3.72, 0.0, 1.5, 1.62, 3.23, 1.65, 2.92, 2.47, 12.11, 0.25, 0.74, 0.57, 0.29, 1.41, 1.71, 2.48, 2.56, 1.44, 0.72, 2.3, 2.33, 1.43, 0.51, 3.31, 1.3, 1.47, 1.64, 1.36, 0.43, 0.48, 1.65, 0.8, -0.33, 1.74, 2.6, 2.03]} \ No newline at end of file diff --git a/annotations_filtered/i7AUpGXLDdk_filtered.json b/annotations_filtered/i7AUpGXLDdk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc10456d4dad14bd393044e22209abebef12ff51 --- /dev/null +++ b/annotations_filtered/i7AUpGXLDdk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 25.22], [36.0, 37.72], [53.0, 52.91], [63.0, 63.71]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.22, 1.72, -0.09, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/i7Jg_6-fYF8_filtered.json b/annotations_filtered/i7Jg_6-fYF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c603b9c662a3b6532b97e01632555dc8a937a9f --- /dev/null +++ b/annotations_filtered/i7Jg_6-fYF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.24], [6.0, 11.72], [14.0, 32.58], [35.0, 36.88], [41.0, 41.05], [42.0, 42.72], [45.0, 45.08], [46.0, 46.5], [48.0, 50.04], [54.0, 54.08], [56.0, 56.57], [62.0, 67.98], [69.0, 76.77], [80.0, 81.26], [86.0, 86.31], [88.0, 118.2], [120.0, 152.44]], "keep_status": [false, true, true, false, false, false, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 32.58, 30.45, 0.0, 0.0, 0.0, 0.0, 0.0, 33.56, 0.0, 0.0, 46.29, 51.02, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 44.86], ["livestock, farm animals, working animals", 6.42], ["fly, housefly", 5.37]], [["speech", 27.71], ["explosion", 21.89], ["artillery fire", 11.64]], null, null, null, null, null, [["speech", 32.85], ["whack, thwack", 23.92], ["hum", 5.26]], null, null, [["speech", 49.74], ["hum", 11.0], ["mains hum", 5.22]], null, null, null, null, null], "duration": [0.24, 5.72, 18.58, 1.88, 0.05, 0.72, 0.08, 0.5, 2.04, 0.08, 0.57, 5.98, 7.77, 1.26, 0.31, 30.2, 32.44]} \ No newline at end of file diff --git a/annotations_filtered/i7KcAEPxDwQ_filtered.json b/annotations_filtered/i7KcAEPxDwQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74d3013bf8abd41040d2412b51f917ae0e123121 --- /dev/null +++ b/annotations_filtered/i7KcAEPxDwQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.16], [10.0, 10.18], [11.0, 34.86], [43.0, 43.93], [48.0, 56.94], [59.0, 74.76], [78.0, 78.83]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.04, 0.0, 35.53, 69.74, 0.0], "audiomae_on_audioset": [null, null, [["speech", 73.25], ["music", 16.39], ["didgeridoo", 2.4]], null, [["hum", 50.14], ["mains hum", 27.54], ["music", 4.37]], null, null], "duration": [0.16, 0.18, 23.86, 0.93, 8.94, 15.76, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/i7hF7BAKV_I_filtered.json b/annotations_filtered/i7hF7BAKV_I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6c1e4720cda21df593e885614f4d1258c9a5c35 --- /dev/null +++ b/annotations_filtered/i7hF7BAKV_I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 55.81], [56.0, 56.81], [57.0, 62.33], [65.0, 82.26], [83.0, 83.91], [84.0, 86.36]], "keep_status": [true, false, false, false, false, false], "silence_prob": [28.66, 0.0, 34.68, 36.37, 0.0, 53.72], "audiomae_on_audioset": [[["music", 45.12], ["speech", 12.72], ["beatboxing", 6.75]], null, [["music", 52.12], ["speech", 14.91], ["didgeridoo", 4.78]], [["speech", 34.56], ["fart", 29.46], ["fly, housefly", 12.8]], null, null], "duration": [24.81, 0.81, 5.33, 17.26, 0.91, 2.36]} \ No newline at end of file diff --git a/annotations_filtered/i7hk-TupE5g_filtered.json b/annotations_filtered/i7hk-TupE5g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..454e2c5769035d274cb95158b56829554abf89c8 --- /dev/null +++ b/annotations_filtered/i7hk-TupE5g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.37], [6.0, 9.0], [14.0, 15.67], [17.0, 18.18], [20.0, 19.8], [21.0, 21.47], [23.0, 26.08], [27.0, 29.02], [35.0, 37.1], [40.0, 42.3], [46.0, 47.07], [50.0, 52.07], [54.0, 55.38], [62.0, 62.95], [64.0, 65.45], [68.0, 68.45], [70.0, 70.73], [72.0, 74.49], [76.0, 76.28], [77.0, 77.43], [80.0, 81.06], [83.0, 83.52], [85.0, 85.75], [87.0, 88.74], [98.0, 98.24], [101.0, 102.27], [105.0, 105.68], [110.0, 112.01], [114.0, 115.15], [120.0, 121.32], [127.0, 127.41], [131.0, 131.46]], "keep_status": [false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 32.42, 0.0, 0.0, 0.0, 0.0, 38.37, 37.3, 33.25, 36.02, 0.0, 33.4, 0.0, 0.0, 0.0, 0.0, 0.0, 33.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.27, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 47.06], ["didgeridoo", 33.52], ["hum", 3.51]], null, null, null, null, [["mains hum", 47.05], ["hum", 35.17], ["music", 4.99]], [["wind instrument, woodwind instrument", 9.45], ["shofar", 8.14], ["speech", 7.77]], [["music", 23.11], ["mains hum", 11.33], ["hum", 10.84]], [["mains hum", 13.68], ["hum", 11.76], ["music", 7.19]], null, [["speech", 54.41], ["music", 13.1], ["hum", 7.43]], null, null, null, null, null, [["sidetone", 62.51], ["mains hum", 23.0], ["hum", 6.4]], null, null, null, null, null, null, null, null, null, [["music", 42.51], ["didgeridoo", 5.5], ["speech", 5.18]], null, null, null, null], "duration": [0.37, 3.0, 1.67, 1.18, -0.2, 0.47, 3.08, 2.02, 2.1, 2.3, 1.07, 2.07, 1.38, 0.95, 1.45, 0.45, 0.73, 2.49, 0.28, 0.43, 1.06, 0.52, 0.75, 1.74, 0.24, 1.27, 0.68, 2.01, 1.15, 1.32, 0.41, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/i7tGEEWQIhQ_filtered.json b/annotations_filtered/i7tGEEWQIhQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dbbc19ba4701aa57eed283dd270048c3cbb808e6 --- /dev/null +++ b/annotations_filtered/i7tGEEWQIhQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.47], [3.0, 5.56], [6.0, 7.18], [9.0, 12.38], [14.0, 14.12], [15.0, 18.79], [20.0, 21.78], [23.0, 25.34], [28.0, 29.67], [31.0, 31.72], [32.0, 33.17], [37.0, 37.67], [38.0, 38.92], [40.0, 40.63], [44.0, 49.1], [50.0, 51.76], [52.0, 53.77], [54.0, 56.56], [59.0, 60.27], [63.0, 63.14], [69.0, 70.06], [71.0, 71.93], [95.0, 99.57], [101.0, 103.47]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 59.68, 0.0, 82.07, 0.0, 90.08, 0.0, 49.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.89, 0.0, 0.0, 43.38, 0.0, 0.0, 0.0, 0.0, 100.0, 82.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 29.34], ["sine wave", 16.85], ["sidetone", 10.24]], null, null, null, null, null, null, null, null, null, [["sidetone", 58.48], ["speech", 23.71], ["dial tone", 3.99]], null, null, null, null, null, null], "duration": [0.47, 2.56, 1.18, 3.38, 0.12, 3.79, 1.78, 2.34, 1.67, 0.72, 1.17, 0.67, 0.92, 0.63, 5.1, 1.76, 1.77, 2.56, 1.27, 0.14, 1.06, 0.93, 4.57, 2.47]} \ No newline at end of file diff --git a/annotations_filtered/i7vKbmKF9VI_filtered.json b/annotations_filtered/i7vKbmKF9VI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab2fceed2e8718a85551ebcc2fd02d964eaaf767 --- /dev/null +++ b/annotations_filtered/i7vKbmKF9VI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.48], [11.0, 12.9], [13.0, 14.84], [16.0, 17.83], [29.0, 30.06], [34.0, 34.16], [40.0, 43.11], [44.0, 44.71], [50.0, 57.4], [59.0, 60.64], [62.0, 63.41], [70.0, 71.05], [73.0, 73.3], [77.0, 78.51], [91.0, 91.25], [93.0, 97.41], [98.0, 99.42], [101.0, 104.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 99.48], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.48, 1.9, 1.84, 1.83, 1.06, 0.16, 3.11, 0.71, 7.4, 1.64, 1.41, 1.05, 0.3, 1.51, 0.25, 4.41, 1.42, 3.21]} \ No newline at end of file diff --git a/annotations_filtered/i812ZsyyeLg_filtered.json b/annotations_filtered/i812ZsyyeLg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32e2a10aeee56e7654ce0362d7def06d093f5d24 --- /dev/null +++ b/annotations_filtered/i812ZsyyeLg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.57], [4.0, 7.96], [9.0, 10.74], [12.0, 12.88], [17.0, 17.52], [19.0, 19.55], [22.0, 23.41], [24.0, 24.63], [26.0, 46.16], [48.0, 65.74], [66.0, 66.45], [68.0, 68.59], [70.0, 69.82], [70.0, 70.33], [72.0, 73.13], [75.0, 74.92], [77.0, 77.41], [79.0, 78.97], [82.0, 84.5], [85.0, 85.63], [89.0, 89.7], [90.0, 92.13], [93.0, 94.56], [101.0, 101.66], [106.0, 114.59], [115.0, 116.34], [117.0, 123.74], [125.0, 125.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 50.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.82, 66.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.45, 0.0, 0.0, 96.29, 0.0, 0.0, 73.36, 0.0, 33.47, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["mosquito", 67.28], ["fly, housefly", 21.75], ["insect", 9.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 18.45], ["cattle, bovinae", 17.78], ["moo", 14.76]], null], "duration": [0.57, 3.96, 1.74, 0.88, 0.52, 0.55, 1.41, 0.63, 20.16, 17.74, 0.45, 0.59, -0.18, 0.33, 1.13, -0.08, 0.41, -0.03, 2.5, 0.63, 0.7, 2.13, 1.56, 0.66, 8.59, 1.34, 6.74, 0.27]} \ No newline at end of file diff --git a/annotations_filtered/i94ldGNNSQ0_filtered.json b/annotations_filtered/i94ldGNNSQ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..707f10025ff6ec4ee737e087157585d5b6b3bfab --- /dev/null +++ b/annotations_filtered/i94ldGNNSQ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 38.45], [40.0, 40.71], [41.0, 60.84], [63.0, 112.45], [112.0, 112.55]], "keep_status": [false, false, true, false, false], "silence_prob": [0.0, 0.0, 36.6, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 29.41], ["music", 17.12], ["mains hum", 13.52]], null, null], "duration": [35.45, 0.71, 19.84, 49.45, 0.55]} \ No newline at end of file diff --git a/annotations_filtered/i9DMpMCCxuE_filtered.json b/annotations_filtered/i9DMpMCCxuE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ea36af102db8259b8c107e2637c819ee2202bc5 --- /dev/null +++ b/annotations_filtered/i9DMpMCCxuE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.17], [14.0, 15.15], [17.0, 17.17], [27.0, 28.09], [32.0, 33.88], [34.0, 38.97], [42.0, 42.99]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.35, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 52.34], ["speech", 33.56], ["synthesizer", 5.91]], null], "duration": [1.17, 1.15, 0.17, 1.09, 1.88, 4.97, 0.99]} \ No newline at end of file diff --git a/annotations_filtered/i9Iy9amffa4_filtered.json b/annotations_filtered/i9Iy9amffa4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..185cd4f27e14c4977964e257a9ce804805c7bd60 --- /dev/null +++ b/annotations_filtered/i9Iy9amffa4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.4], [13.0, 13.05], [15.0, 15.9], [16.0, 16.7], [17.0, 17.68], [19.0, 19.53], [21.0, 21.59], [23.0, 24.17], [27.0, 26.81], [28.0, 28.14], [29.0, 29.49], [32.0, 32.85], [45.0, 47.6], [60.0, 61.38], [62.0, 62.43], [70.0, 69.94], [91.0, 92.7], [94.0, 94.54], [98.0, 111.82], [113.0, 144.31], [148.0, 150.16], [152.0, 153.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.25, 0.0, 0.0, 0.0, 0.0, 0.0, 31.2, 0.0, 31.36, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.94], ["trombone", 19.42], ["brass instrument", 17.97]], null, null, null, null, null, [["music", 55.24], ["whistling", 29.99], ["theremin", 6.47]], null, [["music", 22.85], ["cacophony", 6.41], ["radio", 6.04]], null], "duration": [0.4, 0.05, 0.9, 0.7, 0.68, 0.53, 0.59, 1.17, -0.19, 0.14, 0.49, 0.85, 2.6, 1.38, 0.43, -0.06, 1.7, 0.54, 13.82, 31.31, 2.16, 1.71]} \ No newline at end of file diff --git a/annotations_filtered/i9KJXFbkMH0_filtered.json b/annotations_filtered/i9KJXFbkMH0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b27c6aa3169ce81c1d356eb01538859384fa0e77 --- /dev/null +++ b/annotations_filtered/i9KJXFbkMH0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.92], [4.0, 3.91], [7.0, 7.2], [12.0, 80.15]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [-0.08, -0.09, 0.2, 68.15]} \ No newline at end of file diff --git a/annotations_filtered/i9NIwHKBqy0_filtered.json b/annotations_filtered/i9NIwHKBqy0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b49d669da925a0376fe95ff0fee95ddb5303a5a1 --- /dev/null +++ b/annotations_filtered/i9NIwHKBqy0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.67], [25.0, 30.38], [31.0, 37.25], [39.0, 39.85], [53.0, 55.53], [61.0, 61.47], [64.0, 64.64], [70.0, 70.92], [74.0, 93.9], [95.0, 99.55], [114.0, 127.57], [130.0, 145.07], [146.0, 146.48], [148.0, 157.89], [158.0, 157.94], [158.0, 158.53]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.65, 32.77, 0.0, 31.91, 0.0, 0.0, 0.0, 30.01, 29.58, 29.74, 30.02, 0.0, 29.83, 0.0, 0.0], "audiomae_on_audioset": [null, [["whale vocalization", 45.08], ["speech", 14.03], ["animal", 6.72]], [["whale vocalization", 15.04], ["theremin", 9.6], ["speech", 8.74]], null, [["music", 71.97], ["speech", 11.51], ["musical instrument", 2.81]], null, null, null, [["music", 51.49], ["speech", 18.0], ["hum", 8.15]], [["theremin", 53.37], ["music", 33.38], ["musical instrument", 3.0]], [["music", 65.04], ["speech", 7.64], ["didgeridoo", 4.63]], [["music", 69.53], ["musical instrument", 10.85], ["theremin", 5.6]], null, [["music", 69.01], ["speech", 15.6], ["musical instrument", 1.99]], null, null], "duration": [-0.33, 5.38, 6.25, 0.85, 2.53, 0.47, 0.64, 0.92, 19.9, 4.55, 13.57, 15.07, 0.48, 9.89, -0.06, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/i9_lCyG67Rc_filtered.json b/annotations_filtered/i9_lCyG67Rc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95b26e42393f80de0089e7f416faafbd3b8886ae --- /dev/null +++ b/annotations_filtered/i9_lCyG67Rc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.98], [16.0, 16.93], [23.0, 24.02], [36.0, 36.56], [49.0, 49.57], [52.0, 52.44], [58.0, 61.2], [61.0, 66.88], [70.0, 69.94], [72.0, 71.98], [75.0, 77.18], [82.0, 84.65], [90.0, 92.15]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.16, 32.89, 0.0, 0.0, 31.06, 29.71, 29.9], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 40.74], ["foghorn", 15.5], ["theremin", 9.65]], [["foghorn", 82.07], ["music", 8.62], ["theremin", 2.12]], null, null, [["music", 22.46], ["synthesizer", 8.59], ["foghorn", 8.53]], [["music", 54.1], ["theremin", 28.32], ["musical instrument", 3.37]], [["speech", 41.88], ["vehicle", 5.78], ["crowd", 4.25]]], "duration": [-0.02, 0.93, 1.02, 0.56, 0.57, 0.44, 3.2, 5.88, -0.06, -0.02, 2.18, 2.65, 2.15]} \ No newline at end of file diff --git a/annotations_filtered/i9upvWNN3P8_filtered.json b/annotations_filtered/i9upvWNN3P8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f4999acdbe90014cbfe64367386f04f33f1d7d1 --- /dev/null +++ b/annotations_filtered/i9upvWNN3P8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 17.47], [20.0, 21.15], [23.0, 23.16], [24.0, 24.39], [61.0, 61.5]], "keep_status": [false, false, false, false, false], "silence_prob": [51.12, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [8.47, 1.15, 0.16, 0.39, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/iAMImEbSpDk_filtered.json b/annotations_filtered/iAMImEbSpDk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1def95ef0487af4f8c4679b0c20d8cb9dc388f67 --- /dev/null +++ b/annotations_filtered/iAMImEbSpDk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 45.91], [47.0, 47.71], [50.0, 55.9], [64.0, 64.34], [65.0, 64.52], [65.0, 64.93], [67.0, 67.2], [70.0, 73.2], [77.0, 81.68], [83.0, 83.69], [93.0, 94.9], [98.0, 100.67], [103.0, 103.45], [104.0, 104.75], [106.0, 105.93], [111.0, 110.74], [121.0, 127.35], [127.0, 127.4], [129.0, 129.34], [134.0, 136.86], [142.0, 142.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.91, 0.0, 68.54, 0.0, 0.0, 0.0, 0.0, 67.76, 78.38, 0.0, 0.0, 97.64, 0.0, 0.0, 0.0, 0.0, 38.78, 0.0, 0.0, 52.74, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 76.27], ["boing", 4.54], ["speech", 4.22]], null, null, null, null], "duration": [2.91, 0.71, 5.9, 0.34, -0.48, -0.07, 0.2, 3.2, 4.68, 0.69, 1.9, 2.67, 0.45, 0.75, -0.07, -0.26, 6.35, 0.4, 0.34, 2.86, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/iA_KZwlnrcI_filtered.json b/annotations_filtered/iA_KZwlnrcI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c44f17dd7a31daf0b0d8623b860b16e889f2e1f2 --- /dev/null +++ b/annotations_filtered/iA_KZwlnrcI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.9], [10.0, 11.11], [12.0, 14.94], [15.0, 18.87], [20.0, 22.15], [23.0, 29.25], [31.0, 34.1], [37.0, 43.65], [44.0, 57.54], [61.0, 64.3], [65.0, 66.12], [68.0, 78.78], [81.0, 126.49], [127.0, 127.79]], "keep_status": [false, false, false, true, false, false, false, true, true, true, false, false, false, false], "silence_prob": [67.0, 0.0, 63.42, 44.93, 57.72, 74.44, 72.16, 31.39, 35.03, 30.71, 0.0, 31.55, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 46.88], ["whale vocalization", 8.01], ["music", 7.29]], null, null, null, [["music", 27.31], ["electric shaver, electric razor", 19.58], ["speech", 9.52]], [["music", 40.95], ["didgeridoo", 14.58], ["hum", 10.4]], [["hum", 22.51], ["throbbing", 18.8], ["speech", 15.09]], null, [["throbbing", 52.77], ["hum", 17.72], ["music", 11.24]], null, null], "duration": [2.9, 1.11, 2.94, 3.87, 2.15, 6.25, 3.1, 6.65, 13.54, 3.3, 1.12, 10.78, 45.49, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/iAlU6xt7Y_s_filtered.json b/annotations_filtered/iAlU6xt7Y_s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3601bb7d165c4645408cc04f0aaeb44bf89b37ee --- /dev/null +++ b/annotations_filtered/iAlU6xt7Y_s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.89], [4.0, 5.24], [9.0, 10.35], [11.0, 12.11], [16.0, 15.9], [18.0, 18.91], [19.0, 20.38], [23.0, 25.24], [26.0, 26.42], [27.0, 28.97], [36.0, 37.29], [39.0, 39.16], [41.0, 41.96], [44.0, 45.81], [46.0, 48.59], [49.0, 58.02], [61.0, 65.26], [70.0, 70.39], [78.0, 79.81], [82.0, 85.21], [95.0, 96.21], [97.0, 100.5], [102.0, 106.52], [108.0, 109.86], [114.0, 116.04], [118.0, 119.97], [121.0, 128.78], [130.0, 130.23], [131.0, 138.27], [140.0, 140.05], [140.0, 141.56], [144.0, 144.15], [146.0, 146.7], [147.0, 148.39], [149.0, 149.01], [150.0, 150.87], [152.0, 154.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.72, 87.92, 95.91, 0.0, 0.0, 96.77, 0.0, 85.35, 87.55, 0.0, 50.02, 0.0, 99.26, 0.0, 43.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 39.09], ["sidetone", 34.01], ["hum", 7.22]], null, null, null, null, null, null, null, null], "duration": [0.89, 1.24, 1.35, 1.11, -0.1, 0.91, 1.38, 2.24, 0.42, 1.97, 1.29, 0.16, 0.96, 1.81, 2.59, 9.02, 4.26, 0.39, 1.81, 3.21, 1.21, 3.5, 4.52, 1.86, 2.04, 1.97, 7.78, 0.23, 7.27, 0.05, 1.56, 0.15, 0.7, 1.39, 0.01, 0.87, 2.41]} \ No newline at end of file diff --git a/annotations_filtered/iAzMFB3QaBk_filtered.json b/annotations_filtered/iAzMFB3QaBk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e4d22e2e43f627c211b0b45500fcf1c3c70ebb4 --- /dev/null +++ b/annotations_filtered/iAzMFB3QaBk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.06], [4.0, 5.04], [9.0, 9.73], [13.0, 14.22], [17.0, 17.58], [22.0, 22.0], [24.0, 25.66], [42.0, 43.7], [45.0, 45.91], [54.0, 54.4], [63.0, 63.61], [66.0, 67.12], [68.0, 70.01], [73.0, 74.61], [76.0, 76.99], [77.0, 78.06], [78.0, 84.69], [85.0, 85.67], [86.0, 90.02], [94.0, 95.54], [97.0, 97.73], [98.0, 100.01], [112.0, 112.51], [113.0, 114.79], [121.0, 121.9], [126.0, 128.28], [129.0, 129.44], [141.0, 142.23], [144.0, 147.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.46, 0.0, 0.0, 0.0, 93.6, 0.0, 48.39, 0.0, 0.0, 70.44, 0.0, 0.0, 0.0, 47.39, 0.0, 0.0, 48.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 26.26], ["burping, eructation", 14.17], ["speech", 5.18]], null, null, null, null, null, null, [["noise", 18.82], ["whale vocalization", 14.95], ["hum", 12.18]], null, null, [["speech", 47.35], ["hum", 11.26], ["mains hum", 8.43]]], "duration": [1.06, 1.04, 0.73, 1.22, 0.58, 0.0, 1.66, 1.7, 0.91, 0.4, 0.61, 1.12, 2.01, 1.61, 0.99, 1.06, 6.69, 0.67, 4.02, 1.54, 0.73, 2.01, 0.51, 1.79, 0.9, 2.28, 0.44, 1.23, 3.23]} \ No newline at end of file diff --git a/annotations_filtered/iB25eDhWImc_filtered.json b/annotations_filtered/iB25eDhWImc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5439c523141ee56190bb80175c879df7c2157c7a --- /dev/null +++ b/annotations_filtered/iB25eDhWImc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 19.85], [37.0, 38.89], [39.0, 39.21], [56.0, 57.2], [74.0, 73.6], [76.0, 77.35], [79.0, 81.24]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.62], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [-0.15, 1.89, 0.21, 1.2, -0.4, 1.35, 2.24]} \ No newline at end of file diff --git a/annotations_filtered/iB8YcYRzDdE_filtered.json b/annotations_filtered/iB8YcYRzDdE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44df5d178bdd1f1c87b33d1a965e42199dbe5d9b --- /dev/null +++ b/annotations_filtered/iB8YcYRzDdE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.52], [4.0, 5.56], [6.0, 7.16], [8.0, 11.18], [12.0, 12.55], [14.0, 14.44], [17.0, 19.13], [20.0, 20.98], [22.0, 22.82], [25.0, 24.93], [27.0, 29.44], [30.0, 35.85], [38.0, 40.39], [41.0, 41.44], [43.0, 44.73], [45.0, 49.22], [50.0, 51.51], [53.0, 54.58], [55.0, 57.86], [59.0, 64.29], [75.0, 75.29], [78.0, 78.68], [79.0, 79.52], [80.0, 79.86], [81.0, 84.01], [86.0, 86.83], [89.0, 92.8], [93.0, 93.8], [98.0, 99.64], [102.0, 101.83], [103.0, 103.49], [104.0, 104.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 77.53, 0.0, 0.0, 0.0, 61.27, 83.52, 100.0, 0.0, 0.0, 98.86, 0.0, 0.0, 100.0, 95.09, 0.0, 0.0, 0.0, 0.0, 58.55, 0.0, 62.58, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.52, 1.56, 1.16, 3.18, 0.55, 0.44, 2.13, 0.98, 0.82, -0.07, 2.44, 5.85, 2.39, 0.44, 1.73, 4.22, 1.51, 1.58, 2.86, 5.29, 0.29, 0.68, 0.52, -0.14, 3.01, 0.83, 3.8, 0.8, 1.64, -0.17, 0.49, 0.04]} \ No newline at end of file diff --git a/annotations_filtered/iB8eR7GugQY_filtered.json b/annotations_filtered/iB8eR7GugQY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b27d5ff762e570bc839bcc7bdbdf841bc0a707d --- /dev/null +++ b/annotations_filtered/iB8eR7GugQY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.56], [17.0, 23.77], [30.0, 31.87], [33.0, 34.16], [38.0, 39.36], [42.0, 61.15], [63.0, 66.95], [68.0, 70.11], [71.0, 71.41]], "keep_status": [false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 45.92, 0.0, 0.0, 0.0, 37.2, 53.84, 56.25, 0.0], "audiomae_on_audioset": [null, [["music", 47.79], ["electronic music", 12.43], ["trance music", 8.33]], null, null, null, [["music", 52.03], ["hum", 8.5], ["electronic music", 8.03]], null, null, null], "duration": [0.56, 6.77, 1.87, 1.16, 1.36, 19.15, 3.95, 2.11, 0.41]} \ No newline at end of file diff --git a/annotations_filtered/iBRhat_CcQM_filtered.json b/annotations_filtered/iBRhat_CcQM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7861f3db4770a53f7597e00e5a8ac290e61c0aea --- /dev/null +++ b/annotations_filtered/iBRhat_CcQM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 8.13], [10.0, 10.54], [11.0, 17.49], [18.0, 19.79], [21.0, 22.44], [24.0, 25.35], [27.0, 74.28], [75.0, 77.57], [79.0, 97.85], [98.0, 119.04]], "keep_status": [false, false, false, false, false, false, false, false, true, false], "silence_prob": [29.5, 0.0, 55.6, 0.0, 0.0, 0.0, 0.0, 92.64, 35.48, 50.66], "audiomae_on_audioset": [[["speech", 37.41], ["music", 26.75], ["rumble", 9.44]], null, null, null, null, null, null, null, [["hum", 36.53], ["mains hum", 15.78], ["animal", 4.67]], null], "duration": [6.13, 0.54, 6.49, 1.79, 1.44, 1.35, 47.28, 2.57, 18.85, 21.04]} \ No newline at end of file diff --git a/annotations_filtered/iBSLBl-64fk_filtered.json b/annotations_filtered/iBSLBl-64fk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41a03a932cf84d3522f371e68cfbde21c1440ee7 --- /dev/null +++ b/annotations_filtered/iBSLBl-64fk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.5], [11.0, 12.39], [15.0, 41.4], [43.0, 46.58], [47.0, 72.57]], "keep_status": [false, false, true, false, true], "silence_prob": [0.0, 0.0, 35.04, 38.3, 47.01], "audiomae_on_audioset": [null, null, [["music", 61.12], ["pant", 6.18], ["synthesizer", 2.47]], [["didgeridoo", 37.18], ["music", 29.0], ["speech", 12.62]], [["music", 25.53], ["hum", 12.23], ["fly, housefly", 9.87]]], "duration": [1.5, 1.39, 26.4, 3.58, 25.57]} \ No newline at end of file diff --git a/annotations_filtered/iBSRk-DbhRw_filtered.json b/annotations_filtered/iBSRk-DbhRw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d0e6409e3b7848d23da92ecc35992c591c77360 --- /dev/null +++ b/annotations_filtered/iBSRk-DbhRw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.89], [6.0, 9.26], [10.0, 11.84], [13.0, 14.45], [15.0, 17.04], [18.0, 19.63], [20.0, 22.11], [23.0, 26.69], [27.0, 27.87], [29.0, 31.24], [33.0, 34.11], [38.0, 38.85], [41.0, 42.74], [44.0, 55.04], [56.0, 59.02], [61.0, 61.47], [63.0, 63.64], [65.0, 65.58], [70.0, 75.63], [78.0, 80.67], [82.0, 83.02], [84.0, 84.67], [86.0, 87.62], [89.0, 91.34], [93.0, 95.39], [97.0, 98.25], [100.0, 100.11], [101.0, 102.44], [104.0, 104.55], [105.0, 106.25], [109.0, 110.59], [112.0, 113.68], [117.0, 118.66], [119.0, 125.9], [127.0, 134.54], [135.0, 135.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 89.54, 0.0, 0.0, 63.74, 0.0, 100.0, 66.03, 0.0, 99.99, 0.0, 0.0, 0.0, 98.51, 100.0, 0.0, 0.0, 0.0, 81.35, 100.0, 0.0, 0.0, 0.0, 100.0, 92.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 99.94, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 3.26, 1.84, 1.45, 2.04, 1.63, 2.11, 3.69, 0.87, 2.24, 1.11, 0.85, 1.74, 11.04, 3.02, 0.47, 0.64, 0.58, 5.63, 2.67, 1.02, 0.67, 1.62, 2.34, 2.39, 1.25, 0.11, 1.44, 0.55, 1.25, 1.59, 1.68, 1.66, 6.9, 7.54, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/iBaUUJOO6V8_filtered.json b/annotations_filtered/iBaUUJOO6V8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a47cb12538745e7db860f78ee6c2295a0d6db0cf --- /dev/null +++ b/annotations_filtered/iBaUUJOO6V8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.91], [16.0, 17.37], [18.0, 19.6], [21.0, 21.3], [22.0, 24.19], [26.0, 29.46], [32.0, 34.97], [36.0, 41.1], [42.0, 42.72], [43.0, 44.59], [46.0, 47.17], [50.0, 51.44], [53.0, 55.16], [62.0, 62.38], [63.0, 63.73], [65.0, 83.62], [85.0, 86.36], [88.0, 90.09], [92.0, 95.45], [97.0, 101.49], [102.0, 103.89], [105.0, 114.67], [115.0, 126.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.92, 99.9, 99.62, 94.95, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 41.42, 0.0, 100.0, 99.84, 100.0, 0.0, 31.72, 76.53], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["thunk", 35.16], ["whack, thwack", 12.05], ["noise", 11.67]], null, null, null, null, null, [["music", 34.73], ["speech", 28.1], ["wind instrument, woodwind instrument", 12.26]], null], "duration": [0.91, 1.37, 1.6, 0.3, 2.19, 3.46, 2.97, 5.1, 0.72, 1.59, 1.17, 1.44, 2.16, 0.38, 0.73, 18.62, 1.36, 2.09, 3.45, 4.49, 1.89, 9.67, 11.77]} \ No newline at end of file diff --git a/annotations_filtered/iBbWqmzzKMU_filtered.json b/annotations_filtered/iBbWqmzzKMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f8dbe2e13f6a274adc1c810ac7fd0fcd4a08da9 --- /dev/null +++ b/annotations_filtered/iBbWqmzzKMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.17], [5.0, 5.88], [8.0, 8.5], [11.0, 10.81], [13.0, 16.41], [23.0, 23.41], [24.0, 24.38], [26.0, 26.22], [27.0, 27.65], [29.0, 30.69], [32.0, 33.71], [35.0, 36.34], [39.0, 41.57], [45.0, 44.66], [46.0, 46.16], [49.0, 49.52], [53.0, 53.23], [54.0, 56.84], [57.0, 57.72], [58.0, 59.83], [62.0, 62.18], [66.0, 67.54], [70.0, 71.96], [77.0, 77.41], [82.0, 82.36], [85.0, 85.5], [87.0, 87.45], [89.0, 91.02], [94.0, 95.05]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [32.34, 0.0, 0.0, 0.0, 37.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.05, 0.0, 0.0, 0.0, 0.0, 36.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.54, 0.0], "audiomae_on_audioset": [[["synthesizer", 28.04], ["music", 27.09], ["speech", 12.67]], null, null, null, [["speech", 68.08], ["hum", 7.91], ["mains hum", 5.18]], null, null, null, null, null, null, null, [["sine wave", 39.34], ["chirp tone", 23.74], ["tuning fork", 10.66]], null, null, null, null, [["music", 49.71], ["effects unit", 7.96], ["synthesizer", 5.3]], null, null, null, null, null, null, null, null, null, [["hum", 18.79], ["sine wave", 11.63], ["mains hum", 10.62]], null], "duration": [2.17, 0.88, 0.5, -0.19, 3.41, 0.41, 0.38, 0.22, 0.65, 1.69, 1.71, 1.34, 2.57, -0.34, 0.16, 0.52, 0.23, 2.84, 0.72, 1.83, 0.18, 1.54, 1.96, 0.41, 0.36, 0.5, 0.45, 2.02, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/iBptyagVaEQ_filtered.json b/annotations_filtered/iBptyagVaEQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b32bb220dfa3d981fae4b0e8e6b5a64bed92b0e4 --- /dev/null +++ b/annotations_filtered/iBptyagVaEQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 23.36], [24.0, 26.76], [28.0, 33.61], [36.0, 44.14], [46.0, 51.12], [52.0, 73.16], [74.0, 90.61], [91.0, 99.67]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [97.64, 98.1, 96.42, 97.83, 97.83, 97.11, 93.45, 95.23], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [6.36, 2.76, 5.61, 8.14, 5.12, 21.16, 16.61, 8.67]} \ No newline at end of file diff --git a/annotations_filtered/iCfBiIzWG9g_filtered.json b/annotations_filtered/iCfBiIzWG9g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6dd2d82bd98d194814d43ab34c8260537769972d --- /dev/null +++ b/annotations_filtered/iCfBiIzWG9g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.13], [3.0, 3.38], [5.0, 5.41], [6.0, 8.82], [10.0, 10.34], [11.0, 12.19], [13.0, 14.2], [16.0, 16.17], [20.0, 20.61], [27.0, 30.42], [31.0, 31.89], [32.0, 34.23], [37.0, 37.18], [48.0, 48.02], [49.0, 50.19], [51.0, 61.96], [62.0, 68.55], [70.0, 70.68], [73.0, 73.06], [80.0, 84.1], [88.0, 88.5], [89.0, 88.72], [89.0, 89.31], [90.0, 90.53], [91.0, 91.66], [92.0, 94.8], [97.0, 97.28], [98.0, 98.27], [107.0, 107.06], [108.0, 110.25], [116.0, 116.04], [117.0, 117.42], [118.0, 118.64], [120.0, 120.73], [121.0, 122.44], [123.0, 125.58], [126.0, 127.87]], "keep_status": [false, false, false, true, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 32.47, 0.0, 0.0, 0.0, 0.0, 0.0, 33.15, 0.0, 33.39, 0.0, 0.0, 0.0, 33.21, 32.38, 0.0, 0.0, 33.5, 0.0, 0.0, 0.0, 0.0, 0.0, 39.61, 0.0, 0.0, 0.0, 48.1, 0.0, 0.0, 0.0, 0.0, 0.0, 43.4, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 32.46], ["speech", 16.16], ["throbbing", 10.94]], null, null, null, null, null, [["music", 24.27], ["cattle, bovinae", 16.26], ["moo", 14.93]], null, [["music", 31.54], ["throbbing", 12.58], ["hum", 11.34]], null, null, null, [["music", 82.89], ["electronic music", 4.54], ["throbbing", 2.07]], [["music", 57.22], ["throbbing", 21.01], ["hum", 3.42]], null, null, [["music", 66.84], ["throbbing", 10.29], ["hum", 5.0]], null, null, null, null, null, [["didgeridoo", 53.54], ["music", 21.58], ["hum", 4.38]], null, null, null, [["fly, housefly", 56.22], ["insect", 20.67], ["mosquito", 8.0]], null, null, null, null, null, [["hum", 22.98], ["music", 18.92], ["mains hum", 15.6]], null], "duration": [0.13, 0.38, 0.41, 2.82, 0.34, 1.19, 1.2, 0.17, 0.61, 3.42, 0.89, 2.23, 0.18, 0.02, 1.19, 10.96, 6.55, 0.68, 0.06, 4.1, 0.5, -0.28, 0.31, 0.53, 0.66, 2.8, 0.28, 0.27, 0.06, 2.25, 0.04, 0.42, 0.64, 0.73, 1.44, 2.58, 1.87]} \ No newline at end of file diff --git a/annotations_filtered/iCfjoSbWHZM_filtered.json b/annotations_filtered/iCfjoSbWHZM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01af625d4e84df6cc6d6f6146575d1a7c3e43ecc --- /dev/null +++ b/annotations_filtered/iCfjoSbWHZM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 24.95], [25.0, 28.93], [34.0, 34.25]], "keep_status": [false, false, false], "silence_prob": [31.14, 42.33, 0.0], "audiomae_on_audioset": [[["music", 62.16], ["sidetone", 5.1], ["electronic music", 2.85]], [["speech", 60.43], ["music", 8.85], ["sidetone", 5.81]], null], "duration": [9.95, 3.93, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/iClIIg_YtAk_filtered.json b/annotations_filtered/iClIIg_YtAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e19fd0d926ccc8a1cc9f29d09b0191eb65c13569 --- /dev/null +++ b/annotations_filtered/iClIIg_YtAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.54], [4.0, 5.17], [6.0, 6.61], [9.0, 9.07], [10.0, 11.2], [13.0, 13.68], [15.0, 16.16], [19.0, 19.67], [23.0, 24.06], [26.0, 26.7], [28.0, 31.16], [33.0, 36.24], [38.0, 40.17], [42.0, 42.69], [44.0, 44.34], [46.0, 46.6], [48.0, 48.64], [51.0, 50.65], [53.0, 54.38], [56.0, 57.86], [60.0, 61.38], [65.0, 65.33], [67.0, 68.05], [71.0, 73.41], [74.0, 74.98], [78.0, 78.58], [81.0, 81.06], [83.0, 83.07], [84.0, 84.62], [89.0, 89.5], [93.0, 93.8], [97.0, 97.41], [98.0, 100.09], [100.0, 101.12], [104.0, 104.01], [105.0, 105.14], [107.0, 107.28], [109.0, 110.1], [114.0, 115.35], [117.0, 118.07], [119.0, 119.23], [122.0, 123.94], [126.0, 127.5], [128.0, 128.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.14, 50.97, 47.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["hum", 19.99], ["noise", 9.0], ["throbbing", 5.69]], null, [["music", 47.12], ["didgeridoo", 9.97], ["whale vocalization", 5.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 24.4], ["didgeridoo", 11.86], ["music", 11.6]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.54, 1.17, 0.61, 0.07, 1.2, 0.68, 1.16, 0.67, 1.06, 0.7, 3.16, 3.24, 2.17, 0.69, 0.34, 0.6, 0.64, -0.35, 1.38, 1.86, 1.38, 0.33, 1.05, 2.41, 0.98, 0.58, 0.06, 0.07, 0.62, 0.5, 0.8, 0.41, 2.09, 1.12, 0.01, 0.14, 0.28, 1.1, 1.35, 1.07, 0.23, 1.94, 1.5, 0.36]} \ No newline at end of file diff --git a/annotations_filtered/iCp3nEO3ttU_filtered.json b/annotations_filtered/iCp3nEO3ttU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60e54a16fa05edaf292fa88b3188d7d559059697 --- /dev/null +++ b/annotations_filtered/iCp3nEO3ttU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.46], [15.0, 15.72], [27.0, 26.99], [30.0, 31.46], [34.0, 34.15], [36.0, 37.12], [43.0, 43.11], [44.0, 44.31], [49.0, 50.28], [57.0, 57.75], [66.0, 73.89], [89.0, 89.36], [90.0, 96.08], [98.0, 103.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.24, 0.0, 40.86, 38.38], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 51.74], ["whip", 25.93], ["groan", 2.48]], null, [["speech", 63.8], ["thunk", 7.28], ["music", 4.53]], [["speech", 74.1], ["didgeridoo", 3.51], ["music", 3.23]]], "duration": [1.46, 0.72, -0.01, 1.46, 0.15, 1.12, 0.11, 0.31, 1.28, 0.75, 7.89, 0.36, 6.08, 5.18]} \ No newline at end of file diff --git a/annotations_filtered/iD4lY0brr60_filtered.json b/annotations_filtered/iD4lY0brr60_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e16a6d7099cc2d48b8887fc6d2a71255d43ee34b --- /dev/null +++ b/annotations_filtered/iD4lY0brr60_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 27.73], [30.0, 73.77], [77.0, 108.94]], "keep_status": [true, false, false], "silence_prob": [30.45, 0.0, 0.0], "audiomae_on_audioset": [[["music", 52.2], ["musical instrument", 8.33], ["brass instrument", 7.6]], null, null], "duration": [6.73, 43.77, 31.94]} \ No newline at end of file diff --git a/annotations_filtered/iD9tENbIPHg_filtered.json b/annotations_filtered/iD9tENbIPHg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b695184b47f19d367705f77859134b325aaaf725 --- /dev/null +++ b/annotations_filtered/iD9tENbIPHg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 26.11], [37.0, 37.13], [41.0, 43.06], [45.0, 45.69], [59.0, 67.86], [70.0, 71.93], [76.0, 76.87], [78.0, 81.99]], "keep_status": [false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 93.76, 0.0, 48.48, 0.0, 0.0, 38.67], "audiomae_on_audioset": [null, null, null, null, [["speech", 59.78], ["hum", 14.27], ["throbbing", 5.95]], null, null, [["chime", 25.98], ["wind chime", 25.44], ["music", 13.47]]], "duration": [1.11, 0.13, 2.06, 0.69, 8.86, 1.93, 0.87, 3.99]} \ No newline at end of file diff --git a/annotations_filtered/iDnE3PV4YNc_filtered.json b/annotations_filtered/iDnE3PV4YNc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd272334f2a9d9142ff8981bd01d0430001555a3 --- /dev/null +++ b/annotations_filtered/iDnE3PV4YNc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.6], [5.0, 7.5], [9.0, 10.15], [12.0, 18.49], [20.0, 21.83], [23.0, 24.92], [26.0, 27.01], [29.0, 38.38], [43.0, 43.46], [45.0, 45.35], [51.0, 51.63], [55.0, 55.44], [57.0, 62.5], [63.0, 69.62], [70.0, 81.35], [83.0, 89.75], [93.0, 97.33], [98.0, 98.63], [101.0, 100.85], [102.0, 103.84], [108.0, 108.9], [112.0, 116.7], [119.0, 129.95]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true, true, true, true, false, false, false, false, false, true, true], "silence_prob": [0.0, 41.83, 0.0, 40.28, 0.0, 0.0, 0.0, 38.22, 0.0, 0.0, 0.0, 0.0, 42.26, 29.14, 29.59, 30.57, 48.19, 0.0, 0.0, 0.0, 0.0, 27.9, 28.48], "audiomae_on_audioset": [null, [["speech", 57.59], ["music", 14.68], ["sidetone", 3.59]], null, [["music", 35.84], ["hum", 14.51], ["throbbing", 11.16]], null, null, null, [["music", 54.63], ["hum", 14.04], ["mains hum", 6.63]], null, null, null, null, [["speech", 29.01], ["music", 22.72], ["hum", 8.43]], [["speech", 23.44], ["music", 20.54], ["rumble", 19.28]], [["music", 39.29], ["speech", 16.64], ["sound effect", 4.57]], [["music", 14.36], ["crack", 11.33], ["speech", 10.97]], [["theremin", 42.57], ["music", 36.77], ["synthesizer", 4.75]], null, null, null, null, [["music", 19.89], ["zipper (clothing)", 18.75], ["mosquito", 13.49]], [["mains hum", 27.65], ["hum", 23.95], ["electric shaver, electric razor", 12.47]]], "duration": [1.6, 2.5, 1.15, 6.49, 1.83, 1.92, 1.01, 9.38, 0.46, 0.35, 0.63, 0.44, 5.5, 6.62, 11.35, 6.75, 4.33, 0.63, -0.15, 1.84, 0.9, 4.7, 10.95]} \ No newline at end of file diff --git a/annotations_filtered/iE9CEAzLPKg_filtered.json b/annotations_filtered/iE9CEAzLPKg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..233fea40d17b7a556a74db5f1499706ba65311a6 --- /dev/null +++ b/annotations_filtered/iE9CEAzLPKg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 33.47], [36.0, 45.35], [46.0, 46.74], [48.0, 47.7], [49.0, 49.08], [51.0, 64.34], [66.0, 68.66], [69.0, 77.13], [80.0, 82.9], [87.0, 89.29], [91.0, 103.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 100.0, 0.0, 0.0, 0.0, 100.0, 100.0, 99.97, 100.0, 99.98, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [3.47, 9.35, 0.74, -0.3, 0.08, 13.34, 2.66, 8.13, 2.9, 2.29, 12.0]} \ No newline at end of file diff --git a/annotations_filtered/iEattbpjGG4_filtered.json b/annotations_filtered/iEattbpjGG4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75577d57dbf166cb44aebca727110a226086fd8d --- /dev/null +++ b/annotations_filtered/iEattbpjGG4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.46], [28.0, 31.28], [31.0, 31.31], [31.0, 31.35], [34.0, 33.76], [34.0, 33.83], [42.0, 42.3], [43.0, 54.92], [55.0, 56.15], [79.0, 79.56], [90.0, 90.69]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 42.53, 0.0, 0.0, 0.0, 0.0, 0.0, 34.89, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 27.49], ["hum", 16.69], ["music", 10.81]], null, null, null, null, null, [["speech", 37.3], ["music", 35.38], ["animal", 3.27]], null, null, null], "duration": [1.46, 3.28, 0.31, 0.35, -0.24, -0.17, 0.3, 11.92, 1.15, 0.56, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/iErVeElswus_filtered.json b/annotations_filtered/iErVeElswus_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8774e6a5661ca0ad80dc199d1cfb40b2e7832a52 --- /dev/null +++ b/annotations_filtered/iErVeElswus_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.8], [8.0, 9.39], [13.0, 13.71], [19.0, 28.09], [28.0, 31.87], [33.0, 44.59], [45.0, 45.57], [47.0, 61.75], [63.0, 64.27], [65.0, 66.12], [69.0, 70.58], [71.0, 78.63], [79.0, 80.55], [82.0, 84.28], [85.0, 86.86], [88.0, 93.33], [94.0, 131.31]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 89.19, 98.51, 77.87, 0.0, 46.9, 0.0, 0.0, 0.0, 73.36, 0.0, 62.58, 0.0, 59.42, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["singing bowl", 28.09], ["speech", 27.43], ["hum", 8.78]], null, null, null, null, null, null, null, null, null], "duration": [0.8, 1.39, 0.71, 9.09, 3.87, 11.59, 0.57, 14.75, 1.27, 1.12, 1.58, 7.63, 1.55, 2.28, 1.86, 5.33, 37.31]} \ No newline at end of file diff --git a/annotations_filtered/iFEr1xsuksI_filtered.json b/annotations_filtered/iFEr1xsuksI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d399f8bbe55e5adb1add3c0a1c9634ef10de9e4 --- /dev/null +++ b/annotations_filtered/iFEr1xsuksI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.64], [20.0, 20.95], [28.0, 28.17], [31.0, 32.07], [33.0, 34.16], [37.0, 36.86], [40.0, 40.69], [44.0, 44.9], [47.0, 47.68], [48.0, 49.13], [50.0, 50.43], [52.0, 54.18], [59.0, 71.96], [73.0, 74.12], [78.0, 79.19], [80.0, 83.79], [85.0, 84.96], [96.0, 97.14], [98.0, 98.69], [101.0, 102.07], [107.0, 132.63], [133.0, 133.42], [137.0, 150.3], [153.0, 163.27], [163.0, 163.39], [169.0, 169.32], [171.0, 171.56], [174.0, 173.91], [176.0, 176.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 99.65, 0.0, 0.0, 66.51, 0.0, 0.0, 0.0, 0.0, 33.21, 0.0, 34.2, 32.98, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 45.79], ["speech", 19.63], ["fart", 8.68]], null, [["music", 34.5], ["hum", 16.1], ["speech", 13.97]], [["music", 57.04], ["speech", 26.7], ["hum", 2.51]], null, null, null, null, null], "duration": [0.64, 0.95, 0.17, 1.07, 1.16, -0.14, 0.69, 0.9, 0.68, 1.13, 0.43, 2.18, 12.96, 1.12, 1.19, 3.79, -0.04, 1.14, 0.69, 1.07, 25.63, 0.42, 13.3, 10.27, 0.39, 0.32, 0.56, -0.09, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/iFKyzbCLQQA_filtered.json b/annotations_filtered/iFKyzbCLQQA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7c71261f604ff0c138f01c5b011cd07b9127198 --- /dev/null +++ b/annotations_filtered/iFKyzbCLQQA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.77], [6.0, 6.13], [7.0, 7.87], [10.0, 13.27], [15.0, 16.41], [18.0, 18.82], [24.0, 24.93], [27.0, 27.55], [29.0, 29.13], [31.0, 31.46], [33.0, 35.56], [38.0, 38.89], [40.0, 41.47], [43.0, 43.97], [45.0, 46.55], [48.0, 48.78], [50.0, 50.9], [51.0, 50.97], [53.0, 53.33], [54.0, 57.25], [58.0, 62.28], [73.0, 72.87], [84.0, 84.67], [96.0, 96.6], [99.0, 99.59], [100.0, 100.57], [102.0, 101.92], [106.0, 110.86], [112.0, 118.34], [121.0, 121.73], [124.0, 124.39], [125.0, 126.1], [127.0, 127.77], [129.0, 129.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.43, 75.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.21, 84.43, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.77, 0.13, 0.87, 3.27, 1.41, 0.82, 0.93, 0.55, 0.13, 0.46, 2.56, 0.89, 1.47, 0.97, 1.55, 0.78, 0.9, -0.03, 0.33, 3.25, 4.28, -0.13, 0.67, 0.6, 0.59, 0.57, -0.08, 4.86, 6.34, 0.73, 0.39, 1.1, 0.77, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/iF_053JQnQE_filtered.json b/annotations_filtered/iF_053JQnQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b5f2045219722656360ea78e051af56ad466b68 --- /dev/null +++ b/annotations_filtered/iF_053JQnQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.8], [21.0, 21.96], [33.0, 34.28], [45.0, 45.74], [59.0, 59.05], [74.0, 73.94], [79.0, 78.81], [88.0, 90.96], [95.0, 95.66], [97.0, 97.65], [102.0, 101.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.65, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.8, 0.96, 1.28, 0.74, 0.05, -0.06, -0.19, 2.96, 0.66, 0.65, -0.29]} \ No newline at end of file diff --git a/annotations_filtered/iFnPpSNqKYU_filtered.json b/annotations_filtered/iFnPpSNqKYU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33c2d7ed63fc3fdf66261dba3b8b531003a2f621 --- /dev/null +++ b/annotations_filtered/iFnPpSNqKYU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 66.36], [72.0, 73.5], [80.0, 79.59], [82.0, 82.81], [83.0, 89.14], [95.0, 121.22]], "keep_status": [false, false, false, false, false, true], "silence_prob": [33.46, 0.0, 0.0, 0.0, 30.79, 31.14], "audiomae_on_audioset": [[["music", 48.09], ["theremin", 13.51], ["gong", 8.64]], null, null, null, [["music", 77.53], ["musical instrument", 6.07], ["synthesizer", 4.07]], [["music", 33.8], ["livestock, farm animals, working animals", 13.57], ["sheep", 11.73]]], "duration": [22.36, 1.5, -0.41, 0.81, 6.14, 26.22]} \ No newline at end of file diff --git a/annotations_filtered/iFpB2_WOk0Q_filtered.json b/annotations_filtered/iFpB2_WOk0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f233949061a40ce0d652040bf0b9abb45824a19 --- /dev/null +++ b/annotations_filtered/iFpB2_WOk0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.41], [7.0, 7.2], [9.0, 9.8], [13.0, 13.02], [14.0, 14.32], [20.0, 23.5], [24.0, 24.43], [26.0, 26.62], [27.0, 32.36], [33.0, 34.87], [36.0, 36.96], [38.0, 38.52], [39.0, 39.82], [41.0, 40.85], [45.0, 46.35], [48.0, 48.79], [52.0, 52.79], [54.0, 54.77], [56.0, 56.69], [57.0, 58.58], [61.0, 61.28], [62.0, 62.01], [65.0, 64.96], [66.0, 67.34], [68.0, 68.62], [74.0, 75.19], [81.0, 81.5], [84.0, 84.84], [87.0, 87.32], [91.0, 91.45], [92.0, 92.64], [95.0, 96.31], [98.0, 100.79], [105.0, 106.76], [107.0, 125.37], [126.0, 127.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 57.56, 0.0, 0.0, 97.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 72.31, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.41, 0.2, 0.8, 0.02, 0.32, 3.5, 0.43, 0.62, 5.36, 1.87, 0.96, 0.52, 0.82, -0.15, 1.35, 0.79, 0.79, 0.77, 0.69, 1.58, 0.28, 0.01, -0.04, 1.34, 0.62, 1.19, 0.5, 0.84, 0.32, 0.45, 0.64, 1.31, 2.79, 1.76, 18.37, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/iG4GVhx6oGc_filtered.json b/annotations_filtered/iG4GVhx6oGc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb648ce7d1497317177fd14f2ec1369287a0c066 --- /dev/null +++ b/annotations_filtered/iG4GVhx6oGc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [22.0, 25.32], [34.0, 34.69], [36.0, 37.77], [41.0, 41.45], [48.0, 49.15], [50.0, 50.4], [51.0, 52.02], [55.0, 57.08], [66.0, 67.29], [70.0, 70.92], [88.0, 87.94], [89.0, 89.7], [90.0, 92.38], [96.0, 96.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 67.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.36, 0.0, 0.0, 0.0, 0.0, 74.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 3.32, 0.69, 1.77, 0.45, 1.15, 0.4, 1.02, 2.08, 1.29, 0.92, -0.06, 0.7, 2.38, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/iG5M3WSF1DY_filtered.json b/annotations_filtered/iG5M3WSF1DY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..797f90cdf0bdc7b5ba77212e26dedc333309397d --- /dev/null +++ b/annotations_filtered/iG5M3WSF1DY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.17], [10.0, 10.62], [11.0, 17.54], [19.0, 20.02], [22.0, 26.13], [28.0, 29.08], [30.0, 32.1], [35.0, 40.85], [42.0, 43.85], [46.0, 47.51], [50.0, 66.77], [68.0, 71.09], [72.0, 73.03], [74.0, 76.18], [77.0, 77.95], [79.0, 80.54], [82.0, 88.97], [91.0, 91.45], [94.0, 95.23], [96.0, 99.22], [100.0, 101.53], [104.0, 110.44], [112.0, 112.5], [117.0, 145.99], [149.0, 150.42], [152.0, 153.45]], "keep_status": [false, false, true, false, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 34.16, 0.0, 35.57, 0.0, 35.26, 29.45, 0.0, 0.0, 40.48, 94.37, 0.0, 40.17, 0.0, 0.0, 61.18, 0.0, 0.0, 58.13, 0.0, 29.96, 0.0, 31.72, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["livestock, farm animals, working animals", 22.1], ["cattle, bovinae", 20.15], ["moo", 12.1]], null, [["hum", 46.99], ["mains hum", 25.02], ["throbbing", 19.48]], null, [["speech", 56.38], ["vehicle", 6.31], ["music", 2.62]], [["music", 21.47], ["speech", 16.82], ["whip", 6.23]], null, null, [["music", 45.09], ["hum", 9.03], ["throbbing", 4.82]], null, null, [["speech", 45.14], ["fart", 37.06], ["music", 2.04]], null, null, null, null, null, null, null, [["music", 31.17], ["speech", 25.55], ["theremin", 2.18]], null, [["music", 18.23], ["thump, thud", 7.1], ["whack, thwack", 6.4]], null, null], "duration": [1.17, 0.62, 6.54, 1.02, 4.13, 1.08, 2.1, 5.85, 1.85, 1.51, 16.77, 3.09, 1.03, 2.18, 0.95, 1.54, 6.97, 0.45, 1.23, 3.22, 1.53, 6.44, 0.5, 28.99, 1.42, 1.45]} \ No newline at end of file diff --git a/annotations_filtered/iG5oSrAW9FQ_filtered.json b/annotations_filtered/iG5oSrAW9FQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6376f3dcfc6762fc3390c6293bfda4f6bf7d999d --- /dev/null +++ b/annotations_filtered/iG5oSrAW9FQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 46.45], [48.0, 90.14], [90.0, 92.5], [95.0, 107.38]], "keep_status": [true, false, false, true], "silence_prob": [30.4, 0.0, 30.75, 38.83], "audiomae_on_audioset": [[["music", 55.97], ["didgeridoo", 8.66], ["cattle, bovinae", 3.3]], null, [["speech", 59.65], ["buzzer", 14.96], ["music", 5.55]], [["cattle, bovinae", 18.97], ["moo", 14.52], ["sidetone", 10.94]]], "duration": [6.45, 42.14, 2.5, 12.38]} \ No newline at end of file diff --git a/annotations_filtered/iGIooJXEu9E_filtered.json b/annotations_filtered/iGIooJXEu9E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f44e8e8170eaeb9294335343034543d3ab13cde --- /dev/null +++ b/annotations_filtered/iGIooJXEu9E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.97], [7.0, 8.51], [10.0, 10.66], [12.0, 12.51], [15.0, 16.21], [16.0, 17.34], [18.0, 18.35], [19.0, 24.46], [26.0, 26.81], [28.0, 29.96], [33.0, 33.07], [34.0, 34.72], [41.0, 41.79], [43.0, 43.31], [44.0, 47.01], [50.0, 53.72], [56.0, 57.79], [59.0, 60.02], [62.0, 62.97], [65.0, 70.56], [71.0, 73.47], [74.0, 74.87], [78.0, 77.99], [78.0, 78.78], [83.0, 82.66], [83.0, 84.87], [86.0, 86.09], [91.0, 92.85], [96.0, 97.02], [103.0, 103.49], [105.0, 105.71], [107.0, 108.36], [111.0, 111.28], [112.0, 112.92], [115.0, 118.79], [121.0, 121.71], [124.0, 126.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.82, 96.66, 0.0, 0.0, 0.0, 34.94, 31.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.2, 0.0, 56.63], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 37.03], ["music", 25.71], ["stomach rumble", 9.07]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 34.25], ["electric shaver, electric razor", 31.32], ["buzz", 9.41]], [["music", 29.84], ["speech", 19.95], ["electric shaver, electric razor", 13.72]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 24.44], ["cattle, bovinae", 16.46], ["music", 13.11]], null, null], "duration": [1.97, 1.51, 0.66, 0.51, 1.21, 1.34, 0.35, 5.46, 0.81, 1.96, 0.07, 0.72, 0.79, 0.31, 3.01, 3.72, 1.79, 1.02, 0.97, 5.56, 2.47, 0.87, -0.01, 0.78, -0.34, 1.87, 0.09, 1.85, 1.02, 0.49, 0.71, 1.36, 0.28, 0.92, 3.79, 0.71, 2.08]} \ No newline at end of file diff --git a/annotations_filtered/iGJCWeK7YCA_filtered.json b/annotations_filtered/iGJCWeK7YCA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20c2ea29826bfab7418e628b2a00b454e627edda --- /dev/null +++ b/annotations_filtered/iGJCWeK7YCA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.02], [14.0, 16.16], [19.0, 19.58], [20.0, 20.82], [22.0, 23.62], [27.0, 38.75], [44.0, 46.4], [47.0, 48.93], [53.0, 55.93], [56.0, 58.04]], "keep_status": [false, true, false, false, false, false, false, false, false, false], "silence_prob": [55.46, 43.23, 0.0, 0.0, 0.0, 38.03, 74.13, 0.0, 42.08, 34.65], "audiomae_on_audioset": [null, [["music", 43.94], ["musical instrument", 5.93], ["throbbing", 4.52]], null, null, null, [["music", 38.67], ["synthesizer", 20.96], ["musical instrument", 10.51]], null, null, [["music", 65.87], ["musical instrument", 3.63], ["electronic music", 3.61]], [["music", 58.38], ["speech", 9.22], ["electronic music", 4.29]]], "duration": [2.02, 2.16, 0.58, 0.82, 1.62, 11.75, 2.4, 1.93, 2.93, 2.04]} \ No newline at end of file diff --git a/annotations_filtered/iGVsptoMsKE_filtered.json b/annotations_filtered/iGVsptoMsKE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..68232e726d5d899036be4b5d37c4879672d0aa72 --- /dev/null +++ b/annotations_filtered/iGVsptoMsKE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.59], [14.0, 14.67], [19.0, 31.35], [34.0, 43.11], [44.0, 44.74], [46.0, 94.96], [97.0, 105.93], [107.0, 107.43], [110.0, 110.74], [111.0, 112.97], [118.0, 118.15], [118.0, 119.37], [122.0, 129.84], [131.0, 142.26], [154.0, 154.99], [160.0, 160.79], [166.0, 175.05]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 35.73, 36.98, 0.0, 0.0, 30.01, 0.0, 0.0, 0.0, 0.0, 0.0, 30.04, 30.4, 0.0, 0.0, 31.7], "audiomae_on_audioset": [null, null, [["music", 48.66], ["fart", 7.24], ["hum", 5.22]], [["music", 71.57], ["wild animals", 7.95], ["animal", 4.3]], null, null, [["music", 43.11], ["hum", 12.51], ["theremin", 6.59]], null, null, null, null, null, [["music", 43.19], ["theremin", 35.74], ["speech", 2.43]], [["music", 61.32], ["theremin", 21.29], ["ambient music", 1.49]], null, null, [["music", 25.53], ["speech", 22.45], ["theremin", 9.75]]], "duration": [1.59, 0.67, 12.35, 9.11, 0.74, 48.96, 8.93, 0.43, 0.74, 1.97, 0.15, 1.37, 7.84, 11.26, 0.99, 0.79, 9.05]} \ No newline at end of file diff --git a/annotations_filtered/iGawlpfe6a0_filtered.json b/annotations_filtered/iGawlpfe6a0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73e4503191192b610f172ad6deafa863f46f66f9 --- /dev/null +++ b/annotations_filtered/iGawlpfe6a0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[53.0, 53.28], [66.0, 67.27], [84.0, 83.71], [87.0, 87.13], [88.0, 87.98]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.28, 1.27, -0.29, 0.13, -0.02]} \ No newline at end of file diff --git a/annotations_filtered/iGhEOyypT2A_filtered.json b/annotations_filtered/iGhEOyypT2A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9fb57b1a6a1458a310c2857180691a5577bd17e --- /dev/null +++ b/annotations_filtered/iGhEOyypT2A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 23.84], [25.0, 36.73], [40.0, 40.78], [44.0, 44.73], [54.0, 54.62], [60.0, 60.39], [62.0, 66.61], [67.0, 67.61], [68.0, 72.44]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 39.64, 0.0, 0.0, 0.0, 0.0, 46.86, 0.0, 72.31], "audiomae_on_audioset": [null, [["theremin", 36.06], ["music", 34.9], ["noise", 5.52]], null, null, null, null, [["wild animals", 61.12], ["animal", 13.89], ["roaring cats (lions, tigers)", 12.35]], null, null], "duration": [-0.16, 11.73, 0.78, 0.73, 0.62, 0.39, 4.61, 0.61, 4.44]} \ No newline at end of file diff --git a/annotations_filtered/iGk7QYThMTk_filtered.json b/annotations_filtered/iGk7QYThMTk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f74fa908bc549397220eb4f699f972e55596d4d --- /dev/null +++ b/annotations_filtered/iGk7QYThMTk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 34.38], [35.0, 36.07], [38.0, 71.15], [72.0, 88.05], [88.0, 118.0], [120.0, 143.94], [145.0, 144.96], [145.0, 145.25], [146.0, 151.34], [151.0, 151.38], [152.0, 161.65], [164.0, 168.12]], "keep_status": [true, false, false, false, false, false, false, false, true, false, true, true], "silence_prob": [39.54, 0.0, 0.0, 30.31, 29.42, 30.42, 0.0, 0.0, 30.94, 0.0, 29.72, 36.16], "audiomae_on_audioset": [[["music", 31.51], ["effects unit", 5.94], ["frog", 3.93]], null, null, [["music", 75.01], ["mains hum", 7.01], ["hum", 6.95]], [["music", 50.79], ["speech", 13.39], ["fireworks", 6.89]], [["music", 57.44], ["effects unit", 7.16], ["musical instrument", 6.24]], null, null, [["music", 61.86], ["mains hum", 3.93], ["hum", 3.51]], null, [["music", 55.59], ["speech", 9.44], ["buzz", 4.53]], [["speech", 44.88], ["music", 11.06], ["fly, housefly", 4.08]]], "duration": [2.38, 1.07, 33.15, 16.05, 30.0, 23.94, -0.04, 0.25, 5.34, 0.38, 9.65, 4.12]} \ No newline at end of file diff --git a/annotations_filtered/iGsce-w4TtY_filtered.json b/annotations_filtered/iGsce-w4TtY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddd9c10694396ec5705593091630c9c77f50f531 --- /dev/null +++ b/annotations_filtered/iGsce-w4TtY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.99], [17.0, 36.36], [39.0, 40.05], [41.0, 43.65], [45.0, 61.35], [65.0, 83.07], [84.0, 84.43], [85.0, 92.75], [94.0, 97.53], [100.0, 109.65], [110.0, 110.27], [110.0, 110.79], [111.0, 125.9]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, true], "silence_prob": [30.21, 30.83, 0.0, 31.07, 30.23, 30.99, 0.0, 30.05, 29.97, 30.89, 0.0, 0.0, 29.16], "audiomae_on_audioset": [[["cattle, bovinae", 30.26], ["moo", 20.86], ["livestock, farm animals, working animals", 19.28]], [["cattle, bovinae", 58.38], ["moo", 23.1], ["livestock, farm animals, working animals", 15.53]], null, [["music", 34.59], ["speech", 34.37], ["electronic music", 4.24]], [["speech", 32.31], ["explosion", 14.52], ["whack, thwack", 5.86]], [["speech", 43.59], ["fart", 32.67], ["music", 5.16]], null, [["explosion", 39.01], ["speech", 25.4], ["eruption", 8.03]], [["speech", 26.47], ["fart", 24.86], ["explosion", 19.57]], [["hum", 21.05], ["rumble", 10.63], ["speech", 8.85]], null, null, [["grunt", 11.85], ["music", 8.36], ["hum", 6.14]]], "duration": [2.99, 19.36, 1.05, 2.65, 16.35, 18.07, 0.43, 7.75, 3.53, 9.65, 0.27, 0.79, 14.9]} \ No newline at end of file diff --git a/annotations_filtered/iH9hjyoAugw_filtered.json b/annotations_filtered/iH9hjyoAugw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88a1af39f03f95cdbaa846568b4fd6a29ab2f5b9 --- /dev/null +++ b/annotations_filtered/iH9hjyoAugw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.14], [6.0, 8.09], [8.0, 8.78], [9.0, 11.1], [12.0, 16.23], [19.0, 21.15], [23.0, 22.92], [24.0, 24.93], [26.0, 28.12], [30.0, 46.74], [48.0, 54.63], [56.0, 89.18], [90.0, 92.74], [94.0, 96.31], [96.0, 96.4], [97.0, 97.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.16, 100.0, 0.0, 100.0, 100.0, 82.79, 0.0, 0.0, 99.99, 98.44, 64.29, 0.0, 69.47, 62.78, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.14, 2.09, 0.78, 2.1, 4.23, 2.15, -0.08, 0.93, 2.12, 16.74, 6.63, 33.18, 2.74, 2.31, 0.4, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/iHQZhYadNwQ_filtered.json b/annotations_filtered/iHQZhYadNwQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47e6cf46920bcdcf19f687b243661b9ac9f0d37a --- /dev/null +++ b/annotations_filtered/iHQZhYadNwQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 27.57], [28.0, 58.7], [62.0, 65.33], [66.0, 67.1], [68.0, 73.45], [74.0, 76.35], [77.0, 79.57], [80.0, 83.12], [84.0, 91.37], [93.0, 99.81], [101.0, 103.6], [106.0, 111.47], [113.0, 133.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [58.38, 0.0, 75.39, 0.0, 94.52, 96.66, 93.91, 93.91, 85.72, 96.29, 96.66, 82.07, 66.15], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.57, 30.7, 3.33, 1.1, 5.45, 2.35, 2.57, 3.12, 7.37, 6.81, 2.6, 5.47, 20.1]} \ No newline at end of file diff --git a/annotations_filtered/iHWOj17ISfk_filtered.json b/annotations_filtered/iHWOj17ISfk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a155fd8d2e053972da90b35b3398811f027d391b --- /dev/null +++ b/annotations_filtered/iHWOj17ISfk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.3], [16.0, 17.02], [18.0, 18.52], [28.0, 37.88], [44.0, 45.12], [46.0, 48.9], [49.0, 55.09], [62.0, 78.81], [80.0, 100.03], [103.0, 111.37]], "keep_status": [false, false, false, false, false, true, false, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 59.77, 0.0, 42.13, 54.04, 43.35, 31.59, 32.51], "audiomae_on_audioset": [null, null, null, null, null, [["music", 38.39], ["speech", 17.88], ["sneeze", 3.18]], null, [["speech", 33.46], ["music", 17.86], ["hum", 6.35]], [["glass", 12.96], ["siren", 10.56], ["breaking", 10.42]], [["music", 24.8], ["speech", 6.41], ["chink, clink", 6.18]]], "duration": [0.3, 1.02, 0.52, 9.88, 1.12, 2.9, 6.09, 16.81, 20.03, 8.37]} \ No newline at end of file diff --git a/annotations_filtered/iHheroBxkuE_filtered.json b/annotations_filtered/iHheroBxkuE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c0f04d16f78ac5ba3c10f19a0e38b52a24ef03c6 --- /dev/null +++ b/annotations_filtered/iHheroBxkuE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 4.95], [5.0, 5.09], [7.0, 7.77], [8.0, 8.72], [10.0, 10.56], [18.0, 17.88], [19.0, 33.2], [34.0, 33.93], [38.0, 39.36], [48.0, 48.98], [49.0, 50.36], [56.0, 55.88], [65.0, 65.15], [72.0, 75.68], [88.0, 89.26], [94.0, 96.5], [100.0, 100.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [75.55, 0.0, 0.0, 0.0, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.91, 0.0, 99.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.95, 0.09, 0.77, 0.72, 0.56, -0.12, 14.2, -0.07, 1.36, 0.98, 1.36, -0.12, 0.15, 3.68, 1.26, 2.5, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/iHllnWESLvY_filtered.json b/annotations_filtered/iHllnWESLvY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5dfd0a511bc04b3c79c817251ea1854e5475b87 --- /dev/null +++ b/annotations_filtered/iHllnWESLvY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.79], [3.0, 3.55], [5.0, 6.69], [8.0, 8.75], [10.0, 16.39], [18.0, 20.28], [21.0, 21.05], [32.0, 32.17], [34.0, 33.88], [35.0, 35.65], [42.0, 43.98], [45.0, 57.96], [58.0, 58.72], [61.0, 61.06], [62.0, 62.29], [65.0, 65.64], [66.0, 67.66], [68.0, 87.05], [92.0, 93.38], [94.0, 96.89], [99.0, 99.99], [101.0, 103.08], [105.0, 111.81], [112.0, 114.81], [116.0, 119.16], [121.0, 121.78], [123.0, 124.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 87.55, 86.09, 0.0, 0.0, 0.0, 0.0, 0.0, 85.9, 0.0, 0.0, 0.0, 0.0, 0.0, 44.99, 0.0, 85.17, 0.0, 99.44, 99.16, 92.48, 97.64, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 69.48], ["synthesizer", 6.85], ["gong", 4.84]], null, null, null, null, null, null, null, null, null], "duration": [1.79, 0.55, 1.69, 0.75, 6.39, 2.28, 0.05, 0.17, -0.12, 0.65, 1.98, 12.96, 0.72, 0.06, 0.29, 0.64, 1.66, 19.05, 1.38, 2.89, 0.99, 2.08, 6.81, 2.81, 3.16, 0.78, 1.63]} \ No newline at end of file diff --git a/annotations_filtered/iI0hgr8Kff8_filtered.json b/annotations_filtered/iI0hgr8Kff8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9ed66c565a87a2543bc91b5b4b4813635107ad7 --- /dev/null +++ b/annotations_filtered/iI0hgr8Kff8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.57], [6.0, 8.46]], "keep_status": [false, true], "silence_prob": [0.0, 46.43], "audiomae_on_audioset": [null, [["music", 44.56], ["speech", 9.5], ["didgeridoo", 4.87]]], "duration": [0.57, 2.46]} \ No newline at end of file diff --git a/annotations_filtered/iI8w5AQJcN8_filtered.json b/annotations_filtered/iI8w5AQJcN8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e163ea64771c72458f6661f0c9dd5b221f9588e --- /dev/null +++ b/annotations_filtered/iI8w5AQJcN8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.0], [4.0, 5.27], [7.0, 8.73], [11.0, 11.03], [12.0, 13.36], [14.0, 14.61], [15.0, 18.22], [19.0, 19.63], [21.0, 61.08], [63.0, 63.36], [64.0, 65.62], [68.0, 69.7], [71.0, 73.01], [74.0, 83.79], [85.0, 88.72], [90.0, 90.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.38, 0.0, 0.0, 0.0, 0.0, 0.0, 41.1, 45.08, 55.67, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.83], ["speech", 11.6], ["musical instrument", 7.89]], [["music", 42.43], ["theremin", 13.09], ["musical instrument", 9.34]], null, null], "duration": [1.0, 1.27, 1.73, 0.03, 1.36, 0.61, 3.22, 0.63, 40.08, 0.36, 1.62, 1.7, 2.01, 9.79, 3.72, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/iIUzHUOdLhM_filtered.json b/annotations_filtered/iIUzHUOdLhM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d34b7d1a1f09c01979a162e1df96ea01a4543825 --- /dev/null +++ b/annotations_filtered/iIUzHUOdLhM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 39.53], [41.0, 41.91], [50.0, 50.04], [58.0, 66.16], [71.0, 71.17], [75.0, 77.16], [78.0, 78.73], [80.0, 81.46], [82.0, 83.35], [84.0, 84.42], [91.0, 92.03], [104.0, 104.72], [107.0, 117.26], [117.0, 120.16], [122.0, 122.34], [123.0, 123.01]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.54, 0.0, 0.0, 76.04, 0.0, 73.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.43, 84.07, 0.0, 0.0], "audiomae_on_audioset": [[["music", 34.51], ["percussion", 13.42], ["hum", 7.27]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.53, 0.91, 0.04, 8.16, 0.17, 2.16, 0.73, 1.46, 1.35, 0.42, 1.03, 0.72, 10.26, 3.16, 0.34, 0.01]} \ No newline at end of file diff --git a/annotations_filtered/iIeyS_5sJHE_filtered.json b/annotations_filtered/iIeyS_5sJHE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ce4ab89a0fe50d52ae0a9e2a7855a969899f816 --- /dev/null +++ b/annotations_filtered/iIeyS_5sJHE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 16.56], [18.0, 22.65], [25.0, 50.65], [59.0, 89.61], [92.0, 98.58], [102.0, 102.15]], "keep_status": [true, false, false, false, false, false], "silence_prob": [32.25, 31.37, 30.3, 0.0, 31.86, 0.0], "audiomae_on_audioset": [[["music", 37.74], ["speech", 14.31], ["livestock, farm animals, working animals", 13.99]], [["speech", 57.42], ["music", 17.09], ["vehicle", 4.1]], [["music", 36.11], ["speech", 33.77], ["cacophony", 6.02]], null, [["speech", 70.25], ["music", 8.26], ["explosion", 2.85]], null], "duration": [9.56, 4.65, 25.65, 30.61, 6.58, 0.15]} \ No newline at end of file diff --git a/annotations_filtered/iJDnG2RAlzk_filtered.json b/annotations_filtered/iJDnG2RAlzk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab9c04ce9deaeb35607de7a4d45861294715b2ec --- /dev/null +++ b/annotations_filtered/iJDnG2RAlzk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.33], [16.0, 16.92], [21.0, 20.63], [21.0, 30.25], [31.0, 59.93], [61.0, 71.46], [72.0, 73.35], [74.0, 76.69], [79.0, 80.45], [82.0, 83.4], [84.0, 85.99], [87.0, 95.1]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 32.52, 31.67, 30.88, 0.0, 40.71, 0.0, 0.0, 0.0, 32.2], "audiomae_on_audioset": [null, null, null, [["speech", 49.88], ["sidetone", 13.96], ["electric shaver, electric razor", 11.86]], [["livestock, farm animals, working animals", 30.08], ["cattle, bovinae", 19.19], ["moo", 17.59]], [["speech", 28.08], ["music", 8.45], ["fly, housefly", 8.26]], null, [["whale vocalization", 38.83], ["speech", 33.58], ["music", 3.42]], null, null, null, [["speech", 45.84], ["explosion", 12.3], ["rumble", 7.59]]], "duration": [0.33, 0.92, -0.37, 9.25, 28.93, 10.46, 1.35, 2.69, 1.45, 1.4, 1.99, 8.1]} \ No newline at end of file diff --git a/annotations_filtered/iJGazi2EdrQ_filtered.json b/annotations_filtered/iJGazi2EdrQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..172fdc62f6b87303566499b7b7c4e8842f1972f6 --- /dev/null +++ b/annotations_filtered/iJGazi2EdrQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.83], [5.0, 6.49], [7.0, 8.34], [9.0, 9.1], [11.0, 11.25], [14.0, 15.26], [16.0, 16.51], [19.0, 19.36], [21.0, 23.62], [25.0, 30.57], [32.0, 75.46], [77.0, 84.59], [85.0, 99.3], [102.0, 107.13], [107.0, 111.6], [113.0, 116.72], [120.0, 120.6], [122.0, 124.44], [125.0, 135.14], [136.0, 141.35], [142.0, 144.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.16, 0.0, 98.44, 83.16, 94.66, 83.7, 85.72, 0.0, 95.37, 72.75, 81.53, 56.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.83, 1.49, 1.34, 0.1, 0.25, 1.26, 0.51, 0.36, 2.62, 5.57, 43.46, 7.59, 14.3, 5.13, 4.6, 3.72, 0.6, 2.44, 10.14, 5.35, 2.37]} \ No newline at end of file diff --git a/annotations_filtered/iJHyw2pjpWA_filtered.json b/annotations_filtered/iJHyw2pjpWA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..174565124e9f011aed63b9c24e10b18dd3ce70bc --- /dev/null +++ b/annotations_filtered/iJHyw2pjpWA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.55], [20.0, 20.44], [23.0, 23.94], [26.0, 26.16], [33.0, 34.11], [37.0, 41.44], [42.0, 43.44], [57.0, 63.02], [66.0, 72.28], [85.0, 85.58], [86.0, 86.26], [93.0, 94.8], [95.0, 96.65], [100.0, 117.73], [126.0, 127.26], [128.0, 129.56], [130.0, 132.76], [137.0, 137.46], [141.0, 146.01], [155.0, 156.07]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 33.33, 0.0, 30.77, 32.22, 0.0, 0.0, 0.0, 0.0, 30.24, 0.0, 0.0, 39.01, 0.0, 31.53, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 60.03], ["speech", 18.55], ["musical instrument", 1.47]], null, [["speech", 34.52], ["hum", 12.47], ["buzz", 12.3]], [["throbbing", 37.84], ["music", 32.03], ["hum", 9.62]], null, null, null, null, [["music", 56.06], ["buzz", 7.88], ["throbbing", 5.94]], null, null, [["speech", 37.87], ["music", 22.91], ["fart", 4.86]], null, [["speech", 53.34], ["music", 7.63], ["moo", 6.64]], null], "duration": [1.55, 0.44, 0.94, 0.16, 1.11, 4.44, 1.44, 6.02, 6.28, 0.58, 0.26, 1.8, 1.65, 17.73, 1.26, 1.56, 2.76, 0.46, 5.01, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/iJKQl3uGg0I_filtered.json b/annotations_filtered/iJKQl3uGg0I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26928dc7bd547ec40cd1c0a157d433fb2c09281b --- /dev/null +++ b/annotations_filtered/iJKQl3uGg0I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.44], [3.0, 4.13], [6.0, 7.11], [8.0, 9.53], [10.0, 11.31], [12.0, 12.78], [14.0, 18.35], [20.0, 20.68], [25.0, 25.88], [27.0, 28.44], [29.0, 29.42], [31.0, 33.32], [34.0, 34.55], [37.0, 43.5], [45.0, 45.64], [50.0, 50.79], [52.0, 56.27], [59.0, 59.24], [62.0, 63.02], [65.0, 65.08], [66.0, 67.69], [69.0, 69.31], [70.0, 71.36], [73.0, 74.14], [76.0, 77.85], [80.0, 80.86], [82.0, 83.12], [84.0, 85.63], [87.0, 87.24], [88.0, 99.22], [101.0, 102.12], [103.0, 103.87], [104.0, 107.4], [110.0, 110.37], [120.0, 121.68], [123.0, 123.96], [125.0, 125.83], [129.0, 129.02], [130.0, 131.46], [133.0, 132.87], [137.0, 139.14], [142.0, 143.29], [145.0, 145.32], [146.0, 146.48], [148.0, 149.23], [150.0, 151.43], [153.0, 154.14], [155.0, 156.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.96, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 37.21, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.76, 0.0, 0.0, 56.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 63.58], ["hum", 4.11], ["radio", 3.43]], null, null, null, null, null, null, [["music", 17.13], ["fart", 14.13], ["speech", 10.87]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.44, 1.13, 1.11, 1.53, 1.31, 0.78, 4.35, 0.68, 0.88, 1.44, 0.42, 2.32, 0.55, 6.5, 0.64, 0.79, 4.27, 0.24, 1.02, 0.08, 1.69, 0.31, 1.36, 1.14, 1.85, 0.86, 1.12, 1.63, 0.24, 11.22, 1.12, 0.87, 3.4, 0.37, 1.68, 0.96, 0.83, 0.02, 1.46, -0.13, 2.14, 1.29, 0.32, 0.48, 1.23, 1.43, 1.14, 1.66]} \ No newline at end of file diff --git a/annotations_filtered/iJKhynhnPyU_filtered.json b/annotations_filtered/iJKhynhnPyU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18b7211222819d97e89a3317b0a1ab5e0f89e05b --- /dev/null +++ b/annotations_filtered/iJKhynhnPyU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.82], [11.0, 11.74], [19.0, 19.25], [32.0, 31.89], [47.0, 47.34], [54.0, 54.3], [62.0, 62.45], [64.0, 63.88], [65.0, 66.09], [67.0, 70.63], [73.0, 76.65], [78.0, 78.88], [80.0, 81.6], [83.0, 84.79], [88.0, 88.57], [96.0, 96.06], [99.0, 99.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 63.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.82, 0.74, 0.25, -0.11, 0.34, 0.3, 0.45, -0.12, 1.09, 3.63, 3.65, 0.88, 1.6, 1.79, 0.57, 0.06, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/iJMYIXoFGcQ_filtered.json b/annotations_filtered/iJMYIXoFGcQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b826b96b195f116739e5a34b15501b6f6712164 --- /dev/null +++ b/annotations_filtered/iJMYIXoFGcQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.52], [4.0, 4.99], [7.0, 8.02], [9.0, 10.94], [12.0, 12.77], [15.0, 15.82], [23.0, 22.94], [23.0, 27.63], [31.0, 33.32], [36.0, 37.44], [39.0, 39.06], [48.0, 48.49], [51.0, 52.93], [62.0, 63.85], [81.0, 81.94], [92.0, 93.6], [95.0, 95.4], [100.0, 101.07], [102.0, 102.56], [104.0, 105.26], [108.0, 108.26], [111.0, 111.13], [112.0, 112.4], [117.0, 118.07]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.48, 72.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 50.4], ["musical instrument", 8.5], ["cello", 4.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.52, 0.99, 1.02, 1.94, 0.77, 0.82, -0.06, 4.63, 2.32, 1.44, 0.06, 0.49, 1.93, 1.85, 0.94, 1.6, 0.4, 1.07, 0.56, 1.26, 0.26, 0.13, 0.4, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/iJ_DrM05hp4_filtered.json b/annotations_filtered/iJ_DrM05hp4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf10cda20fe0ab35244e0c8731e1773ade72b6a2 --- /dev/null +++ b/annotations_filtered/iJ_DrM05hp4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.19], [9.0, 9.54], [15.0, 15.31], [17.0, 17.51], [24.0, 26.05], [29.0, 30.0], [35.0, 35.56], [37.0, 37.66], [41.0, 41.05], [44.0, 44.24], [50.0, 50.9], [54.0, 53.7], [60.0, 61.8], [89.0, 89.55], [90.0, 91.1], [92.0, 92.38], [122.0, 123.09], [140.0, 140.29], [145.0, 145.47], [147.0, 148.26], [150.0, 150.47], [154.0, 155.01], [162.0, 162.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.19, 0.54, 0.31, 0.51, 2.05, 1.0, 0.56, 0.66, 0.05, 0.24, 0.9, -0.3, 1.8, 0.55, 1.1, 0.38, 1.09, 0.29, 0.47, 1.26, 0.47, 1.01, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/iJcH2hCMNiY_filtered.json b/annotations_filtered/iJcH2hCMNiY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bde9d31ba2f168b9906d6d47841bed1ab0e2fb31 --- /dev/null +++ b/annotations_filtered/iJcH2hCMNiY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.32], [8.0, 8.24], [11.0, 11.13], [18.0, 19.2], [19.0, 22.18], [33.0, 33.07], [35.0, 35.51], [45.0, 45.77], [48.0, 48.76], [50.0, 50.79], [55.0, 55.9], [63.0, 63.15], [66.0, 67.02], [68.0, 68.5], [73.0, 76.94], [78.0, 78.93], [80.0, 80.62], [82.0, 83.91], [86.0, 85.95], [95.0, 95.5], [98.0, 98.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 96.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.32, 0.24, 0.13, 1.2, 3.18, 0.07, 0.51, 0.77, 0.76, 0.79, 0.9, 0.15, 1.02, 0.5, 3.94, 0.93, 0.62, 1.91, -0.05, 0.5, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/iJrgXYnUVe8_filtered.json b/annotations_filtered/iJrgXYnUVe8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d95d6c089f27f0010d0e6f69c5efe411cf8a60ab --- /dev/null +++ b/annotations_filtered/iJrgXYnUVe8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 27.35], [29.0, 30.54], [33.0, 33.81], [37.0, 39.29], [41.0, 41.2], [42.0, 79.69], [82.0, 82.56], [88.0, 87.72], [93.0, 95.01], [96.0, 98.27], [102.0, 102.86], [104.0, 104.77], [114.0, 118.02], [120.0, 124.28], [126.0, 128.68]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [30.94, 0.0, 0.0, 32.73, 0.0, 0.0, 0.0, 0.0, 100.0, 94.52, 0.0, 0.0, 30.83, 30.21, 32.64], "audiomae_on_audioset": [[["hum", 46.47], ["throbbing", 43.11], ["music", 6.14]], null, null, [["music", 19.19], ["hum", 14.31], ["rumble", 7.31]], null, null, null, null, null, null, null, null, [["boom", 24.09], ["whack, thwack", 9.47], ["explosion", 9.43]], [["speech", 30.7], ["boing", 21.92], ["music", 11.72]], [["music", 41.53], ["boing", 21.77], ["speech", 5.51]]], "duration": [17.35, 1.54, 0.81, 2.29, 0.2, 37.69, 0.56, -0.28, 2.01, 2.27, 0.86, 0.77, 4.02, 4.28, 2.68]} \ No newline at end of file diff --git a/annotations_filtered/iK0-76FChfk_filtered.json b/annotations_filtered/iK0-76FChfk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc10ac998194dfa331c3a1b019780221aed7c387 --- /dev/null +++ b/annotations_filtered/iK0-76FChfk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.78], [9.0, 10.35], [11.0, 12.73], [13.0, 16.88], [18.0, 20.71], [24.0, 26.13], [26.0, 30.96], [32.0, 33.32], [39.0, 53.0], [64.0, 64.07], [65.0, 77.41], [79.0, 79.14], [82.0, 81.97], [83.0, 85.95], [86.0, 95.23], [101.0, 103.2], [105.0, 112.58], [118.0, 119.33], [122.0, 122.23], [126.0, 125.88], [127.0, 128.53], [130.0, 131.3], [133.0, 134.91], [136.0, 137.94], [141.0, 142.13], [144.0, 148.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [52.45, 0.0, 0.0, 53.91, 91.3, 99.16, 70.3, 0.0, 91.3, 0.0, 34.22, 0.0, 0.0, 30.5, 40.7, 85.54, 39.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 42.35], ["sidetone", 17.65], ["music", 14.73]], null, null, [["speech", 34.64], ["didgeridoo", 16.28], ["music", 9.95]], [["music", 27.33], ["speech", 21.86], ["throbbing", 10.13]], null, [["speech", 40.86], ["explosion", 20.57], ["burst, pop", 6.17]], null, null, null, null, null, null, null, null, null], "duration": [3.78, 1.35, 1.73, 3.88, 2.71, 2.13, 4.96, 1.32, 14.0, 0.07, 12.41, 0.14, -0.03, 2.95, 9.23, 2.2, 7.58, 1.33, 0.23, -0.12, 1.53, 1.3, 1.91, 1.94, 1.13, 4.02]} \ No newline at end of file diff --git a/annotations_filtered/iK03b228mmo_filtered.json b/annotations_filtered/iK03b228mmo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f73cf951c694189ff4769083751fa7fc2952c41e --- /dev/null +++ b/annotations_filtered/iK03b228mmo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.85], [11.0, 17.74], [18.0, 19.63], [22.0, 25.62], [27.0, 29.37], [31.0, 32.04], [33.0, 39.68], [40.0, 41.13], [43.0, 44.2], [45.0, 54.51], [55.0, 55.9], [56.0, 68.79], [70.0, 86.02], [89.0, 90.24], [94.0, 110.94], [117.0, 118.56], [122.0, 125.44], [131.0, 130.87], [132.0, 140.09], [142.0, 152.68], [157.0, 166.24]], "keep_status": [true, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true], "silence_prob": [29.13, 29.07, 0.0, 30.24, 32.05, 0.0, 30.73, 0.0, 0.0, 30.33, 0.0, 30.85, 29.43, 0.0, 31.63, 0.0, 32.77, 0.0, 36.35, 34.66, 35.37], "audiomae_on_audioset": [[["music", 47.5], ["hum", 8.65], ["throbbing", 8.04]], [["music", 30.56], ["hum", 13.73], ["throbbing", 12.16]], null, [["music", 21.14], ["hum", 17.92], ["throbbing", 7.06]], [["music", 46.54], ["hum", 11.33], ["throbbing", 8.23]], null, [["music", 31.96], ["hum", 22.62], ["speech", 18.78]], null, null, [["speech", 34.61], ["hum", 20.0], ["music", 18.54]], null, [["didgeridoo", 72.48], ["music", 11.04], ["gong", 2.44]], [["hum", 29.3], ["didgeridoo", 23.52], ["music", 19.48]], null, [["music", 45.04], ["hum", 27.01], ["throbbing", 9.71]], null, [["music", 35.98], ["hum", 7.37], ["speech", 6.82]], null, [["hum", 33.84], ["mains hum", 23.41], ["music", 20.84]], [["mains hum", 34.7], ["hum", 19.0], ["speech", 8.17]], [["music", 25.51], ["mains hum", 14.37], ["hum", 8.57]]], "duration": [5.85, 6.74, 1.63, 3.62, 2.37, 1.04, 6.68, 1.13, 1.2, 9.51, 0.9, 12.79, 16.02, 1.24, 16.94, 1.56, 3.44, -0.13, 8.09, 10.68, 9.24]} \ No newline at end of file diff --git a/annotations_filtered/iK6cDwd3yH4_filtered.json b/annotations_filtered/iK6cDwd3yH4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5fa83eef93a4ee73e9114dbde758c5e87dc6c63 --- /dev/null +++ b/annotations_filtered/iK6cDwd3yH4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.32], [2.0, 2.37], [5.0, 5.41], [7.0, 7.99], [9.0, 10.52], [15.0, 15.3], [24.0, 24.49], [32.0, 33.88], [40.0, 40.73], [42.0, 42.72], [47.0, 48.34], [54.0, 54.95], [64.0, 64.88], [70.0, 70.92], [74.0, 81.51], [84.0, 85.18], [89.0, 91.39], [92.0, 97.12], [99.0, 99.28], [100.0, 100.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.09, 0.0, 99.16, 72.01, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.42], ["speech", 9.02], ["groan", 7.57]], null, null, null, null, null], "duration": [0.32, 0.37, 0.41, 0.99, 1.52, 0.3, 0.49, 1.88, 0.73, 0.72, 1.34, 0.95, 0.88, 0.92, 7.51, 1.18, 2.39, 5.12, 0.28, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/iKRpMjVJKZc_filtered.json b/annotations_filtered/iKRpMjVJKZc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f0fc91a0d223c0eb66cb62a86457d13eb46ae1f --- /dev/null +++ b/annotations_filtered/iKRpMjVJKZc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.73], [12.0, 12.16], [16.0, 16.34], [19.0, 20.38], [23.0, 24.09], [25.0, 25.42], [27.0, 27.8], [29.0, 29.51], [36.0, 36.58], [42.0, 45.27], [49.0, 48.64], [50.0, 50.77], [52.0, 53.87], [55.0, 55.66], [60.0, 60.03], [64.0, 64.5], [65.0, 66.18], [67.0, 68.32], [77.0, 79.79], [81.0, 81.53], [83.0, 84.5], [97.0, 97.38], [99.0, 99.59], [100.0, 103.42], [105.0, 118.12], [123.0, 125.59], [135.0, 151.7], [154.0, 154.55], [156.0, 161.45], [163.0, 170.16], [172.0, 175.85], [177.0, 177.9]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.96, 0.0, 0.0, 0.0, 0.0, 30.72, 32.46, 39.44, 30.42, 0.0, 32.15, 33.92, 39.15, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 33.17], ["frog", 15.14], ["sidetone", 7.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["moo", 23.99], ["cattle, bovinae", 22.16], ["music", 15.88]], [["music", 53.39], ["electronic music", 6.27], ["techno", 5.91]], [["fly, housefly", 25.48], ["insect", 14.55], ["music", 11.41]], [["music", 46.82], ["speech", 10.53], ["theremin", 3.96]], null, [["music", 63.06], ["trance music", 7.07], ["speech", 5.71]], [["music", 45.01], ["sidetone", 30.87], ["speech", 9.5]], [["music", 28.33], ["speech", 17.68], ["fly, housefly", 9.37]], null], "duration": [0.73, 0.16, 0.34, 1.38, 1.09, 0.42, 0.8, 0.51, 0.58, 3.27, -0.36, 0.77, 1.87, 0.66, 0.03, 0.5, 1.18, 1.32, 2.79, 0.53, 1.5, 0.38, 0.59, 3.42, 13.12, 2.59, 16.7, 0.55, 5.45, 7.16, 3.85, 0.9]} \ No newline at end of file diff --git a/annotations_filtered/iKS_327EF84_filtered.json b/annotations_filtered/iKS_327EF84_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c05d7f2a37cb41e5fa3dc55572db75f139090c01 --- /dev/null +++ b/annotations_filtered/iKS_327EF84_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.7], [15.0, 16.11], [17.0, 20.14], [21.0, 25.46], [30.0, 31.94], [33.0, 40.63], [47.0, 49.37], [66.0, 71.71], [82.0, 84.62], [86.0, 87.72], [90.0, 96.09], [99.0, 101.09], [110.0, 116.95], [125.0, 168.98], [173.0, 174.09], [174.0, 174.24], [177.0, 176.89]], "keep_status": [false, false, true, true, false, true, true, true, true, false, true, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 32.08, 30.08, 0.0, 29.25, 31.32, 29.91, 33.34, 0.0, 31.36, 30.68, 30.08, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["sidetone", 31.67], ["music", 27.9], ["speech", 6.95]], [["speech", 35.46], ["music", 24.92], ["electronic music", 6.76]], null, [["music", 24.12], ["electronic music", 16.81], ["speech", 9.92]], [["music", 29.05], ["throbbing", 19.26], ["hum", 7.23]], [["music", 24.72], ["throbbing", 13.05], ["hum", 7.24]], [["fly, housefly", 20.14], ["mosquito", 16.67], ["groan", 11.6]], null, [["music", 60.43], ["didgeridoo", 3.97], ["throbbing", 2.8]], [["speech", 32.47], ["music", 17.61], ["outside, urban or manmade", 3.71]], [["buzz", 31.55], ["fly, housefly", 12.15], ["mosquito", 12.15]], null, null, null, null], "duration": [1.7, 1.11, 3.14, 4.46, 1.94, 7.63, 2.37, 5.71, 2.62, 1.72, 6.09, 2.09, 6.95, 43.98, 1.09, 0.24, -0.11]} \ No newline at end of file diff --git a/annotations_filtered/iKduvC0uNs8_filtered.json b/annotations_filtered/iKduvC0uNs8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dce2d841152e643e2e96d88d3c3a3b1a6bacb455 --- /dev/null +++ b/annotations_filtered/iKduvC0uNs8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 61.8], [62.0, 73.55], [78.0, 80.79], [82.0, 101.44], [104.0, 110.1], [115.0, 123.31], [123.0, 137.35], [140.0, 142.11], [145.0, 150.87], [152.0, 152.31]], "keep_status": [false, false, true, false, false, false, true, false, false, false], "silence_prob": [35.8, 32.23, 29.51, 29.02, 28.78, 29.04, 29.01, 55.74, 48.69, 0.0], "audiomae_on_audioset": [[["music", 53.32], ["mains hum", 21.54], ["hum", 15.75]], [["music", 66.64], ["didgeridoo", 6.62], ["throbbing", 3.27]], [["music", 33.88], ["shofar", 15.88], ["wind instrument, woodwind instrument", 4.61]], [["music", 72.05], ["synthesizer", 6.48], ["musical instrument", 3.69]], [["music", 71.57], ["musical instrument", 3.08], ["vehicle", 2.23]], [["music", 52.55], ["theremin", 15.68], ["speech", 2.88]], [["music", 21.94], ["wind instrument, woodwind instrument", 15.07], ["shofar", 8.64]], null, [["music", 42.94], ["didgeridoo", 27.73], ["musical instrument", 3.78]], null], "duration": [13.8, 11.55, 2.79, 19.44, 6.1, 8.31, 14.35, 2.11, 5.87, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/iKi2wYZNAnE_filtered.json b/annotations_filtered/iKi2wYZNAnE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80f724378da20af00726f9443c8af7a66f553f68 --- /dev/null +++ b/annotations_filtered/iKi2wYZNAnE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.31], [12.0, 13.83], [19.0, 20.19], [23.0, 26.45], [30.0, 32.54], [34.0, 34.89], [39.0, 39.51], [48.0, 51.34], [52.0, 53.52], [54.0, 54.5], [55.0, 56.17], [67.0, 66.97], [69.0, 69.5], [79.0, 80.13], [81.0, 81.5], [82.0, 83.39], [103.0, 103.94], [113.0, 113.68]], "keep_status": [false, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.39, 41.64, 0.0, 0.0, 32.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 20.12], ["livestock, farm animals, working animals", 19.33], ["cattle, bovinae", 17.62]], [["speech", 15.41], ["mains hum", 7.01], ["moo", 5.41]], null, null, [["music", 37.76], ["didgeridoo", 14.12], ["speech", 8.97]], null, null, null, null, null, null, null, null, null, null], "duration": [0.31, 1.83, 1.19, 3.45, 2.54, 0.89, 0.51, 3.34, 1.52, 0.5, 1.17, -0.03, 0.5, 1.13, 0.5, 1.39, 0.94, 0.68]} \ No newline at end of file diff --git a/annotations_filtered/iKp5ARBBpyc_filtered.json b/annotations_filtered/iKp5ARBBpyc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c076a4e2faa8ab99f6af5bf55b3634a086793851 --- /dev/null +++ b/annotations_filtered/iKp5ARBBpyc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.68], [16.0, 20.51], [21.0, 22.03], [31.0, 31.68], [40.0, 40.36], [43.0, 44.04], [45.0, 46.33], [52.0, 54.11], [64.0, 65.21], [72.0, 72.22], [73.0, 74.04], [74.0, 74.98], [79.0, 80.62], [82.0, 83.46], [94.0, 94.14], [100.0, 103.0], [110.0, 111.0], [124.0, 124.98], [125.0, 125.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 83.34, 0.0, 0.0, 0.0, 0.0, 0.0, 42.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.77, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["tuning fork", 48.87], ["speech", 28.73], ["busy signal", 4.88]], null, null, null, null, null, null, null, [["sidetone", 38.08], ["noise", 17.7], ["music", 6.87]], null, null, null], "duration": [0.68, 4.51, 1.03, 0.68, 0.36, 1.04, 1.33, 2.11, 1.21, 0.22, 1.04, 0.98, 1.62, 1.46, 0.14, 3.0, 1.0, 0.98, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/iKqGXeX9LhQ_filtered.json b/annotations_filtered/iKqGXeX9LhQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6324cbbef153b429c9946d896a26a9f6b9247f0c --- /dev/null +++ b/annotations_filtered/iKqGXeX9LhQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.3], [12.0, 24.66]], "keep_status": [false, false], "silence_prob": [39.58, 43.56], "audiomae_on_audioset": [[["music", 53.65], ["speech", 13.22], ["theremin", 5.48]], [["music", 64.41], ["speech", 8.64], ["inside, small room", 2.16]]], "duration": [6.3, 12.66]} \ No newline at end of file diff --git a/annotations_filtered/iKscMa0XRXo_filtered.json b/annotations_filtered/iKscMa0XRXo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d04a2c2e7a08abf9437ed2d4e9d2f1f8a7d515b --- /dev/null +++ b/annotations_filtered/iKscMa0XRXo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.53], [10.0, 10.15], [13.0, 12.66], [29.0, 31.04], [39.0, 39.01], [41.0, 41.76], [51.0, 52.59], [54.0, 55.53], [94.0, 94.61], [124.0, 124.78], [125.0, 125.52], [163.0, 164.42]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 42.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["single-lens reflex camera", 36.51], ["music", 10.69], ["noise", 9.08]], null, null, null, null, null, null, null, null], "duration": [0.53, 0.15, -0.34, 2.04, 0.01, 0.76, 1.59, 1.53, 0.61, 0.78, 0.52, 1.42]} \ No newline at end of file diff --git a/annotations_filtered/iKw7Ndv4bRM_filtered.json b/annotations_filtered/iKw7Ndv4bRM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f526208ec942fbc38ef7be7ebdd8703913f7c1c --- /dev/null +++ b/annotations_filtered/iKw7Ndv4bRM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.95], [7.0, 13.66], [18.0, 21.93], [25.0, 24.97]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 48.48, 91.3, 0.0], "audiomae_on_audioset": [null, [["hum", 34.15], ["speech", 26.38], ["mains hum", 24.73]], null, null], "duration": [0.95, 6.66, 3.93, -0.03]} \ No newline at end of file diff --git a/annotations_filtered/iKzLZIbUM8o_filtered.json b/annotations_filtered/iKzLZIbUM8o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2372bf86c77b199d4aefd3c50e2e3b86f403f607 --- /dev/null +++ b/annotations_filtered/iKzLZIbUM8o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[61.0, 61.11], [61.0, 102.02], [106.0, 139.23]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.11, 41.02, 33.23]} \ No newline at end of file diff --git a/annotations_filtered/iLBL-XeNrRI_filtered.json b/annotations_filtered/iLBL-XeNrRI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..03aed39cd980fe407fe9a0eb9205e91ad2e19e87 --- /dev/null +++ b/annotations_filtered/iLBL-XeNrRI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 31.63], [32.0, 33.39], [41.0, 42.55], [45.0, 45.55], [63.0, 64.56]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.63, 1.39, 1.55, 0.55, 1.56]} \ No newline at end of file diff --git a/annotations_filtered/iLFMRsi07_I_filtered.json b/annotations_filtered/iLFMRsi07_I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/iLFMRsi07_I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/iLJtz-2nkGk_filtered.json b/annotations_filtered/iLJtz-2nkGk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..143cf5e937c5782a9171f4809b8e1ad3db266e70 --- /dev/null +++ b/annotations_filtered/iLJtz-2nkGk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.28], [17.0, 17.47], [19.0, 20.19], [22.0, 23.68], [27.0, 35.85], [38.0, 58.28], [63.0, 63.29], [65.0, 80.37], [82.0, 84.33], [85.0, 86.32], [94.0, 102.68], [103.0, 107.79], [108.0, 109.05], [110.0, 111.03], [112.0, 112.4], [114.0, 116.6], [121.0, 125.74], [127.0, 126.87], [129.0, 130.54], [131.0, 132.06], [134.0, 157.0], [161.0, 161.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 54.83, 30.04, 0.0, 30.38, 29.64, 0.0, 30.83, 31.5, 0.0, 0.0, 0.0, 30.14, 30.63, 0.0, 0.0, 0.0, 32.15, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 48.94], ["speech", 22.95], ["thump, thud", 5.02]], null, [["music", 49.38], ["speech", 42.72], ["electronic music", 0.53]], [["music", 47.85], ["cacophony", 33.54], ["throbbing", 6.25]], null, [["music", 55.03], ["didgeridoo", 12.44], ["speech", 12.31]], [["speech", 41.94], ["music", 38.22], ["musical instrument", 2.24]], null, null, null, [["music", 65.64], ["musical instrument", 3.85], ["drum", 1.95]], [["speech", 49.72], ["music", 14.9], ["vehicle", 3.36]], null, null, null, [["speech", 39.5], ["music", 14.56], ["sound effect", 4.48]], null], "duration": [0.28, 0.47, 1.19, 1.68, 8.85, 20.28, 0.29, 15.37, 2.33, 1.32, 8.68, 4.79, 1.05, 1.03, 0.4, 2.6, 4.74, -0.13, 1.54, 1.06, 23.0, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/iLN9GLRC5is_filtered.json b/annotations_filtered/iLN9GLRC5is_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec132a116b6006c1da9d6406e4ae5ca615a1d94e --- /dev/null +++ b/annotations_filtered/iLN9GLRC5is_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.41], [16.0, 18.17], [21.0, 21.96], [30.0, 30.33], [30.0, 30.5], [31.0, 31.78], [49.0, 49.27], [54.0, 55.09], [72.0, 72.23], [76.0, 76.27], [82.0, 83.84], [85.0, 86.66], [87.0, 90.9], [93.0, 93.34], [97.0, 98.14], [112.0, 112.72], [145.0, 146.99], [147.0, 148.46], [150.0, 154.13], [157.0, 158.75], [160.0, 161.82], [165.0, 165.67], [166.0, 166.5], [168.0, 168.99], [176.0, 176.89], [187.0, 187.3], [190.0, 190.97], [192.0, 192.62], [199.0, 199.37], [201.0, 201.87], [212.0, 216.57]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.85, 0.0, 0.0, 0.0, 0.0, 0.0, 50.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.99], "audiomae_on_audioset": [null, [["music", 35.88], ["didgeridoo", 10.96], ["musical instrument", 6.66]], null, null, null, null, null, null, null, null, null, null, [["music", 57.22], ["boing", 6.01], ["didgeridoo", 4.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 48.18], ["moo", 38.63], ["livestock, farm animals, working animals", 8.96]]], "duration": [1.41, 2.17, 0.96, 0.33, 0.5, 0.78, 0.27, 1.09, 0.23, 0.27, 1.84, 1.66, 3.9, 0.34, 1.14, 0.72, 1.99, 1.46, 4.13, 1.75, 1.82, 0.67, 0.5, 0.99, 0.89, 0.3, 0.97, 0.62, 0.37, 0.87, 4.57]} \ No newline at end of file diff --git a/annotations_filtered/iLYeR6v-fVE_filtered.json b/annotations_filtered/iLYeR6v-fVE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f46f22a90767818a9f5f0fb50908d08239df8994 --- /dev/null +++ b/annotations_filtered/iLYeR6v-fVE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.06], [8.0, 17.09], [42.0, 47.21], [53.0, 53.64], [55.0, 55.73], [57.0, 57.13], [60.0, 64.69], [65.0, 64.83], [65.0, 64.96], [66.0, 67.66], [69.0, 69.72], [75.0, 82.0], [83.0, 84.23], [86.0, 86.8], [89.0, 89.88], [92.0, 93.11], [94.0, 95.4], [99.0, 101.09], [102.0, 103.54], [112.0, 112.77], [114.0, 115.06], [120.0, 123.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.58, 32.36, 0.0, 0.0, 0.0, 44.6, 0.0, 0.0, 0.0, 0.0, 61.67, 0.0, 0.0, 0.0, 0.0, 0.0, 69.47, 0.0, 0.0, 0.0, 58.05], "audiomae_on_audioset": [null, [["music", 81.44], ["didgeridoo", 11.75], ["musical instrument", 2.99]], [["music", 71.38], ["synthesizer", 6.08], ["musical instrument", 2.54]], null, null, null, [["music", 59.0], ["speech", 9.46], ["synthesizer", 3.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.06, 9.09, 5.21, 0.64, 0.73, 0.13, 4.69, -0.17, -0.04, 1.66, 0.72, 7.0, 1.23, 0.8, 0.88, 1.11, 1.4, 2.09, 1.54, 0.77, 1.06, 3.23]} \ No newline at end of file diff --git a/annotations_filtered/iLgMFwStTHc_filtered.json b/annotations_filtered/iLgMFwStTHc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b78ef96e6e0a256bb14351a6a4895cf7231d0b1 --- /dev/null +++ b/annotations_filtered/iLgMFwStTHc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.85], [10.0, 10.83], [30.0, 30.43], [32.0, 31.9], [34.0, 35.48], [36.0, 36.42], [37.0, 39.45], [40.0, 40.58], [45.0, 46.72], [57.0, 57.69], [58.0, 58.45], [61.0, 61.28], [68.0, 68.88], [70.0, 76.52], [78.0, 78.31], [79.0, 79.17], [84.0, 85.5], [87.0, 86.86], [90.0, 89.82], [91.0, 90.83], [91.0, 93.19], [94.0, 94.83], [102.0, 102.17], [103.0, 105.06], [116.0, 116.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.22, 0.0, 0.0, 43.05, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 59.56], ["thunk", 14.8], ["dial tone", 3.28]], null, null, null, null, null, null, [["speech", 42.29], ["sidetone", 15.9], ["fly, housefly", 4.55]], null, null, null, null, null, null, [["speech", 70.47], ["radio", 3.61], ["sidetone", 1.26]], null, null, [["speech", 38.75], ["radio", 35.6], ["sidetone", 10.56]], null], "duration": [0.85, 0.83, 0.43, -0.1, 1.48, 0.42, 2.45, 0.58, 1.72, 0.69, 0.45, 0.28, 0.88, 6.52, 0.31, 0.17, 1.5, -0.14, -0.18, -0.17, 2.19, 0.83, 0.17, 2.06, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/iM0hP-LZIvI_filtered.json b/annotations_filtered/iM0hP-LZIvI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66356d2c75e62207ea1b381baa8bb0c35f49412c --- /dev/null +++ b/annotations_filtered/iM0hP-LZIvI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 42.89], [44.0, 45.59], [46.0, 59.19], [60.0, 73.65]], "keep_status": [false, false, false, false], "silence_prob": [28.71, 0.0, 28.11, 28.2], "audiomae_on_audioset": [[["music", 91.64], ["electronic music", 1.41], ["didgeridoo", 1.26]], null, [["music", 38.21], ["throbbing", 22.85], ["hum", 16.04]], [["music", 79.37], ["electronic music", 3.28], ["hum", 1.9]]], "duration": [7.89, 1.59, 13.19, 13.65]} \ No newline at end of file diff --git a/annotations_filtered/iMA4bMMh44w_filtered.json b/annotations_filtered/iMA4bMMh44w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..696545ae9fe5941d01e4d9d982a5b7201afe370e --- /dev/null +++ b/annotations_filtered/iMA4bMMh44w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 26.25], [28.0, 31.23], [32.0, 35.23], [38.0, 39.24], [41.0, 43.83], [47.0, 48.19], [52.0, 55.65], [57.0, 58.18], [61.0, 65.26], [68.0, 69.13], [72.0, 74.76], [76.0, 76.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.85, 99.88, 99.4, 0.0, 99.96, 0.0, 98.99, 0.0, 99.05, 0.0, 99.94, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.25, 3.23, 3.23, 1.24, 2.83, 1.19, 3.65, 1.18, 4.26, 1.13, 2.76, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/iMP3uLZl6UE_filtered.json b/annotations_filtered/iMP3uLZl6UE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4de022636fdb891ad7299bc58ef9e1528e83c3e8 --- /dev/null +++ b/annotations_filtered/iMP3uLZl6UE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.57], [4.0, 8.99], [12.0, 12.5], [13.0, 15.35], [16.0, 19.85], [20.0, 36.44], [38.0, 38.8], [40.0, 70.95], [72.0, 75.07], [77.0, 79.29], [80.0, 88.67], [93.0, 110.84], [112.0, 120.12]], "keep_status": [false, true, false, false, false, true, false, false, true, false, false, true, false], "silence_prob": [0.0, 28.83, 0.0, 93.76, 94.66, 48.91, 0.0, 0.0, 46.4, 50.51, 31.77, 31.63, 46.12], "audiomae_on_audioset": [null, [["noise", 20.14], ["music", 14.51], ["synthesizer", 11.92]], null, null, null, [["speech", 17.36], ["fly, housefly", 12.55], ["bee, wasp, etc.", 11.5]], null, null, [["music", 48.48], ["hum", 15.7], ["mains hum", 5.82]], null, [["music", 78.82], ["synthesizer", 3.16], ["musical instrument", 2.93]], [["music", 34.46], ["fly, housefly", 14.58], ["insect", 6.93]], [["music", 53.1], ["coin (dropping)", 15.12], ["synthesizer", 8.35]]], "duration": [1.57, 4.99, 0.5, 2.35, 3.85, 16.44, 0.8, 30.95, 3.07, 2.29, 8.67, 17.84, 8.12]} \ No newline at end of file diff --git a/annotations_filtered/iMPV0eFLxbQ_filtered.json b/annotations_filtered/iMPV0eFLxbQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f824e770b9d23741cfb65332b3ee211b82430b1a --- /dev/null +++ b/annotations_filtered/iMPV0eFLxbQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.39], [15.0, 15.7], [17.0, 16.98], [19.0, 19.06], [20.0, 25.05], [35.0, 35.02], [37.0, 40.44], [41.0, 43.77], [52.0, 54.04], [56.0, 56.27], [64.0, 65.11], [68.0, 69.65], [73.0, 73.65], [75.0, 76.49], [82.0, 82.53], [88.0, 89.06], [95.0, 95.34], [100.0, 102.05], [105.0, 115.28], [116.0, 117.22], [119.0, 119.57], [121.0, 121.64]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.75, 0.0, 35.97, 35.93, 47.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.13, 36.32, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 63.93], ["drum", 4.86], ["musical instrument", 3.92]], null, [["foghorn", 42.13], ["music", 24.1], ["trombone", 4.54]], [["music", 48.16], ["trombone", 11.35], ["foghorn", 10.66]], [["music", 60.28], ["foghorn", 4.47], ["musical instrument", 2.78]], null, null, null, null, null, null, null, null, null, [["music", 70.46], ["musical instrument", 6.76], ["wind instrument, woodwind instrument", 3.0]], null, null, null], "duration": [0.39, 0.7, -0.02, 0.06, 5.05, 0.02, 3.44, 2.77, 2.04, 0.27, 1.11, 1.65, 0.65, 1.49, 0.53, 1.06, 0.34, 2.05, 10.28, 1.22, 0.57, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/iMzGaN5Sg3w_filtered.json b/annotations_filtered/iMzGaN5Sg3w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7eeaebdd9fca6df2183837e5e3f5b982f28474f7 --- /dev/null +++ b/annotations_filtered/iMzGaN5Sg3w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.48], [6.0, 6.81], [13.0, 13.31], [14.0, 15.6], [17.0, 23.11], [26.0, 27.35], [28.0, 29.02], [30.0, 31.31], [32.0, 35.19], [36.0, 36.68], [40.0, 41.22], [46.0, 52.25], [61.0, 61.32], [67.0, 68.86], [73.0, 73.65], [76.0, 81.48], [85.0, 85.83], [97.0, 97.85], [106.0, 106.39], [109.0, 109.53], [111.0, 115.28], [116.0, 116.82], [119.0, 119.2], [121.0, 121.19], [122.0, 123.28], [125.0, 124.7], [127.0, 127.26], [130.0, 130.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 59.59, 0.0, 0.0, 0.0, 99.05, 0.0, 0.0, 48.27, 0.0, 0.0, 0.0, 86.27, 0.0, 0.0, 0.0, 0.0, 96.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 62.4], ["noise", 17.54], ["sidetone", 4.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 0.81, 0.31, 1.6, 6.11, 1.35, 1.02, 1.31, 3.19, 0.68, 1.22, 6.25, 0.32, 1.86, 0.65, 5.48, 0.83, 0.85, 0.39, 0.53, 4.28, 0.82, 0.2, 0.19, 1.28, -0.3, 0.26, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/iN0ZnG7yo6o_filtered.json b/annotations_filtered/iN0ZnG7yo6o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ba09679bceadffb683e5938ead19d1ba7f27a4f --- /dev/null +++ b/annotations_filtered/iN0ZnG7yo6o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.51], [5.0, 12.18], [14.0, 14.35], [16.0, 18.94], [20.0, 20.26], [21.0, 22.01], [27.0, 30.74], [37.0, 36.86], [44.0, 44.05], [49.0, 50.11], [51.0, 50.77], [54.0, 56.46], [58.0, 57.84], [60.0, 63.91], [65.0, 65.67], [67.0, 67.68], [70.0, 70.73], [72.0, 73.72], [77.0, 77.48], [78.0, 79.56], [81.0, 85.23], [86.0, 86.73], [93.0, 106.51], [112.0, 127.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.76, 0.0, 98.44, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 94.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.23, 0.0, 30.78, 30.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 72.47], ["singing", 2.82], ["rock and roll", 1.48]], [["music", 77.37], ["singing", 5.04], ["song", 2.06]]], "duration": [0.51, 7.18, 0.35, 2.94, 0.26, 1.01, 3.74, -0.14, 0.05, 1.11, -0.23, 2.46, -0.16, 3.91, 0.67, 0.68, 0.73, 1.72, 0.48, 1.56, 4.23, 0.73, 13.51, 15.25]} \ No newline at end of file diff --git a/annotations_filtered/iNQYIdE6DOg_filtered.json b/annotations_filtered/iNQYIdE6DOg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2382046f39e854c358d126e279013ca1e2d67ded --- /dev/null +++ b/annotations_filtered/iNQYIdE6DOg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 35.19], [44.0, 44.17], [46.0, 46.8], [49.0, 48.9], [51.0, 51.14], [52.0, 52.62], [54.0, 55.14], [56.0, 57.35], [58.0, 57.84], [58.0, 70.43], [73.0, 73.03], [74.0, 76.17], [78.0, 78.43], [81.0, 81.45], [84.0, 128.38], [131.0, 131.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.16, 0.0, 50.16, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 50.0], ["hum", 12.21], ["mains hum", 11.43]], null, null, null, null, null, null], "duration": [0.19, 0.17, 0.8, -0.1, 0.14, 0.62, 1.14, 1.35, -0.16, 12.43, 0.03, 2.17, 0.43, 0.45, 44.38, 0.11]} \ No newline at end of file diff --git a/annotations_filtered/iNSN6QhIWeA_filtered.json b/annotations_filtered/iNSN6QhIWeA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b09773ceb17397e22bd85d58400a60b191b4adaa --- /dev/null +++ b/annotations_filtered/iNSN6QhIWeA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.32], [22.0, 22.6], [23.0, 30.23], [31.0, 34.75], [35.0, 37.83], [38.0, 43.12], [44.0, 44.22], [46.0, 47.85], [49.0, 49.11], [51.0, 50.82], [53.0, 56.89], [59.0, 59.7], [61.0, 61.47], [63.0, 65.45], [68.0, 109.22], [110.0, 114.62]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 46.09, 64.52, 54.3, 51.6, 0.0, 0.0, 0.0, 0.0, 63.31, 0.0, 0.0, 56.86, 0.0, 29.35], "audiomae_on_audioset": [null, null, [["speech", 27.63], ["music", 11.4], ["rumble", 3.86]], null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 34.89], ["hum", 29.64], ["throbbing", 8.15]]], "duration": [0.32, 0.6, 7.23, 3.75, 2.83, 5.12, 0.22, 1.85, 0.11, -0.18, 3.89, 0.7, 0.47, 2.45, 41.22, 4.62]} \ No newline at end of file diff --git a/annotations_filtered/iNUv6pnKd5s_filtered.json b/annotations_filtered/iNUv6pnKd5s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c30a09fc4c809a695929c86a0de6c2f87e65977f --- /dev/null +++ b/annotations_filtered/iNUv6pnKd5s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 17.34], [20.0, 25.69], [27.0, 27.13], [31.0, 31.5], [32.0, 32.32], [34.0, 41.35], [42.0, 43.28]], "keep_status": [true, true, false, false, false, true, false], "silence_prob": [30.72, 33.42, 0.0, 0.0, 0.0, 33.03, 0.0], "audiomae_on_audioset": [[["music", 16.01], ["hum", 13.84], ["livestock, farm animals, working animals", 11.52]], [["music", 62.5], ["synthesizer", 2.75], ["foghorn", 2.46]], null, null, null, [["music", 47.97], ["hum", 10.02], ["throbbing", 9.01]], null], "duration": [14.34, 5.69, 0.13, 0.5, 0.32, 7.35, 1.28]} \ No newline at end of file diff --git a/annotations_filtered/iNa97wFdFyE_filtered.json b/annotations_filtered/iNa97wFdFyE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7e63a7ba78063bfd46715b3383b0da4ee4608be --- /dev/null +++ b/annotations_filtered/iNa97wFdFyE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.63], [8.0, 7.97], [9.0, 11.3], [18.0, 17.81], [20.0, 21.1], [25.0, 25.49], [51.0, 51.8], [75.0, 75.69], [77.0, 83.08]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 68.28, 0.0, 0.0, 0.0, 0.0, 0.0, 63.74], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.63, -0.03, 2.3, -0.19, 1.1, 0.49, 0.8, 0.69, 6.08]} \ No newline at end of file diff --git a/annotations_filtered/iNg7uRYtqLA_filtered.json b/annotations_filtered/iNg7uRYtqLA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de42fb29d09f614922dc4d52906a72c0d9c60d23 --- /dev/null +++ b/annotations_filtered/iNg7uRYtqLA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 17.79], [18.0, 20.43], [25.0, 26.62], [27.0, 37.67], [38.0, 38.47], [42.0, 48.86], [52.0, 58.21], [60.0, 75.36], [78.0, 97.55], [98.0, 107.03], [109.0, 132.07], [142.0, 145.44], [153.0, 156.46], [164.0, 165.69], [178.0, 179.69], [193.0, 196.72], [197.0, 198.29]], "keep_status": [false, false, false, true, false, true, true, true, false, false, false, false, false, false, false, true, false], "silence_prob": [40.81, 46.43, 0.0, 38.63, 0.0, 32.36, 30.49, 31.31, 31.69, 35.87, 42.19, 33.04, 33.88, 0.0, 0.0, 32.25, 0.0], "audiomae_on_audioset": [[["music", 42.66], ["speech", 31.83], ["theremin", 4.13]], [["speech", 40.16], ["music", 34.45], ["hum", 4.63]], null, [["music", 23.12], ["fly, housefly", 12.33], ["speech", 7.66]], null, [["speech", 14.67], ["mosquito", 11.63], ["whack, thwack", 10.97]], [["music", 25.1], ["hum", 17.48], ["throbbing", 12.71]], [["music", 23.19], ["speech", 19.57], ["throbbing", 13.49]], [["speech", 61.13], ["music", 18.55], ["explosion", 1.68]], [["livestock, farm animals, working animals", 41.55], ["cattle, bovinae", 31.81], ["moo", 20.57]], [["music", 74.15], ["electronic music", 3.89], ["techno", 2.95]], [["music", 61.91], ["electronic music", 5.18], ["speech", 4.81]], [["music", 77.83], ["didgeridoo", 5.8], ["musical instrument", 3.94]], null, null, [["music", 26.32], ["cattle, bovinae", 17.57], ["moo", 10.78]], null], "duration": [5.79, 2.43, 1.62, 10.67, 0.47, 6.86, 6.21, 15.36, 19.55, 9.03, 23.07, 3.44, 3.46, 1.69, 1.69, 3.72, 1.29]} \ No newline at end of file diff --git a/annotations_filtered/iNxUsONmig8_filtered.json b/annotations_filtered/iNxUsONmig8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4476572cd79517bffe3f112c029d53108f0256a3 --- /dev/null +++ b/annotations_filtered/iNxUsONmig8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.72], [12.0, 12.92], [18.0, 19.79], [23.0, 26.94], [34.0, 35.04], [36.0, 39.02], [41.0, 43.58], [50.0, 50.6], [52.0, 53.1], [54.0, 54.62], [59.0, 59.17], [62.0, 62.99], [67.0, 68.39], [71.0, 71.56], [73.0, 74.24], [84.0, 84.94], [94.0, 95.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.72, 0.92, 1.79, 3.94, 1.04, 3.02, 2.58, 0.6, 1.1, 0.62, 0.17, 0.99, 1.39, 0.56, 1.24, 0.94, 1.25]} \ No newline at end of file diff --git a/annotations_filtered/iOGo0EHHtCo_filtered.json b/annotations_filtered/iOGo0EHHtCo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9d399bef5c1bcb19e134590ad1cc3a165eabbfb --- /dev/null +++ b/annotations_filtered/iOGo0EHHtCo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.18], [21.0, 21.3]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.18, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/iOHElDaRs5E_filtered.json b/annotations_filtered/iOHElDaRs5E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08a01bba54700e65e8e7585b765c90e19b3af530 --- /dev/null +++ b/annotations_filtered/iOHElDaRs5E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.5], [19.0, 19.31], [30.0, 29.98], [38.0, 39.26], [41.0, 41.4], [42.0, 43.09], [52.0, 52.96], [54.0, 56.3], [57.0, 59.02], [70.0, 71.51], [78.0, 83.73], [89.0, 90.1], [91.0, 92.7], [105.0, 105.75], [110.0, 111.1], [112.0, 114.76], [122.0, 122.27], [126.0, 127.11], [129.0, 129.64], [137.0, 137.62], [139.0, 139.53], [147.0, 156.88], [160.0, 161.99], [171.0, 172.67]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.55, 41.74, 0.0, 76.7, 0.0, 0.0, 0.0, 0.0, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["sidetone", 29.7], ["speech", 21.25], ["music", 11.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.5, 0.31, -0.02, 1.26, 0.4, 1.09, 0.96, 2.3, 2.02, 1.51, 5.73, 1.1, 1.7, 0.75, 1.1, 2.76, 0.27, 1.11, 0.64, 0.62, 0.53, 9.88, 1.99, 1.67]} \ No newline at end of file diff --git a/annotations_filtered/iOMuP1qEKUc_filtered.json b/annotations_filtered/iOMuP1qEKUc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6733cd1cfd8a181bb2fd37cf1609473c79ec7f57 --- /dev/null +++ b/annotations_filtered/iOMuP1qEKUc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.37], [11.0, 41.39], [45.0, 45.99], [72.0, 75.44], [75.0, 75.47], [76.0, 76.64], [79.0, 80.27], [81.0, 80.69], [81.0, 88.47], [95.0, 95.69]], "keep_status": [false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 33.69, 0.0, 0.0, 0.0, 0.0, 29.95, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 56.34], ["beatboxing", 15.88], ["didgeridoo", 6.55]], null, null, null, null, [["speech", 17.6], ["crowd", 16.5], ["cheering", 9.74]], null], "duration": [1.37, 30.39, 0.99, 3.44, 0.47, 0.64, 1.27, -0.31, 7.47, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/iOaD5cZNw0E_filtered.json b/annotations_filtered/iOaD5cZNw0E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2ff3db1b460ee290acb2c842ea7af6cbd070a3b --- /dev/null +++ b/annotations_filtered/iOaD5cZNw0E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 15.11], [16.0, 22.33], [24.0, 28.92], [33.0, 34.05], [34.0, 34.92], [42.0, 43.9], [45.0, 47.33], [49.0, 51.12], [53.0, 53.77], [55.0, 55.78], [57.0, 57.2], [58.0, 58.75], [60.0, 61.48], [62.0, 62.26], [63.0, 64.05], [65.0, 66.63], [67.0, 67.51], [71.0, 71.2], [78.0, 78.11], [78.0, 79.56], [81.0, 81.06], [81.0, 84.77], [86.0, 88.4], [90.0, 91.79], [97.0, 100.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 59.96, 71.43, 0.0, 0.0, 0.0, 78.21, 51.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 93.76, 0.0, 93.45], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [12.11, 6.33, 4.92, 1.05, 0.92, 1.9, 2.33, 2.12, 0.77, 0.78, 0.2, 0.75, 1.48, 0.26, 1.05, 1.63, 0.51, 0.2, 0.11, 1.56, 0.06, 3.77, 2.4, 1.79, 3.08]} \ No newline at end of file diff --git a/annotations_filtered/iP7_QcV9Q9s_filtered.json b/annotations_filtered/iP7_QcV9Q9s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76c38f91cd2add1dfa934963f9f025f1eba02d2e --- /dev/null +++ b/annotations_filtered/iP7_QcV9Q9s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.43], [9.0, 10.32], [21.0, 23.62], [40.0, 40.96], [42.0, 43.11], [45.0, 45.69], [48.0, 48.51], [50.0, 50.31], [57.0, 58.04], [60.0, 61.16], [62.0, 62.33], [63.0, 63.68], [66.0, 69.97], [76.0, 80.05], [83.0, 84.84], [87.0, 87.25], [92.0, 93.51], [94.0, 96.36], [98.0, 103.47], [111.0, 112.63], [118.0, 135.89], [140.0, 139.82], [141.0, 145.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 49.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.07, 29.35, 0.0, 0.0, 0.0, 30.47, 28.78, 0.0, 28.68, 0.0, 29.06], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 42.81], ["moo", 40.6], ["livestock, farm animals, working animals", 14.68]], null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 37.72], ["livestock, farm animals, working animals", 34.95], ["moo", 26.95]], [["music", 66.32], ["speech", 5.64], ["boing", 3.85]], null, null, null, [["music", 37.74], ["speech", 18.44], ["sidetone", 9.07]], [["cattle, bovinae", 38.4], ["livestock, farm animals, working animals", 31.4], ["moo", 27.33]], null, [["music", 86.77], ["cattle, bovinae", 2.37], ["speech", 1.48]], null, [["music", 58.63], ["speech", 8.87], ["throbbing", 7.62]]], "duration": [1.43, 1.32, 2.62, 0.96, 1.11, 0.69, 0.51, 0.31, 1.04, 1.16, 0.33, 0.68, 3.97, 4.05, 1.84, 0.25, 1.51, 2.36, 5.47, 1.63, 17.89, -0.18, 4.29]} \ No newline at end of file diff --git a/annotations_filtered/iPQfwmfRq2s_filtered.json b/annotations_filtered/iPQfwmfRq2s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60eb3968f3063a342e3b82f99780944782a59f23 --- /dev/null +++ b/annotations_filtered/iPQfwmfRq2s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.8], [7.0, 8.01], [9.0, 9.75], [11.0, 11.62], [15.0, 21.63], [23.0, 26.05], [29.0, 37.88], [39.0, 82.49], [84.0, 90.96], [93.0, 95.18], [96.0, 100.45], [102.0, 112.87]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, true], "silence_prob": [84.62, 0.0, 0.0, 0.0, 90.6, 68.8, 39.75, 0.0, 36.9, 47.27, 49.18, 29.32], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 24.9], ["gong", 18.76], ["music", 15.54]], null, [["music", 53.13], ["scary music", 6.15], ["synthesizer", 5.31]], [["music", 43.92], ["theremin", 38.2], ["musical instrument", 3.5]], [["music", 61.52], ["theremin", 9.2], ["musical instrument", 5.59]], [["music", 51.3], ["reverberation", 6.67], ["musical instrument", 5.09]]], "duration": [3.8, 1.01, 0.75, 0.62, 6.63, 3.05, 8.88, 43.49, 6.96, 2.18, 4.45, 10.87]} \ No newline at end of file diff --git a/annotations_filtered/iPcAns5pKVw_filtered.json b/annotations_filtered/iPcAns5pKVw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b99a5b722d0c12f6fa69a112872804eee35eaf9 --- /dev/null +++ b/annotations_filtered/iPcAns5pKVw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.97], [20.0, 19.89], [24.0, 27.36], [28.0, 29.69], [31.0, 36.15], [41.0, 43.93], [46.0, 52.59], [56.0, 57.2], [62.0, 64.83], [66.0, 66.95], [72.0, 90.22], [92.0, 93.39], [94.0, 98.79], [105.0, 125.83]], "keep_status": [false, false, true, false, true, true, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 30.16, 0.0, 30.08, 29.95, 29.49, 0.0, 29.58, 0.0, 29.56, 0.0, 29.67, 33.46], "audiomae_on_audioset": [null, null, [["sidetone", 29.26], ["speech", 14.49], ["vehicle", 11.04]], null, [["speech", 52.06], ["vehicle", 7.75], ["fixed-wing aircraft, airplane", 6.15]], [["cattle, bovinae", 16.77], ["moo", 14.72], ["livestock, farm animals, working animals", 10.88]], [["cattle, bovinae", 43.7], ["livestock, farm animals, working animals", 30.29], ["moo", 20.44]], null, [["speech", 16.06], ["vehicle", 9.58], ["noise", 5.16]], null, [["cattle, bovinae", 45.92], ["livestock, farm animals, working animals", 30.05], ["moo", 17.95]], null, [["livestock, farm animals, working animals", 42.48], ["cattle, bovinae", 34.51], ["moo", 19.46]], [["grunt", 39.95], ["speech", 11.87], ["sound effect", 9.24]]], "duration": [1.97, -0.11, 3.36, 1.69, 5.15, 2.93, 6.59, 1.2, 2.83, 0.95, 18.22, 1.39, 4.79, 20.83]} \ No newline at end of file diff --git a/annotations_filtered/iPgcg3DVoUY_filtered.json b/annotations_filtered/iPgcg3DVoUY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37e4dd9ad8748b4f7d5926a58474dd18d1c03a03 --- /dev/null +++ b/annotations_filtered/iPgcg3DVoUY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.24], [14.0, 16.61], [20.0, 20.53], [23.0, 23.84], [26.0, 27.21], [32.0, 39.5], [41.0, 42.16], [45.0, 55.39], [63.0, 64.77], [66.0, 66.16], [67.0, 69.11], [73.0, 76.01], [77.0, 79.88], [82.0, 83.52], [87.0, 87.99], [89.0, 89.63], [91.0, 95.0], [98.0, 100.01], [103.0, 103.5], [105.0, 106.17], [108.0, 110.54], [114.0, 116.5], [120.0, 123.36]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false, true, false, true], "silence_prob": [0.0, 30.36, 0.0, 0.0, 0.0, 29.54, 0.0, 28.32, 0.0, 0.0, 29.17, 30.41, 31.22, 0.0, 0.0, 0.0, 30.44, 32.84, 0.0, 0.0, 31.55, 31.06, 31.17], "audiomae_on_audioset": [null, [["music", 18.2], ["hum", 13.3], ["rumble", 11.14]], null, null, null, [["hum", 48.62], ["throbbing", 22.18], ["mains hum", 17.12]], null, [["hum", 38.76], ["mains hum", 37.22], ["music", 6.62]], null, null, [["music", 63.03], ["throbbing", 5.35], ["hum", 5.02]], [["hum", 51.17], ["mains hum", 20.49], ["throbbing", 12.41]], [["speech", 33.3], ["hum", 20.47], ["music", 11.71]], null, null, null, [["music", 31.42], ["hum", 26.02], ["mains hum", 9.59]], [["mains hum", 16.11], ["hum", 14.05], ["music", 11.7]], null, null, [["speech", 34.56], ["hum", 14.86], ["mains hum", 10.37]], [["hum", 47.47], ["mains hum", 33.78], ["throbbing", 6.57]], [["music", 24.81], ["speech", 21.28], ["hum", 13.02]]], "duration": [0.24, 2.61, 0.53, 0.84, 1.21, 7.5, 1.16, 10.39, 1.77, 0.16, 2.11, 3.01, 2.88, 1.52, 0.99, 0.63, 4.0, 2.01, 0.5, 1.17, 2.54, 2.5, 3.36]} \ No newline at end of file diff --git a/annotations_filtered/iPt2PNpjOq4_filtered.json b/annotations_filtered/iPt2PNpjOq4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/iPt2PNpjOq4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/iQISI7DOVCY_filtered.json b/annotations_filtered/iQISI7DOVCY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..007a187369fe526b3580b276b2c5670b40e87cfb --- /dev/null +++ b/annotations_filtered/iQISI7DOVCY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 25.19], [26.0, 31.7], [34.0, 37.67], [39.0, 62.38], [63.0, 73.99], [74.0, 75.71], [76.0, 81.87], [90.0, 92.25], [93.0, 94.76], [105.0, 106.39], [110.0, 111.94], [115.0, 128.98], [130.0, 131.31]], "keep_status": [false, true, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 42.33, 35.03, 30.58, 32.92, 0.0, 59.77, 76.86, 0.0, 0.0, 0.0, 56.48, 0.0], "audiomae_on_audioset": [null, [["speech", 27.98], ["music", 13.16], ["car", 10.41]], [["music", 25.67], ["hum", 23.32], ["speech", 15.61]], [["music", 89.12], ["throbbing", 2.28], ["scary music", 1.03]], [["music", 24.7], ["didgeridoo", 18.73], ["speech", 13.88]], null, null, null, null, null, null, null, null], "duration": [1.19, 5.7, 3.67, 23.38, 10.99, 1.71, 5.87, 2.25, 1.76, 1.39, 1.94, 13.98, 1.31]} \ No newline at end of file diff --git a/annotations_filtered/iQJh6I8kH_E_filtered.json b/annotations_filtered/iQJh6I8kH_E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/iQJh6I8kH_E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/iR-4e37VUPo_filtered.json b/annotations_filtered/iR-4e37VUPo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7694fab2b012d0008abd070eed8300edce7507c --- /dev/null +++ b/annotations_filtered/iR-4e37VUPo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 42.94], [43.0, 44.46], [46.0, 47.34], [65.0, 67.95]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.09], "audiomae_on_audioset": [null, null, null, [["grunt", 32.22], ["groan", 28.15], ["speech", 18.2]]], "duration": [1.94, 1.46, 1.34, 2.95]} \ No newline at end of file diff --git a/annotations_filtered/iRIIcZuSiBo_filtered.json b/annotations_filtered/iRIIcZuSiBo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8e465b4beedeedec3575a55d46ad754efa62264 --- /dev/null +++ b/annotations_filtered/iRIIcZuSiBo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.99], [6.0, 6.64], [9.0, 14.61], [15.0, 14.99], [16.0, 43.88], [44.0, 79.86]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.35, 0.0, 33.63, 0.0], "audiomae_on_audioset": [null, null, [["livestock, farm animals, working animals", 34.21], ["moo", 23.61], ["cattle, bovinae", 22.54]], null, [["music", 64.45], ["speech", 8.87], ["electronic music", 4.11]], null], "duration": [0.99, 0.64, 5.61, -0.01, 27.88, 35.86]} \ No newline at end of file diff --git a/annotations_filtered/iRIxb6_ELNg_filtered.json b/annotations_filtered/iRIxb6_ELNg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a79b81aa78dfaeca644b1dc9175846b06e1f1501 --- /dev/null +++ b/annotations_filtered/iRIxb6_ELNg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.55], [9.0, 11.48], [13.0, 18.17], [19.0, 21.09], [22.0, 27.04], [29.0, 31.46], [33.0, 38.35], [39.0, 43.12], [44.0, 49.1], [49.0, 51.54], [52.0, 64.18], [66.0, 67.88], [70.0, 72.01], [79.0, 80.0], [84.0, 84.45], [97.0, 98.66], [106.0, 106.88], [116.0, 116.99]], "keep_status": [true, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false], "silence_prob": [48.82, 87.74, 92.15, 94.81, 95.09, 92.97, 96.29, 42.11, 49.78, 49.97, 99.95, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 24.65], ["guitar", 16.09], ["speech", 15.29]], null, null, null, null, null, null, [["speech", 30.84], ["sine wave", 18.99], ["dial tone", 16.16]], [["speech", 50.49], ["sidetone", 13.32], ["sine wave", 4.99]], [["speech", 53.33], ["hiccup", 3.8], ["sine wave", 3.7]], null, null, null, null, null, null, null, null], "duration": [3.55, 2.48, 5.17, 2.09, 5.04, 2.46, 5.35, 4.12, 5.1, 2.54, 12.18, 1.88, 2.01, 1.0, 0.45, 1.66, 0.88, 0.99]} \ No newline at end of file diff --git a/annotations_filtered/iRd63BXG6nE_filtered.json b/annotations_filtered/iRd63BXG6nE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8ee0d99fdf02315bf03afa446601ff2d79a244d --- /dev/null +++ b/annotations_filtered/iRd63BXG6nE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.58], [12.0, 22.35], [23.0, 23.9], [26.0, 30.74], [35.0, 35.82], [37.0, 45.76], [46.0, 50.53], [52.0, 52.86], [53.0, 54.57], [55.0, 55.53], [57.0, 57.28], [58.0, 60.02], [63.0, 62.97], [71.0, 71.47], [73.0, 75.36], [78.0, 79.15], [80.0, 80.72], [87.0, 87.86], [89.0, 89.63], [91.0, 91.44], [99.0, 99.12], [100.0, 102.79], [106.0, 106.83], [111.0, 116.11], [120.0, 120.09], [124.0, 123.77], [125.0, 125.83], [127.0, 126.66], [127.0, 126.74], [127.0, 126.77], [128.0, 128.46], [139.0, 139.72], [140.0, 141.59], [142.0, 146.38], [147.0, 149.27], [151.0, 151.82], [152.0, 167.39], [168.0, 168.89], [170.0, 173.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.44, 83.52, 0.0, 94.37, 0.0, 91.3, 84.25, 0.0, 0.0, 0.0, 0.0, 99.62, 0.0, 0.0, 95.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.91, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82, 99.44, 0.0, 99.44, 0.0, 97.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.58, 10.35, 0.9, 4.74, 0.82, 8.76, 4.53, 0.86, 1.57, 0.53, 0.28, 2.02, -0.03, 0.47, 2.36, 1.15, 0.72, 0.86, 0.63, 0.44, 0.12, 2.79, 0.83, 5.11, 0.09, -0.23, 0.83, -0.34, -0.26, -0.23, 0.46, 0.72, 1.59, 4.38, 2.27, 0.82, 15.39, 0.89, 3.77]} \ No newline at end of file diff --git a/annotations_filtered/iRdSH-u1wWI_filtered.json b/annotations_filtered/iRdSH-u1wWI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99ef1ed4d38b8c70d42e6de9240ac89e8d0a59ea --- /dev/null +++ b/annotations_filtered/iRdSH-u1wWI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 43.34], [44.0, 44.64], [66.0, 66.24], [71.0, 81.45]], "keep_status": [true, false, false, true], "silence_prob": [30.21, 0.0, 0.0, 28.25], "audiomae_on_audioset": [[["didgeridoo", 27.86], ["music", 20.62], ["foghorn", 8.54]], null, null, [["music", 27.59], ["speech", 20.49], ["fly, housefly", 4.98]]], "duration": [19.34, 0.64, 0.24, 10.45]} \ No newline at end of file diff --git a/annotations_filtered/iRdTetA_Dqo_filtered.json b/annotations_filtered/iRdTetA_Dqo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9dd2b39d6b25fbc8e5a27bceaa4bbe01f8c7a224 --- /dev/null +++ b/annotations_filtered/iRdTetA_Dqo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.72], [9.0, 10.18], [19.0, 19.04], [21.0, 20.66], [21.0, 24.58], [29.0, 29.73], [51.0, 57.67], [59.0, 60.12], [62.0, 63.39], [66.0, 66.58], [68.0, 68.84], [71.0, 72.13], [75.0, 75.84], [79.0, 80.64], [83.0, 87.42]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.91, 0.0, 0.0, 0.0, 45.46, 0.0, 98.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.07], "audiomae_on_audioset": [[["speech", 54.05], ["music", 9.2], ["hum", 3.77]], null, null, null, [["speech", 29.48], ["throbbing", 22.63], ["sidetone", 17.5]], null, null, null, null, null, null, null, null, null, null], "duration": [3.72, 1.18, 0.04, -0.34, 3.58, 0.73, 6.67, 1.12, 1.39, 0.58, 0.84, 1.13, 0.84, 1.64, 4.42]} \ No newline at end of file diff --git a/annotations_filtered/iReLGcSZtwI_filtered.json b/annotations_filtered/iReLGcSZtwI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87cc3ff036f2f7a1b165f968f2e7e6a3a1f3a5cf --- /dev/null +++ b/annotations_filtered/iReLGcSZtwI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.1], [14.0, 47.68]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.1, 33.68]} \ No newline at end of file diff --git a/annotations_filtered/iRmIef02Ajk_filtered.json b/annotations_filtered/iRmIef02Ajk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3dcbd3496dd6fb6e992e15a0b6604c44c63f881 --- /dev/null +++ b/annotations_filtered/iRmIef02Ajk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.99], [6.0, 6.98], [11.0, 11.64], [13.0, 13.9], [18.0, 18.86], [20.0, 21.57], [23.0, 23.92], [25.0, 26.3], [30.0, 34.03], [36.0, 36.66], [37.0, 42.79], [44.0, 45.49], [47.0, 55.38], [57.0, 67.31], [69.0, 70.43], [72.0, 72.89], [74.0, 75.24], [76.0, 78.68], [80.0, 80.22], [82.0, 85.28], [87.0, 93.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 47.9, 0.0, 32.08, 29.95, 0.0, 0.0, 0.0, 33.34, 0.0, 36.73, 31.34], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 20.49], ["music", 17.95], ["singing bowl", 16.49]], null, [["music", 33.66], ["theremin", 21.13], ["wind instrument, woodwind instrument", 11.66]], [["music", 48.31], ["musical instrument", 9.43], ["theremin", 6.4]], null, null, null, [["theremin", 62.58], ["music", 20.77], ["musical instrument", 4.32]], null, [["music", 45.62], ["musical instrument", 14.41], ["theremin", 9.7]], [["theremin", 39.49], ["music", 27.71], ["violin, fiddle", 6.11]]], "duration": [1.99, 0.98, 0.64, 0.9, 0.86, 1.57, 0.92, 1.3, 4.03, 0.66, 5.79, 1.49, 8.38, 10.31, 1.43, 0.89, 1.24, 2.68, 0.22, 3.28, 6.45]} \ No newline at end of file diff --git a/annotations_filtered/iRmtQ5DlvuQ_filtered.json b/annotations_filtered/iRmtQ5DlvuQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fdbeb3a508893788aa90913bbddc249d0b884fc9 --- /dev/null +++ b/annotations_filtered/iRmtQ5DlvuQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.92], [6.0, 9.46], [10.0, 14.25], [16.0, 37.94], [39.0, 44.02]], "keep_status": [false, false, false, true, true], "silence_prob": [0.0, 89.72, 79.59, 33.71, 33.85], "audiomae_on_audioset": [null, null, null, [["speech", 30.77], ["music", 29.29], ["hum", 7.11]], [["explosion", 27.58], ["fly, housefly", 11.1], ["music", 8.15]]], "duration": [0.92, 3.46, 4.25, 21.94, 5.02]} \ No newline at end of file diff --git a/annotations_filtered/iSio5xjSYqs_filtered.json b/annotations_filtered/iSio5xjSYqs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5eea7217cdb76ced5bd0bb440b1a2f91bca3938e --- /dev/null +++ b/annotations_filtered/iSio5xjSYqs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 24.41], [26.0, 76.89], [79.0, 86.14], [91.0, 103.32], [107.0, 126.3]], "keep_status": [false, false, true, true, true], "silence_prob": [30.03, 0.0, 29.38, 29.56, 29.11], "audiomae_on_audioset": [[["hum", 44.72], ["throbbing", 24.36], ["mains hum", 14.49]], null, [["hum", 27.01], ["mains hum", 25.65], ["music", 10.89]], [["music", 31.96], ["hum", 15.15], ["mains hum", 12.85]], [["buzz", 14.22], ["electric shaver, electric razor", 13.21], ["music", 12.33]]], "duration": [19.41, 50.89, 7.14, 12.32, 19.3]} \ No newline at end of file diff --git a/annotations_filtered/iTLUzEjV3Bg_filtered.json b/annotations_filtered/iTLUzEjV3Bg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a950f5c5c74fd980e05923d871049e315db7885e --- /dev/null +++ b/annotations_filtered/iTLUzEjV3Bg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.43], [4.0, 4.8], [6.0, 9.93], [14.0, 18.49], [20.0, 22.87], [24.0, 28.24], [33.0, 33.44], [34.0, 34.92], [39.0, 39.18], [47.0, 48.19], [53.0, 53.76], [56.0, 57.16], [70.0, 70.61], [74.0, 74.88], [76.0, 76.94], [81.0, 80.76], [90.0, 91.4], [96.0, 97.63], [98.0, 100.2], [103.0, 103.55], [105.0, 107.27], [109.0, 111.81]], "keep_status": [false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 33.28, 34.38, 32.3, 35.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.15, 0.0, 78.72, 34.56], "audiomae_on_audioset": [null, null, [["music", 26.72], ["hum", 20.6], ["mains hum", 10.87]], [["music", 58.29], ["ambient music", 7.34], ["hum", 6.86]], [["music", 26.89], ["didgeridoo", 20.27], ["musical instrument", 7.77]], [["hum", 32.69], ["mains hum", 20.52], ["didgeridoo", 10.6]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.97], ["hum", 13.72], ["throbbing", 7.74]]], "duration": [0.43, 0.8, 3.93, 4.49, 2.87, 4.24, 0.44, 0.92, 0.18, 1.19, 0.76, 1.16, 0.61, 0.88, 0.94, -0.24, 1.4, 1.63, 2.2, 0.55, 2.27, 2.81]} \ No newline at end of file diff --git a/annotations_filtered/iTQ4b0d3HxM_filtered.json b/annotations_filtered/iTQ4b0d3HxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..478192bfffb3ffbcd3fd969894d7355c90393a75 --- /dev/null +++ b/annotations_filtered/iTQ4b0d3HxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.27], [9.0, 9.58], [11.0, 12.07], [17.0, 17.09], [19.0, 18.79], [21.0, 21.42], [23.0, 23.38], [28.0, 28.65], [34.0, 34.87], [37.0, 37.57], [38.0, 39.82], [51.0, 51.63], [53.0, 53.7], [59.0, 60.13], [66.0, 69.4], [70.0, 71.39], [73.0, 73.75], [77.0, 78.16], [80.0, 80.7], [83.0, 83.49], [87.0, 92.91], [104.0, 110.19], [113.0, 117.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.1, 0.0, 0.0, 0.0, 0.0, 0.0, 40.68, 48.52, 54.5], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 23.29], ["mains hum", 15.95], ["throbbing", 6.95]], null, null, null, null, null, [["hum", 40.54], ["mains hum", 24.51], ["speech", 11.41]], [["hum", 62.34], ["mains hum", 19.0], ["throbbing", 9.37]], null], "duration": [1.27, 0.58, 1.07, 0.09, -0.21, 0.42, 0.38, 0.65, 0.87, 0.57, 1.82, 0.63, 0.7, 1.13, 3.4, 1.39, 0.75, 1.16, 0.7, 0.49, 5.91, 6.19, 4.66]} \ No newline at end of file diff --git a/annotations_filtered/iTXqcn1qyCk_filtered.json b/annotations_filtered/iTXqcn1qyCk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de8f311f9059abc938f1abf79c0b4afe0ceff914 --- /dev/null +++ b/annotations_filtered/iTXqcn1qyCk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.3], [10.0, 11.2], [16.0, 16.39], [18.0, 19.23], [20.0, 20.04], [21.0, 22.33], [23.0, 24.58], [27.0, 28.29], [29.0, 29.34], [30.0, 31.13], [33.0, 33.66], [35.0, 36.09], [37.0, 37.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.3, 1.2, 0.39, 1.23, 0.04, 1.33, 1.58, 1.29, 0.34, 1.13, 0.66, 1.09, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/iTiWC8GpOgM_filtered.json b/annotations_filtered/iTiWC8GpOgM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9053faad007203090ee9e6082327f6f73289d290 --- /dev/null +++ b/annotations_filtered/iTiWC8GpOgM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.94], [15.0, 16.28], [17.0, 16.63], [17.0, 17.91], [21.0, 22.67], [23.0, 25.19], [27.0, 28.48], [29.0, 30.25], [31.0, 31.87], [33.0, 33.56], [34.0, 35.29], [36.0, 37.5], [38.0, 38.31], [43.0, 47.17], [50.0, 49.59], [50.0, 51.66]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.63, 0.0, 0.0, 0.0, 0.0, 73.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.27, 0.0, 0.0], "audiomae_on_audioset": [[["animal", 32.23], ["speech", 26.58], ["whale vocalization", 8.25]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.94, 1.28, -0.37, 0.91, 1.67, 2.19, 1.48, 1.25, 0.87, 0.56, 1.29, 1.5, 0.31, 4.17, -0.41, 1.66]} \ No newline at end of file diff --git a/annotations_filtered/iTlkXQH-sdg_filtered.json b/annotations_filtered/iTlkXQH-sdg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c46035dbe355bb6be9bf23ed03cbe1b39fbb070e --- /dev/null +++ b/annotations_filtered/iTlkXQH-sdg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.1], [5.0, 6.03], [8.0, 8.97], [13.0, 26.08], [30.0, 30.89], [34.0, 34.57], [38.0, 39.01], [40.0, 41.47], [44.0, 45.35], [46.0, 47.55], [51.0, 62.36], [64.0, 79.78], [82.0, 126.94]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.68, 31.77, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 32.85], ["hum", 22.39], ["mains hum", 14.45]], null, null, null, null, null, null, [["music", 38.67], ["hum", 29.23], ["throbbing", 14.39]], [["music", 74.3], ["throbbing", 5.25], ["musical instrument", 4.42]], null], "duration": [1.1, 1.03, 0.97, 13.08, 0.89, 0.57, 1.01, 1.47, 1.35, 1.55, 11.36, 15.78, 44.94]} \ No newline at end of file diff --git a/annotations_filtered/iTwIwfvNJLk_filtered.json b/annotations_filtered/iTwIwfvNJLk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a07af9e0cfe9e942c7dcd5094d6a5e68cdcf3704 --- /dev/null +++ b/annotations_filtered/iTwIwfvNJLk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [1.0, 0.58], [2.0, 2.44], [4.0, 5.76], [11.0, 11.08], [12.0, 14.47], [16.0, 16.73], [19.0, 20.14], [21.0, 22.44], [24.0, 24.56], [26.0, 30.1], [32.0, 32.53], [34.0, 34.94], [36.0, 36.56], [41.0, 42.43], [43.0, 43.44], [50.0, 50.43], [55.0, 55.71], [57.0, 57.99], [60.0, 62.45], [64.0, 65.58], [69.0, 68.89], [72.0, 72.84], [74.0, 74.53], [75.0, 77.55], [79.0, 81.68], [84.0, 85.21], [87.0, 88.91], [90.0, 91.18], [96.0, 97.38], [99.0, 99.18], [101.0, 101.7], [104.0, 104.63], [106.0, 106.81], [108.0, 116.4], [123.0, 123.94], [126.0, 127.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.53, 0.0, 0.0, 0.0, 0.0, 88.1, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.81, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, -0.42, 0.44, 1.76, 0.08, 2.47, 0.73, 1.14, 1.44, 0.56, 4.1, 0.53, 0.94, 0.56, 1.43, 0.44, 0.43, 0.71, 0.99, 2.45, 1.58, -0.11, 0.84, 0.53, 2.55, 2.68, 1.21, 1.91, 1.18, 1.38, 0.18, 0.7, 0.63, 0.81, 8.4, 0.94, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/iU0CuPH7akM_filtered.json b/annotations_filtered/iU0CuPH7akM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2c5c00ca5eee0718cfbe9ced0c82db084c41348 --- /dev/null +++ b/annotations_filtered/iU0CuPH7akM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.96], [13.0, 13.51], [16.0, 17.07], [25.0, 27.65], [31.0, 31.18], [36.0, 36.41], [38.0, 38.65], [43.0, 44.07], [45.0, 45.94], [49.0, 51.04], [54.0, 55.41], [60.0, 59.97], [62.0, 65.91], [70.0, 70.48], [72.0, 71.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 62.78, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 0.0, 0.0, 32.27, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 27.49], ["busy signal", 14.91], ["quack", 6.19]], null, null], "duration": [-0.04, 0.51, 1.07, 2.65, 0.18, 0.41, 0.65, 1.07, 0.94, 2.04, 1.41, -0.03, 3.91, 0.48, -0.04]} \ No newline at end of file diff --git a/annotations_filtered/iVoG7CivnH0_filtered.json b/annotations_filtered/iVoG7CivnH0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d310946d5d5d19ac9f349b49f3b03708030ce9db --- /dev/null +++ b/annotations_filtered/iVoG7CivnH0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.51], [7.0, 7.08], [12.0, 16.6], [17.0, 19.68], [22.0, 23.3], [26.0, 26.43], [27.0, 31.53], [32.0, 34.21], [35.0, 39.26], [40.0, 42.31], [44.0, 43.77], [45.0, 47.66], [49.0, 50.73], [52.0, 52.27], [58.0, 58.29], [59.0, 60.79], [61.0, 63.27], [65.0, 65.67], [72.0, 76.0], [78.0, 78.73]], "keep_status": [true, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false], "silence_prob": [40.19, 0.0, 48.23, 43.15, 0.0, 0.0, 48.44, 36.68, 60.89, 40.79, 0.0, 62.17, 0.0, 0.0, 0.0, 0.0, 45.72, 0.0, 43.03, 0.0], "audiomae_on_audioset": [[["mains hum", 14.86], ["fly, housefly", 13.39], ["whale vocalization", 9.52]], null, [["fly, housefly", 18.41], ["bee, wasp, etc.", 15.37], ["hum", 14.43]], [["hum", 51.71], ["mains hum", 21.75], ["throbbing", 8.34]], null, null, [["mains hum", 44.57], ["hum", 18.7], ["music", 7.31]], [["hum", 48.58], ["throbbing", 12.95], ["stomach rumble", 11.85]], null, [["moo", 25.13], ["cattle, bovinae", 23.21], ["speech", 15.06]], null, null, null, null, null, null, [["music", 23.77], ["hum", 18.94], ["speech", 15.6]], null, [["throbbing", 24.04], ["hum", 13.15], ["fart", 10.85]], null], "duration": [3.51, 0.08, 4.6, 2.68, 1.3, 0.43, 4.53, 2.21, 4.26, 2.31, -0.23, 2.66, 1.73, 0.27, 0.29, 1.79, 2.27, 0.67, 4.0, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/iVsfWht3zmo_filtered.json b/annotations_filtered/iVsfWht3zmo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b01bc4fa5d9cb3a904f498d9a18670852a5836c --- /dev/null +++ b/annotations_filtered/iVsfWht3zmo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.31], [15.0, 17.47], [18.0, 22.22], [25.0, 47.95], [60.0, 60.35], [62.0, 62.18], [75.0, 106.35]], "keep_status": [true, false, true, true, false, false, false], "silence_prob": [39.37, 32.46, 32.33, 29.68, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 50.64], ["didgeridoo", 8.98], ["speech", 6.97]], [["music", 57.67], ["didgeridoo", 13.05], ["musical instrument", 2.58]], [["music", 54.45], ["didgeridoo", 8.86], ["noise", 5.4]], [["music", 25.74], ["hum", 23.14], ["mains hum", 18.55]], null, null, null], "duration": [7.31, 2.47, 4.22, 22.95, 0.35, 0.18, 31.35]} \ No newline at end of file diff --git a/annotations_filtered/iWGL8PRdM7E_filtered.json b/annotations_filtered/iWGL8PRdM7E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d16047bb14711a98ff87e9fb20ab4a7025578eb6 --- /dev/null +++ b/annotations_filtered/iWGL8PRdM7E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 44.81], [46.0, 49.76], [51.0, 76.33]], "keep_status": [false, false, false], "silence_prob": [0.0, 32.58, 63.31], "audiomae_on_audioset": [null, [["music", 48.59], ["gong", 19.74], ["musical instrument", 5.13]], null], "duration": [31.81, 3.76, 25.33]} \ No newline at end of file diff --git a/annotations_filtered/iWJTDTs9ymk_filtered.json b/annotations_filtered/iWJTDTs9ymk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7105a2ed57d6b0fa5b4df751e2af0f3c1b2227fa --- /dev/null +++ b/annotations_filtered/iWJTDTs9ymk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.09], [10.0, 10.35], [23.0, 23.38], [24.0, 25.47], [27.0, 27.16], [28.0, 29.79], [33.0, 32.95], [34.0, 35.02], [50.0, 50.33], [52.0, 52.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.09, 0.35, 0.38, 1.47, 0.16, 1.79, -0.05, 1.02, 0.33, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/iWW0Tk58kXM_filtered.json b/annotations_filtered/iWW0Tk58kXM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f080d224f59faadc7d6e1867add86cbd7815e515 --- /dev/null +++ b/annotations_filtered/iWW0Tk58kXM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 59.09], [62.0, 64.72], [66.0, 66.58], [68.0, 78.73], [81.0, 86.22], [92.0, 95.32], [97.0, 97.83]], "keep_status": [false, false, false, true, false, false, false], "silence_prob": [0.0, 38.1, 0.0, 33.71, 33.35, 34.21, 0.0], "audiomae_on_audioset": [null, [["music", 50.96], ["alarm clock", 12.19], ["synthesizer", 7.27]], null, [["music", 37.67], ["speech", 17.69], ["theremin", 11.69]], [["music", 84.09], ["speech", 1.77], ["electronic music", 1.51]], [["music", 51.81], ["speech", 12.93], ["throbbing", 9.79]], null], "duration": [32.09, 2.72, 0.58, 10.73, 5.22, 3.32, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/iX-nnY0x-SE_filtered.json b/annotations_filtered/iX-nnY0x-SE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42cfd41bd4c0f89d17324ce9818007c27342150e --- /dev/null +++ b/annotations_filtered/iX-nnY0x-SE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.86], [9.0, 10.54], [12.0, 12.04], [13.0, 14.55], [16.0, 17.74], [19.0, 19.67], [24.0, 24.24], [25.0, 26.0], [27.0, 27.78], [29.0, 30.33], [54.0, 54.31], [57.0, 57.15], [67.0, 67.49], [69.0, 69.4], [71.0, 72.71], [85.0, 85.02], [91.0, 91.59], [93.0, 93.58], [95.0, 95.4], [96.0, 96.58], [99.0, 98.88], [106.0, 106.42], [108.0, 108.57], [119.0, 120.43], [131.0, 131.87], [133.0, 133.68], [137.0, 139.04], [144.0, 145.52], [147.0, 147.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.79, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 22.56], ["speech", 14.78], ["didgeridoo", 7.02]], null, null], "duration": [0.86, 1.54, 0.04, 1.55, 1.74, 0.67, 0.24, 1.0, 0.78, 1.33, 0.31, 0.15, 0.49, 0.4, 1.71, 0.02, 0.59, 0.58, 0.4, 0.58, -0.12, 0.42, 0.57, 1.43, 0.87, 0.68, 2.04, 1.52, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/iX1ha-hADlU_filtered.json b/annotations_filtered/iX1ha-hADlU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7629fde919664e106be090472cda12516e40442 --- /dev/null +++ b/annotations_filtered/iX1ha-hADlU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.91], [6.0, 6.89], [9.0, 10.23], [13.0, 13.05], [14.0, 15.82], [17.0, 18.86], [21.0, 21.74], [25.0, 25.32], [26.0, 26.92], [31.0, 37.35], [39.0, 42.58], [47.0, 47.66], [49.0, 50.33], [52.0, 54.18], [55.0, 55.31], [56.0, 56.54], [60.0, 62.16], [63.0, 65.82], [73.0, 73.43], [82.0, 83.78], [87.0, 88.64], [90.0, 92.26], [96.0, 96.6], [98.0, 98.61], [102.0, 103.03], [110.0, 110.74], [115.0, 117.9], [122.0, 123.35], [125.0, 127.35], [129.0, 130.76], [133.0, 133.03], [136.0, 136.43], [137.0, 139.83], [142.0, 142.45], [145.0, 147.19], [149.0, 149.25], [150.0, 151.66], [152.0, 152.91], [154.0, 154.45], [155.0, 157.28], [159.0, 160.71], [161.0, 162.95], [165.0, 167.07], [169.0, 169.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.52, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 99.96, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 99.97, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.09, 0.89, 1.23, 0.05, 1.82, 1.86, 0.74, 0.32, 0.92, 6.35, 3.58, 0.66, 1.33, 2.18, 0.31, 0.54, 2.16, 2.82, 0.43, 1.78, 1.64, 2.26, 0.6, 0.61, 1.03, 0.74, 2.9, 1.35, 2.35, 1.76, 0.03, 0.43, 2.83, 0.45, 2.19, 0.25, 1.66, 0.91, 0.45, 2.28, 1.71, 1.95, 2.07, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/iX23r272kqg_filtered.json b/annotations_filtered/iX23r272kqg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a244f51a88be8968c7351f2c2fb08a1cd9bf1249 --- /dev/null +++ b/annotations_filtered/iX23r272kqg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.94], [7.0, 8.8], [12.0, 17.54], [19.0, 21.03], [23.0, 22.91], [25.0, 27.55], [29.0, 33.42], [35.0, 40.8], [42.0, 42.65], [43.0, 50.35], [52.0, 52.49], [53.0, 53.84], [58.0, 58.09], [60.0, 61.82], [64.0, 67.05], [70.0, 79.19], [80.0, 83.52], [84.0, 90.91]], "keep_status": [false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 46.75, 62.47, 0.0, 41.1, 51.66, 44.34, 0.0, 60.7, 0.0, 0.0, 0.0, 0.0, 34.59, 35.63, 34.16, 32.38], "audiomae_on_audioset": [null, null, [["music", 40.17], ["didgeridoo", 14.58], ["synthesizer", 4.41]], null, null, [["music", 22.09], ["moo", 17.47], ["cattle, bovinae", 14.17]], null, [["music", 53.26], ["guitar", 10.29], ["musical instrument", 8.34]], null, null, null, null, null, null, [["trombone", 31.21], ["brass instrument", 28.59], ["music", 25.89]], [["music", 56.03], ["musical instrument", 7.64], ["drum", 3.85]], [["music", 49.6], ["harmonic", 3.56], ["vibraphone", 2.44]], [["music", 68.61], ["musical instrument", 6.89], ["bass guitar", 6.48]]], "duration": [0.94, 1.8, 5.54, 2.03, -0.09, 2.55, 4.42, 5.8, 0.65, 7.35, 0.49, 0.84, 0.09, 1.82, 3.05, 9.19, 3.52, 6.91]} \ No newline at end of file diff --git a/annotations_filtered/iXSKAf6h5vE_filtered.json b/annotations_filtered/iXSKAf6h5vE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a71ca109f95d6afe65d22c5f4675aab0b9dd66a --- /dev/null +++ b/annotations_filtered/iXSKAf6h5vE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 43.09], [47.0, 85.83], [87.0, 131.35]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [1.09, 38.83, 44.35]} \ No newline at end of file diff --git a/annotations_filtered/iXfhOj2PobA_filtered.json b/annotations_filtered/iXfhOj2PobA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea39a863ba8011f88b195529e6f9534f73c6ea06 --- /dev/null +++ b/annotations_filtered/iXfhOj2PobA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 72.93], [77.0, 77.14], [78.0, 82.29], [84.0, 90.71], [96.0, 111.27], [115.0, 115.86], [117.0, 125.83], [127.0, 127.18], [134.0, 136.46], [138.0, 139.45], [141.0, 144.1], [148.0, 152.9], [161.0, 161.99], [163.0, 164.05], [167.0, 168.72], [171.0, 171.81]], "keep_status": [false, false, true, false, true, false, true, false, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 29.61, 30.65, 30.61, 0.0, 30.26, 0.0, 30.4, 0.0, 32.56, 30.33, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 24.24], ["music", 15.27], ["buzz", 12.36]], [["music", 64.04], ["throbbing", 4.15], ["electronic music", 2.39]], [["music", 32.36], ["speech", 23.95], ["hum", 11.29]], null, [["music", 21.03], ["speech", 13.03], ["vehicle", 9.12]], null, [["music", 28.24], ["vehicle", 8.72], ["hum", 5.83]], null, [["speech", 27.65], ["music", 15.56], ["hum", 13.8]], [["buzz", 17.37], ["vehicle", 11.23], ["music", 8.94]], null, null, null, null], "duration": [33.93, 0.14, 4.29, 6.71, 15.27, 0.86, 8.83, 0.18, 2.46, 1.45, 3.1, 4.9, 0.99, 1.05, 1.72, 0.81]} \ No newline at end of file diff --git a/annotations_filtered/iXo8qxLvcSs_filtered.json b/annotations_filtered/iXo8qxLvcSs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13d8305ccec3e5dbb5e103e98cfdf22852a00b67 --- /dev/null +++ b/annotations_filtered/iXo8qxLvcSs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 39.58], [41.0, 40.93], [42.0, 43.5], [44.0, 44.85], [49.0, 49.91], [51.0, 51.11], [53.0, 54.08], [54.0, 61.94], [63.0, 65.5], [67.0, 70.55], [71.0, 75.93], [77.0, 81.28], [82.0, 83.88], [85.0, 132.53], [137.0, 155.78], [158.0, 167.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.99, 89.9, 99.99, 97.64, 99.95, 0.0, 0.0, 30.76, 30.79], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 39.26], ["buzz", 15.14], ["throbbing", 7.55]], [["speech", 52.48], ["radio", 5.47], ["electric shaver, electric razor", 4.93]]], "duration": [0.58, -0.07, 1.5, 0.85, 0.91, 0.11, 1.08, 7.94, 2.5, 3.55, 4.93, 4.28, 1.88, 47.53, 18.78, 9.64]} \ No newline at end of file diff --git a/annotations_filtered/iY2xD9VKDiE_filtered.json b/annotations_filtered/iY2xD9VKDiE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c72092172543866674146b395703b7f40d26eda0 --- /dev/null +++ b/annotations_filtered/iY2xD9VKDiE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 43.73], [49.0, 102.27], [102.0, 102.44], [109.0, 109.92], [110.0, 135.28]], "keep_status": [false, false, false, false, false], "silence_prob": [36.68, 0.0, 0.0, 0.0, 28.76], "audiomae_on_audioset": [[["music", 51.12], ["didgeridoo", 13.13], ["speech", 10.38]], null, null, null, [["mains hum", 29.3], ["hum", 24.59], ["music", 18.82]]], "duration": [2.73, 53.27, 0.44, 0.92, 25.28]} \ No newline at end of file diff --git a/annotations_filtered/iY5fvk3H2Js_filtered.json b/annotations_filtered/iY5fvk3H2Js_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97507587009e025c2f0ec6063a250655a206de63 --- /dev/null +++ b/annotations_filtered/iY5fvk3H2Js_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.21], [5.0, 23.68], [24.0, 24.66], [26.0, 26.2], [27.0, 27.68], [29.0, 29.2], [30.0, 31.19], [34.0, 35.4], [38.0, 38.62], [43.0, 43.24], [45.0, 46.13], [48.0, 49.0], [61.0, 64.64], [70.0, 70.44], [72.0, 73.3], [75.0, 75.14], [77.0, 79.68], [82.0, 82.71], [84.0, 84.5], [97.0, 101.24], [102.0, 102.88], [103.0, 118.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.63, 0.0, 0.0, 0.0, 38.58, 0.0, 0.0, 37.22, 0.0, 35.54], "audiomae_on_audioset": [null, [["music", 61.31], ["hum", 6.56], ["speech", 4.01]], null, null, null, null, null, null, null, null, null, null, [["music", 42.27], ["speech", 8.03], ["sonar", 4.43]], null, null, null, [["throbbing", 41.93], ["music", 31.69], ["hum", 5.18]], null, null, [["music", 50.8], ["throbbing", 15.11], ["speech", 8.78]], null, [["music", 53.75], ["insect", 10.21], ["fly, housefly", 10.08]]], "duration": [1.21, 18.68, 0.66, 0.2, 0.68, 0.2, 1.19, 1.4, 0.62, 0.24, 1.13, 1.0, 3.64, 0.44, 1.3, 0.14, 2.68, 0.71, 0.5, 4.24, 0.88, 15.57]} \ No newline at end of file diff --git a/annotations_filtered/iY68ovrzfXc_filtered.json b/annotations_filtered/iY68ovrzfXc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd77e6f5e49235f0aeb6698a9c6e4d00e64f7bdc --- /dev/null +++ b/annotations_filtered/iY68ovrzfXc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.4], [8.0, 10.56], [12.0, 12.56], [14.0, 15.55], [18.0, 19.67], [25.0, 26.22], [28.0, 28.21], [31.0, 31.67], [35.0, 36.53], [40.0, 42.2], [43.0, 44.74], [53.0, 54.63], [56.0, 56.71], [57.0, 57.92], [62.0, 64.13], [65.0, 70.7], [80.0, 87.54], [89.0, 95.88], [97.0, 97.5], [99.0, 99.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 52.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 77.2, 54.36, 55.96, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.4, 2.56, 0.56, 1.55, 1.67, 1.22, 0.21, 0.67, 1.53, 2.2, 1.74, 1.63, 0.71, 0.92, 2.13, 5.7, 7.54, 6.88, 0.5, 0.2]} \ No newline at end of file diff --git a/annotations_filtered/iYG8WCULpNM_filtered.json b/annotations_filtered/iYG8WCULpNM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87818fce1bbf8d7285932ada1b1bcd8d1b651218 --- /dev/null +++ b/annotations_filtered/iYG8WCULpNM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.07], [8.0, 9.49], [11.0, 12.06], [14.0, 14.81], [16.0, 19.09], [20.0, 21.47], [22.0, 24.02], [30.0, 30.37], [34.0, 34.15], [36.0, 45.81], [47.0, 50.14], [51.0, 62.63], [64.0, 66.39], [67.0, 68.82], [70.0, 70.38], [71.0, 72.35], [73.0, 73.16], [73.0, 74.97], [78.0, 79.73], [81.0, 81.46], [87.0, 88.38], [91.0, 92.42], [94.0, 95.0], [96.0, 98.76], [104.0, 107.1], [111.0, 113.19], [114.0, 115.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 45.62, 0.0, 40.61, 0.0, 0.0, 32.77, 45.92, 46.86, 50.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.68, 36.17, 35.84, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 71.55], ["musical instrument", 4.06], ["guitar", 3.95]], null, [["music", 39.78], ["didgeridoo", 24.75], ["speech", 11.19]], null, null, [["music", 85.3], ["electronic music", 1.55], ["musical instrument", 1.47]], [["coin (dropping)", 32.55], ["thunk", 19.04], ["music", 8.54]], [["speech", 54.04], ["doorbell", 18.07], ["music", 12.23]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 33.29], ["chirp tone", 13.53], ["sidetone", 13.22]], [["music", 67.35], ["synthesizer", 8.16], ["drum machine", 4.85]], [["music", 53.07], ["synthesizer", 20.07], ["musical instrument", 4.44]], null], "duration": [1.07, 1.49, 1.06, 0.81, 3.09, 1.47, 2.02, 0.37, 0.15, 9.81, 3.14, 11.63, 2.39, 1.82, 0.38, 1.35, 0.16, 1.97, 1.73, 0.46, 1.38, 1.42, 1.0, 2.76, 3.1, 2.19, 1.89]} \ No newline at end of file diff --git a/annotations_filtered/iYP5-Dl3rhg_filtered.json b/annotations_filtered/iYP5-Dl3rhg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3e5e204e70956d3eff1ba620266674d0aa223f9 --- /dev/null +++ b/annotations_filtered/iYP5-Dl3rhg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 35.04], [40.0, 40.85], [44.0, 45.32], [54.0, 54.78], [57.0, 61.25], [62.0, 64.56], [68.0, 70.87], [75.0, 75.84], [77.0, 78.87], [80.0, 80.5], [82.0, 82.21], [83.0, 83.69], [86.0, 86.93], [90.0, 90.09], [91.0, 91.62], [92.0, 92.97], [95.0, 96.31], [97.0, 98.15], [100.0, 101.06], [102.0, 102.56], [104.0, 104.38], [105.0, 105.71], [108.0, 108.97], [110.0, 110.66], [111.0, 111.82], [114.0, 113.9], [117.0, 118.34], [119.0, 119.7], [123.0, 123.31], [124.0, 124.56], [127.0, 128.09], [129.0, 131.6], [133.0, 137.74], [138.0, 141.67], [142.0, 141.96], [142.0, 142.94], [150.0, 151.34], [155.0, 155.55], [161.0, 165.2], [169.0, 172.61], [173.0, 179.47]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.63, 31.95, 62.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.38, 37.84, 33.12, 0.0, 0.0, 0.0, 0.0, 33.67, 34.56, 34.49], "audiomae_on_audioset": [null, null, null, null, [["music", 31.12], ["applause", 21.44], ["crowd", 9.9]], [["speech", 33.51], ["applause", 7.24], ["cacophony", 5.93]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 51.34], ["radio", 21.0], ["sidetone", 1.99]], [["speech", 22.75], ["mains hum", 17.63], ["hum", 12.32]], null, null, null, null, [["bee, wasp, etc.", 31.76], ["fly, housefly", 17.82], ["insect", 13.25]], [["speech", 51.01], ["radio", 17.53], ["fly, housefly", 5.13]], [["music", 34.07], ["sidetone", 10.4], ["radio", 9.39]]], "duration": [1.04, 0.85, 1.32, 0.78, 4.25, 2.56, 2.87, 0.84, 1.87, 0.5, 0.21, 0.69, 0.93, 0.09, 0.62, 0.97, 1.31, 1.15, 1.06, 0.56, 0.38, 0.71, 0.97, 0.66, 0.82, -0.1, 1.34, 0.7, 0.31, 0.56, 1.09, 2.6, 4.74, 3.67, -0.04, 0.94, 1.34, 0.55, 4.2, 3.61, 6.47]} \ No newline at end of file diff --git a/annotations_filtered/iYU7ltkHYXM_filtered.json b/annotations_filtered/iYU7ltkHYXM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81925d667bfa70d1dfee5d3628d474951cf210c3 --- /dev/null +++ b/annotations_filtered/iYU7ltkHYXM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.1], [4.0, 6.93], [8.0, 8.4], [9.0, 10.1], [11.0, 13.66], [17.0, 17.71], [20.0, 20.29], [21.0, 21.63], [24.0, 27.28], [28.0, 32.73], [33.0, 37.32], [38.0, 49.49], [51.0, 53.6], [55.0, 55.27], [56.0, 62.23], [66.0, 66.78], [69.0, 71.17], [73.0, 74.36], [81.0, 81.82], [88.0, 89.31], [91.0, 91.72], [92.0, 92.7], [95.0, 100.4], [101.0, 102.57], [103.0, 104.48], [107.0, 112.77], [114.0, 113.97]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 62.07, 0.0, 0.0, 77.7, 0.0, 0.0, 0.0, 60.6, 42.67, 37.52, 32.89, 48.27, 0.0, 52.62, 0.0, 46.64, 0.0, 0.0, 0.0, 0.0, 0.0, 48.19, 0.0, 0.0, 38.26, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["hum", 26.2], ["mains hum", 13.6], ["theremin", 11.93]], [["music", 56.82], ["theremin", 13.14], ["musical instrument", 6.32]], [["music", 37.82], ["brass instrument", 20.38], ["musical instrument", 8.65]], [["music", 25.28], ["speech", 13.55], ["mains hum", 9.99]], null, null, null, [["music", 33.18], ["speech", 13.45], ["musical instrument", 6.34]], null, null, null, null, null, [["music", 50.3], ["hum", 6.49], ["ambient music", 4.76]], null, null, [["music", 46.12], ["didgeridoo", 37.26], ["musical instrument", 3.14]], null], "duration": [1.1, 2.93, 0.4, 1.1, 2.66, 0.71, 0.29, 0.63, 3.28, 4.73, 4.32, 11.49, 2.6, 0.27, 6.23, 0.78, 2.17, 1.36, 0.82, 1.31, 0.72, 0.7, 5.4, 1.57, 1.48, 5.77, -0.03]} \ No newline at end of file diff --git a/annotations_filtered/iYetsX9JdIU_filtered.json b/annotations_filtered/iYetsX9JdIU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b87730823fd1206754575d7adba521481a8e05f --- /dev/null +++ b/annotations_filtered/iYetsX9JdIU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.04], [10.0, 10.52], [16.0, 16.68], [20.0, 20.9], [23.0, 24.04], [28.0, 28.61], [30.0, 30.65], [32.0, 33.67], [36.0, 37.59], [48.0, 48.79], [53.0, 53.89], [56.0, 57.82], [58.0, 58.99], [59.0, 59.8], [61.0, 61.96], [75.0, 75.05], [76.0, 76.11], [77.0, 77.73], [81.0, 81.24], [82.0, 82.81], [83.0, 85.9], [91.0, 91.54], [98.0, 98.27], [99.0, 99.33], [103.0, 105.0], [112.0, 114.69], [117.0, 118.25], [120.0, 120.46], [126.0, 126.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 53.47, 37.47, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 57.56], ["synthesizer", 8.66], ["musical instrument", 6.68]], null, null, null], "duration": [1.04, 0.52, 0.68, 0.9, 1.04, 0.61, 0.65, 1.67, 1.59, 0.79, 0.89, 1.82, 0.99, 0.8, 0.96, 0.05, 0.11, 0.73, 0.24, 0.81, 2.9, 0.54, 0.27, 0.33, 2.0, 2.69, 1.25, 0.46, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/iYsOzr1hPl8_filtered.json b/annotations_filtered/iYsOzr1hPl8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a552163224a666e5c92354205c04bb10a4ce111b --- /dev/null +++ b/annotations_filtered/iYsOzr1hPl8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.53], [14.0, 14.32], [17.0, 39.14], [40.0, 44.36], [45.0, 48.49], [49.0, 58.78], [59.0, 67.14], [68.0, 69.09], [69.0, 69.74], [79.0, 84.15], [84.0, 84.42], [85.0, 87.76], [89.0, 98.56], [102.0, 102.81]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 43.0, 99.95, 78.38, 99.98, 98.59, 0.0, 0.0, 100.0, 0.0, 99.59, 100.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 23.6], ["music", 10.16], ["mains hum", 9.44]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 0.32, 22.14, 4.36, 3.49, 9.78, 8.14, 1.09, 0.74, 5.15, 0.42, 2.76, 9.56, 0.81]} \ No newline at end of file diff --git a/annotations_filtered/iZx1W6cHw-g_filtered.json b/annotations_filtered/iZx1W6cHw-g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d8d2299cb999daf0067e580071a7880c8db2a25 --- /dev/null +++ b/annotations_filtered/iZx1W6cHw-g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.53], [6.0, 6.94], [50.0, 50.18], [69.0, 69.57], [70.0, 71.19], [72.0, 72.94], [92.0, 92.04], [95.0, 95.47], [101.0, 103.08], [104.0, 105.31], [111.0, 111.99], [114.0, 116.95], [118.0, 117.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [99.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.34, 0.0, 0.0, 40.47, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["animal", 23.22], ["frog", 20.06], ["speech", 5.46]], null], "duration": [2.53, 0.94, 0.18, 0.57, 1.19, 0.94, 0.04, 0.47, 2.08, 1.31, 0.99, 2.95, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/i_9C6d3VVHM_filtered.json b/annotations_filtered/i_9C6d3VVHM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12dde76a8e8d65ef14c7ce9647534b83bd262078 --- /dev/null +++ b/annotations_filtered/i_9C6d3VVHM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.83], [6.0, 6.22], [8.0, 9.78], [10.0, 10.96], [15.0, 16.28], [20.0, 22.42], [23.0, 24.78], [27.0, 28.39], [39.0, 38.91], [40.0, 40.34], [48.0, 50.33], [54.0, 54.46], [62.0, 63.78], [65.0, 64.64], [66.0, 65.77], [69.0, 70.14], [71.0, 78.49], [81.0, 89.53], [91.0, 91.25], [93.0, 92.89], [96.0, 96.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 54.9, 0.0, 0.0, 0.0, 0.0, 55.96, 0.0, 0.0, 0.0, 0.0, 0.0, 34.75, 53.65, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 54.08], ["sidetone", 15.9], ["noise", 4.51]], null, null, null, null], "duration": [-0.17, 0.22, 1.78, 0.96, 1.28, 2.42, 1.78, 1.39, -0.09, 0.34, 2.33, 0.46, 1.78, -0.36, -0.23, 1.14, 7.49, 8.53, 0.25, -0.11, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/i_9mM4F_JVI_filtered.json b/annotations_filtered/i_9mM4F_JVI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5664806c3b05c20f97f8469293a69335d377ecec --- /dev/null +++ b/annotations_filtered/i_9mM4F_JVI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.93], [14.0, 14.1], [14.0, 14.93], [22.0, 30.59], [35.0, 35.92], [39.0, 39.66], [45.0, 55.53], [56.0, 58.26], [61.0, 81.45], [84.0, 85.5], [86.0, 87.45], [89.0, 90.21], [91.0, 93.43], [95.0, 104.13], [106.0, 106.68], [108.0, 109.31]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [45.24, 0.0, 0.0, 35.89, 0.0, 0.0, 31.82, 34.19, 30.47, 0.0, 0.0, 0.0, 43.64, 39.37, 0.0, 0.0], "audiomae_on_audioset": [[["fly, housefly", 19.66], ["insect", 14.99], ["speech", 12.41]], null, null, [["speech", 88.04], ["radio", 2.1], ["animal", 1.38]], null, null, [["speech", 92.83], ["applause", 2.7], ["animal", 0.64]], [["speech", 26.81], ["clapping", 11.85], ["applause", 7.15]], [["speech", 56.03], ["vehicle", 7.94], ["boat, water vehicle", 6.66]], null, null, null, [["music", 35.34], ["speech", 28.22], ["sheep", 7.2]], [["speech", 20.81], ["music", 17.31], ["hum", 14.72]], null, null], "duration": [2.93, 0.1, 0.93, 8.59, 0.92, 0.66, 10.53, 2.26, 20.45, 1.5, 1.45, 1.21, 2.43, 9.13, 0.68, 1.31]} \ No newline at end of file diff --git a/annotations_filtered/i_Rupd9NU4E_filtered.json b/annotations_filtered/i_Rupd9NU4E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3602f2702df65413fd7d89a0cb90a101d43969c4 --- /dev/null +++ b/annotations_filtered/i_Rupd9NU4E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.75], [11.0, 11.65], [20.0, 20.41], [26.0, 26.1], [33.0, 33.37], [34.0, 34.38], [36.0, 37.52], [39.0, 40.15], [45.0, 46.35], [47.0, 47.38], [48.0, 49.11], [72.0, 72.05], [73.0, 73.31], [75.0, 75.52], [76.0, 76.92], [80.0, 80.2], [82.0, 82.63], [86.0, 88.26], [92.0, 92.79], [101.0, 103.94], [111.0, 116.7], [118.0, 118.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.46, 0.0, 37.35, 29.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 61.14], ["throbbing", 9.53], ["hum", 5.42]], [["music", 36.49], ["speech", 17.75], ["vehicle", 7.78]], null], "duration": [0.75, 0.65, 0.41, 0.1, 0.37, 0.38, 1.52, 1.15, 1.35, 0.38, 1.11, 0.05, 0.31, 0.52, 0.92, 0.2, 0.63, 2.26, 0.79, 2.94, 5.7, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/i_SnR25Zoho_filtered.json b/annotations_filtered/i_SnR25Zoho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6974ccc113d40255881fc240010a9edfff77d48 --- /dev/null +++ b/annotations_filtered/i_SnR25Zoho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 3.28], [4.0, 8.02], [9.0, 12.5], [15.0, 16.9], [19.0, 21.2], [22.0, 23.7], [25.0, 25.56], [27.0, 27.26], [29.0, 30.42], [32.0, 32.29], [36.0, 36.51], [39.0, 40.42], [41.0, 45.17], [46.0, 48.34], [50.0, 50.82], [52.0, 53.82], [56.0, 56.46], [57.0, 58.56], [63.0, 63.68], [65.0, 65.79], [69.0, 69.11], [71.0, 72.98], [86.0, 88.25], [105.0, 105.53], [108.0, 109.14], [111.0, 110.98], [113.0, 113.21], [114.0, 115.43], [120.0, 120.6], [121.0, 121.78], [123.0, 122.89], [124.0, 124.44], [126.0, 128.87], [132.0, 132.02], [134.0, 134.4], [135.0, 135.92], [137.0, 137.07], [138.0, 138.23], [140.0, 139.87], [140.0, 141.22], [143.0, 143.19], [144.0, 145.27], [149.0, 149.13], [151.0, 151.53], [161.0, 162.89], [164.0, 164.17], [165.0, 169.16], [176.0, 176.18], [181.0, 180.67], [188.0, 188.28], [191.0, 191.02], [192.0, 193.62], [199.0, 200.69], [201.0, 201.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [80.11, 75.07, 99.98, 0.0, 86.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 90.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 23.65], ["throbbing", 20.9], ["music", 15.4]], null, null, null, null, null, null, null], "duration": [3.28, 4.02, 3.5, 1.9, 2.2, 1.7, 0.56, 0.26, 1.42, 0.29, 0.51, 1.42, 4.17, 2.34, 0.82, 1.82, 0.46, 1.56, 0.68, 0.79, 0.11, 1.98, 2.25, 0.53, 1.14, -0.02, 0.21, 1.43, 0.6, 0.78, -0.11, 0.44, 2.87, 0.02, 0.4, 0.92, 0.07, 0.23, -0.13, 1.22, 0.19, 1.27, 0.13, 0.53, 1.89, 0.17, 4.16, 0.18, -0.33, 0.28, 0.02, 1.62, 1.69, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/i_Y5UB3xxW8_filtered.json b/annotations_filtered/i_Y5UB3xxW8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e01650aa7a6fec44b2bf744c467fd9da326d8ed --- /dev/null +++ b/annotations_filtered/i_Y5UB3xxW8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.69], [14.0, 14.35], [17.0, 18.91], [20.0, 26.86], [27.0, 27.67], [29.0, 48.02], [49.0, 49.87], [55.0, 56.07], [58.0, 59.7], [60.0, 62.51], [64.0, 64.27], [65.0, 65.92], [66.0, 66.39], [66.0, 78.17], [88.0, 88.4], [90.0, 89.92], [93.0, 93.8], [105.0, 105.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [66.15, 0.0, 0.0, 97.43, 0.0, 99.98, 0.0, 0.0, 0.0, 83.52, 0.0, 0.0, 0.0, 37.97, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 46.36], ["music", 11.47], ["sidetone", 11.43]], null, null, null, null], "duration": [3.69, 0.35, 1.91, 6.86, 0.67, 19.02, 0.87, 1.07, 1.7, 2.51, 0.27, 0.92, 0.39, 12.17, 0.4, -0.08, 0.8, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/i_qI6LOc54w_filtered.json b/annotations_filtered/i_qI6LOc54w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3848fa003b1ba49e8f8ca24f99862a44acb0041b --- /dev/null +++ b/annotations_filtered/i_qI6LOc54w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.42], [12.0, 14.91], [18.0, 25.44], [29.0, 33.2], [34.0, 64.3], [66.0, 67.17], [77.0, 81.73], [83.0, 82.71], [88.0, 90.32], [93.0, 95.62], [96.0, 97.12], [101.0, 101.38], [107.0, 108.11], [109.0, 118.71], [124.0, 123.92], [130.0, 130.59], [163.0, 163.59], [173.0, 172.77], [175.0, 175.64], [179.0, 180.15], [185.0, 200.94]], "keep_status": [true, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [40.99, 33.99, 36.25, 35.15, 0.0, 0.0, 49.97, 0.0, 61.37, 49.54, 0.0, 0.0, 0.0, 40.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.78], "audiomae_on_audioset": [[["music", 42.69], ["throbbing", 13.71], ["synthesizer", 11.92]], [["music", 68.49], ["throbbing", 3.37], ["hum", 2.14]], [["music", 85.61], ["musical instrument", 1.57], ["electronic music", 1.57]], [["music", 48.3], ["didgeridoo", 13.35], ["musical instrument", 2.49]], null, null, [["speech", 59.88], ["hum", 4.52], ["rowboat, canoe, kayak", 3.66]], null, null, [["speech", 30.71], ["sidetone", 24.64], ["music", 23.55]], null, null, null, [["throbbing", 34.91], ["hum", 29.36], ["music", 23.33]], null, null, null, null, null, null, [["boing", 33.05], ["music", 18.53], ["speech", 6.68]]], "duration": [7.42, 2.91, 7.44, 4.2, 30.3, 1.17, 4.73, -0.29, 2.32, 2.62, 1.12, 0.38, 1.11, 9.71, -0.08, 0.59, 0.59, -0.23, 0.64, 1.15, 15.94]} \ No newline at end of file diff --git a/annotations_filtered/i_rch_cy7dM_filtered.json b/annotations_filtered/i_rch_cy7dM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5533c8939b71ec263bba04a9272cf2a3d81ce275 --- /dev/null +++ b/annotations_filtered/i_rch_cy7dM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.75], [20.0, 21.47], [24.0, 25.1], [31.0, 31.48], [33.0, 39.56], [41.0, 43.92], [44.0, 44.79], [46.0, 53.25], [54.0, 58.82], [61.0, 81.8], [83.0, 84.64], [86.0, 95.4], [96.0, 96.89], [98.0, 98.31], [99.0, 113.58]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 89.72, 80.46, 0.0, 40.9, 38.5, 40.26, 0.0, 39.91, 0.0, 0.0, 34.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 73.03], ["brass instrument", 6.84], ["foghorn", 4.37]], [["music", 61.42], ["musical instrument", 6.73], ["brass instrument", 6.11]], [["music", 41.54], ["brass instrument", 19.92], ["trombone", 8.33]], null, [["music", 75.44], ["theremin", 6.47], ["didgeridoo", 4.28]], null, null, [["music", 56.1], ["brass instrument", 13.38], ["trombone", 7.08]]], "duration": [0.75, 1.47, 1.1, 0.48, 6.56, 2.92, 0.79, 7.25, 4.82, 20.8, 1.64, 9.4, 0.89, 0.31, 14.58]} \ No newline at end of file diff --git a/annotations_filtered/i_uA0oZ3xnI_filtered.json b/annotations_filtered/i_uA0oZ3xnI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/i_uA0oZ3xnI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/i_zdyGw0tEo_filtered.json b/annotations_filtered/i_zdyGw0tEo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab073231207cb84f2df1730e87a97948bf1ca62a --- /dev/null +++ b/annotations_filtered/i_zdyGw0tEo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 19.03], [21.0, 30.16], [31.0, 42.3], [45.0, 44.58], [46.0, 47.04], [50.0, 50.55], [52.0, 52.56], [53.0, 52.86], [56.0, 57.1], [64.0, 64.84], [71.0, 80.22], [84.0, 84.37], [85.0, 86.91], [90.0, 90.78], [96.0, 96.01], [99.0, 101.24], [105.0, 106.52], [110.0, 112.77], [114.0, 114.74], [116.0, 120.73], [125.0, 129.14], [130.0, 130.2], [130.0, 130.87], [132.0, 133.02], [135.0, 135.14], [137.0, 139.68], [143.0, 144.17], [145.0, 146.35], [147.0, 147.83], [150.0, 149.84], [151.0, 151.16], [152.0, 158.14], [159.0, 164.46], [167.0, 173.7], [177.0, 180.57], [182.0, 183.91], [193.0, 204.45]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [34.05, 32.91, 33.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.23, 0.0, 0.0, 0.0, 0.0, 41.76, 0.0, 32.75, 0.0, 32.56, 32.05, 0.0, 0.0, 0.0, 0.0, 55.96, 0.0, 0.0, 0.0, 0.0, 0.0, 31.95, 33.87, 31.55, 35.32, 0.0, 36.36], "audiomae_on_audioset": [[["music", 74.69], ["didgeridoo", 4.29], ["funny music", 1.32]], [["music", 56.01], ["speech", 4.36], ["whimper", 3.55]], [["music", 66.49], ["speech", 6.51], ["boing", 2.15]], null, null, null, null, null, null, null, [["music", 22.2], ["livestock, farm animals, working animals", 16.94], ["speech", 10.1]], null, null, null, null, [["music", 26.81], ["speech", 20.86], ["synthesizer", 10.85]], null, [["moo", 18.91], ["cattle, bovinae", 18.14], ["livestock, farm animals, working animals", 11.31]], null, [["music", 37.87], ["speech", 12.91], ["throbbing", 11.57]], [["music", 35.9], ["groan", 32.09], ["bleat", 3.5]], null, null, null, null, null, null, null, null, null, null, [["music", 45.9], ["didgeridoo", 7.98], ["theremin", 4.6]], [["livestock, farm animals, working animals", 36.54], ["cattle, bovinae", 23.93], ["music", 13.47]], [["music", 37.85], ["cattle, bovinae", 18.9], ["moo", 13.57]], [["speech", 49.23], ["music", 23.4], ["fart", 4.42]], null, [["theremin", 49.84], ["music", 35.32], ["musical instrument", 2.05]]], "duration": [16.03, 9.16, 11.3, -0.42, 1.04, 0.55, 0.56, -0.14, 1.1, 0.84, 9.22, 0.37, 1.91, 0.78, 0.01, 2.24, 1.52, 2.77, 0.74, 4.73, 4.14, 0.2, 0.87, 1.02, 0.14, 2.68, 1.17, 1.35, 0.83, -0.16, 0.16, 6.14, 5.46, 6.7, 3.57, 1.91, 11.45]} \ No newline at end of file diff --git a/annotations_filtered/iaCvBhskyk0_filtered.json b/annotations_filtered/iaCvBhskyk0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8baa792b216c914305e85789569453e0e1c72f89 --- /dev/null +++ b/annotations_filtered/iaCvBhskyk0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.88], [3.0, 3.3], [5.0, 5.59], [6.0, 6.91], [9.0, 9.14], [10.0, 11.28], [12.0, 26.38], [28.0, 47.66], [51.0, 140.66], [141.0, 142.13], [143.0, 143.92], [145.0, 148.12], [150.0, 161.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.53, 36.26, 0.0, 0.0, 0.0, 78.55, 64.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["throbbing", 31.06], ["heart sounds, heartbeat", 26.24], ["hum", 24.56]], null, null, null, null, null], "duration": [0.88, 0.3, 0.59, 0.91, 0.14, 1.28, 14.38, 19.66, 89.66, 1.13, 0.92, 3.12, 11.94]} \ No newline at end of file diff --git a/annotations_filtered/iaQdh-Hbp3I_filtered.json b/annotations_filtered/iaQdh-Hbp3I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..049774f5f29e87f3d77ec5f7f2f5076f32f611b8 --- /dev/null +++ b/annotations_filtered/iaQdh-Hbp3I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.77]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.77]} \ No newline at end of file diff --git a/annotations_filtered/iaTG4JflfqM_filtered.json b/annotations_filtered/iaTG4JflfqM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c68023fcc0ba136605e85c1e7cc9848378d7ae0 --- /dev/null +++ b/annotations_filtered/iaTG4JflfqM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.21], [1.0, 1.32], [1.0, 1.92], [9.0, 9.93], [20.0, 20.33], [29.0, 30.69], [35.0, 37.91], [40.0, 41.28], [44.0, 44.58], [45.0, 46.31], [48.0, 48.84], [51.0, 52.56], [59.0, 58.67], [59.0, 62.21], [65.0, 65.16], [69.0, 70.65], [76.0, 77.84], [79.0, 79.03], [82.0, 82.32], [83.0, 83.2], [84.0, 85.6], [89.0, 89.5], [92.0, 93.04], [94.0, 96.38], [98.0, 99.4], [102.0, 102.91], [103.0, 102.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.22, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 21.02], ["speech", 6.07], ["crow", 4.76]], null, null, null], "duration": [0.21, 0.32, 0.92, 0.93, 0.33, 1.69, 2.91, 1.28, 0.58, 1.31, 0.84, 1.56, -0.33, 3.21, 0.16, 1.65, 1.84, 0.03, 0.32, 0.2, 1.6, 0.5, 1.04, 2.38, 1.4, 0.91, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/iamsdf-VSQI_filtered.json b/annotations_filtered/iamsdf-VSQI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c83b18c6c72a7a815d7231ae4bb3ce5b2ea7fe8f --- /dev/null +++ b/annotations_filtered/iamsdf-VSQI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.95], [3.0, 5.0], [11.0, 10.89], [13.0, 16.23], [17.0, 25.19], [26.0, 26.49], [27.0, 27.48], [29.0, 29.67], [35.0, 35.16], [36.0, 39.66], [41.0, 42.08], [44.0, 45.28], [46.0, 49.23], [50.0, 50.99], [52.0, 54.33], [57.0, 56.91], [59.0, 66.14], [67.0, 67.41], [68.0, 68.28], [68.0, 75.12], [76.0, 83.19], [85.0, 87.49], [89.0, 91.03], [92.0, 92.75], [94.0, 94.96], [95.0, 95.99], [96.0, 98.81], [100.0, 100.68], [101.0, 112.6], [115.0, 121.44], [122.0, 124.88], [126.0, 127.74]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 48.56, 0.0, 75.55, 83.34, 0.0, 0.0, 0.0, 0.0, 29.39, 0.0, 0.0, 33.09, 0.0, 60.23, 0.0, 58.13, 0.0, 0.0, 47.2, 45.05, 44.66, 49.64, 0.0, 0.0, 0.0, 55.67, 0.0, 66.76, 64.75, 50.66, 0.0], "audiomae_on_audioset": [null, [["hum", 14.18], ["mains hum", 12.09], ["sine wave", 10.93]], null, null, null, null, null, null, null, [["speech", 83.27], ["laughter", 2.94], ["male speech, man speaking", 1.86]], null, null, [["hum", 29.74], ["mains hum", 29.28], ["speech", 19.13]], null, null, null, null, null, null, [["hum", 48.45], ["mains hum", 21.14], ["radio", 13.25]], [["hum", 17.03], ["mains hum", 13.14], ["frog", 8.77]], [["hum", 31.74], ["mains hum", 13.05], ["radio", 11.95]], [["livestock, farm animals, working animals", 11.11], ["frog", 10.88], ["croak", 6.39]], null, null, null, null, null, null, null, null, null], "duration": [0.95, 2.0, -0.11, 3.23, 8.19, 0.49, 0.48, 0.67, 0.16, 3.66, 1.08, 1.28, 3.23, 0.99, 2.33, -0.09, 7.14, 0.41, 0.28, 7.12, 7.19, 2.49, 2.03, 0.75, 0.96, 0.99, 2.81, 0.68, 11.6, 6.44, 2.88, 1.74]} \ No newline at end of file diff --git a/annotations_filtered/iaofBseh0J8_filtered.json b/annotations_filtered/iaofBseh0J8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ae0120444497728ba53071d9f880b13414c24d8 --- /dev/null +++ b/annotations_filtered/iaofBseh0J8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.68], [6.0, 6.12], [9.0, 9.66], [12.0, 12.6], [16.0, 16.73], [21.0, 21.57], [23.0, 24.26], [32.0, 32.34], [38.0, 39.04], [42.0, 43.56], [47.0, 47.29], [49.0, 49.49], [51.0, 51.98], [53.0, 53.79], [57.0, 57.18], [66.0, 66.19], [72.0, 72.66], [76.0, 76.25], [77.0, 77.68], [81.0, 83.02], [84.0, 85.11], [87.0, 87.86], [90.0, 90.68], [95.0, 95.71], [100.0, 100.53], [101.0, 101.93], [106.0, 106.69], [109.0, 109.73], [111.0, 111.99], [115.0, 117.27], [118.0, 119.53], [120.0, 121.69], [122.0, 122.98], [123.0, 126.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.57, 0.0, 0.0, 0.0, 43.28], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 25.02], ["hum", 21.36], ["mains hum", 9.12]], null, null, null, [["music", 52.84], ["speech", 17.3], ["inside, small room", 3.4]]], "duration": [1.68, 0.12, 0.66, 0.6, 0.73, 0.57, 1.26, 0.34, 1.04, 1.56, 0.29, 0.49, 0.98, 0.79, 0.18, 0.19, 0.66, 0.25, 0.68, 2.02, 1.11, 0.86, 0.68, 0.71, 0.53, 0.93, 0.69, 0.73, 0.99, 2.27, 1.53, 1.69, 0.98, 3.15]} \ No newline at end of file diff --git a/annotations_filtered/ib3Hn188Jwc_filtered.json b/annotations_filtered/ib3Hn188Jwc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dbc939adf0a3e2f302826f7a0a94fba12aef9914 --- /dev/null +++ b/annotations_filtered/ib3Hn188Jwc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[61.0, 63.71], [64.0, 64.96], [70.0, 72.13], [73.0, 75.42], [76.0, 77.18], [80.0, 81.51], [82.0, 85.11], [86.0, 86.0], [95.0, 96.13], [99.0, 99.64]], "keep_status": [true, false, false, false, false, false, true, false, false, false], "silence_prob": [34.88, 0.0, 38.95, 44.15, 0.0, 0.0, 46.22, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["sidetone", 21.65], ["speech", 14.59], ["music", 8.03]], null, [["music", 79.69], ["didgeridoo", 2.53], ["musical instrument", 1.13]], [["mains hum", 34.5], ["hum", 31.81], ["music", 8.62]], null, null, [["mains hum", 33.96], ["hum", 30.54], ["music", 4.38]], null, null, null], "duration": [2.71, 0.96, 2.13, 2.42, 1.18, 1.51, 3.11, 0.0, 1.13, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/ibAU8weiUOI_filtered.json b/annotations_filtered/ibAU8weiUOI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d653c669b820ef402bfc446cde611b794169db58 --- /dev/null +++ b/annotations_filtered/ibAU8weiUOI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.44], [19.0, 18.99], [25.0, 30.54], [33.0, 35.18], [39.0, 41.08], [42.0, 42.58], [49.0, 49.52], [56.0, 55.66], [60.0, 75.36], [78.0, 82.34], [86.0, 86.85], [88.0, 89.33], [93.0, 95.62], [100.0, 104.95], [108.0, 109.51], [111.0, 113.22], [116.0, 116.97], [118.0, 118.05], [124.0, 125.04], [126.0, 126.71], [128.0, 137.51], [140.0, 140.61], [141.0, 142.75], [144.0, 144.53], [147.0, 150.6], [151.0, 172.42]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 28.99, 29.31, 30.78, 0.0, 0.0, 0.0, 30.45, 35.82, 0.0, 0.0, 47.31, 30.75, 0.0, 32.19, 0.0, 0.0, 0.0, 0.0, 28.57, 0.0, 0.0, 0.0, 35.68, 28.91], "audiomae_on_audioset": [null, null, [["music", 40.04], ["mains hum", 14.57], ["hum", 9.01]], [["music", 70.3], ["cacophony", 9.85], ["throbbing", 2.48]], [["music", 22.42], ["throbbing", 14.79], ["hum", 13.56]], null, null, null, [["hum", 56.24], ["mains hum", 26.32], ["throbbing", 12.57]], [["hum", 32.45], ["throbbing", 19.94], ["music", 19.73]], null, null, [["music", 56.45], ["throbbing", 8.34], ["hum", 6.5]], [["hum", 44.15], ["throbbing", 22.97], ["music", 13.06]], null, [["throbbing", 24.32], ["hum", 18.02], ["music", 9.83]], null, null, null, null, [["speech", 49.55], ["music", 21.8], ["throbbing", 6.48]], null, null, null, [["music", 31.5], ["throbbing", 22.07], ["hum", 9.88]], [["hum", 44.22], ["throbbing", 24.41], ["mains hum", 15.63]]], "duration": [0.44, -0.01, 5.54, 2.18, 2.08, 0.58, 0.52, -0.34, 15.36, 4.34, 0.85, 1.33, 2.62, 4.95, 1.51, 2.22, 0.97, 0.05, 1.04, 0.71, 9.51, 0.61, 1.75, 0.53, 3.6, 21.42]} \ No newline at end of file diff --git a/annotations_filtered/ibcYEwzgai8_filtered.json b/annotations_filtered/ibcYEwzgai8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/ibcYEwzgai8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/ibeJlYiMz9w_filtered.json b/annotations_filtered/ibeJlYiMz9w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27d7d8a683073efd5dcb4568a0325dfbd7e4b576 --- /dev/null +++ b/annotations_filtered/ibeJlYiMz9w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 40.44], [41.0, 59.53], [62.0, 94.36], [94.0, 97.11], [99.0, 101.71], [109.0, 109.92], [112.0, 114.66]], "keep_status": [true, true, false, true, true, false, false], "silence_prob": [32.48, 32.18, 0.0, 32.24, 45.85, 0.0, 94.52], "audiomae_on_audioset": [[["whale vocalization", 32.2], ["hum", 9.57], ["animal", 6.98]], [["speech", 15.93], ["livestock, farm animals, working animals", 15.73], ["hum", 11.0]], null, [["speech", 19.23], ["music", 10.91], ["mains hum", 7.73]], [["music", 35.5], ["throbbing", 13.15], ["hum", 7.1]], null, null], "duration": [23.44, 18.53, 32.36, 3.11, 2.71, 0.92, 2.66]} \ No newline at end of file diff --git a/annotations_filtered/ic9PvDGkzf8_filtered.json b/annotations_filtered/ic9PvDGkzf8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..311255c524ccb02a96634f94745f9165fdf87cb7 --- /dev/null +++ b/annotations_filtered/ic9PvDGkzf8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 20.16], [22.0, 23.09], [26.0, 26.6], [28.0, 30.87], [33.0, 33.4], [35.0, 34.94], [38.0, 39.78], [40.0, 41.66], [46.0, 46.03], [49.0, 50.04], [51.0, 51.95], [53.0, 53.49], [58.0, 59.78], [61.0, 72.76], [76.0, 77.03], [80.0, 81.35], [82.0, 83.44]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.3, 0.0, 0.0, 79.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.01, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 40.74], ["gong", 20.28], ["speech", 6.43]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.16, 1.09, 0.6, 2.87, 0.4, -0.06, 1.78, 1.66, 0.03, 1.04, 0.95, 0.49, 1.78, 11.76, 1.03, 1.35, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/iddBzE3syI4_filtered.json b/annotations_filtered/iddBzE3syI4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f3792ff9500a61d721e0aced4cae748c37076e7 --- /dev/null +++ b/annotations_filtered/iddBzE3syI4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.05], [18.0, 21.0], [23.0, 23.04], [23.0, 35.68], [38.0, 39.21], [41.0, 41.07], [41.0, 59.24], [60.0, 61.62], [65.0, 64.56]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 68.15, 0.0, 59.51, 0.0, 0.0, 63.42, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.05, 3.0, 0.04, 12.68, 1.21, 0.07, 18.24, 1.62, -0.44]} \ No newline at end of file diff --git a/annotations_filtered/idfa7VqkSOw_filtered.json b/annotations_filtered/idfa7VqkSOw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a6fa0fbd308d4b5639a2c4066b9d982beb46dbf --- /dev/null +++ b/annotations_filtered/idfa7VqkSOw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 61.45], [63.0, 63.49], [64.0, 70.17], [70.0, 84.4], [88.0, 88.6], [90.0, 90.68], [92.0, 93.39], [96.0, 99.33]], "keep_status": [false, false, true, false, false, false, false, true], "silence_prob": [31.74, 0.0, 31.21, 31.77, 0.0, 0.0, 0.0, 33.6], "audiomae_on_audioset": [[["music", 49.65], ["speech", 22.52], ["hum", 2.51]], null, [["music", 49.4], ["hum", 7.32], ["whale vocalization", 6.14]], [["music", 64.82], ["animal", 5.72], ["throbbing", 3.69]], null, null, null, [["music", 32.77], ["didgeridoo", 17.06], ["theremin", 5.9]]], "duration": [20.45, 0.49, 6.17, 14.4, 0.6, 0.68, 1.39, 3.33]} \ No newline at end of file diff --git a/annotations_filtered/idvqLiOeLgc_filtered.json b/annotations_filtered/idvqLiOeLgc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..682f369a6eea986dcb1039a78d0dd4b01e288fdc --- /dev/null +++ b/annotations_filtered/idvqLiOeLgc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.91], [8.0, 7.91], [9.0, 40.49], [49.0, 74.06], [92.0, 108.87], [111.0, 122.89], [128.0, 141.08], [144.0, 147.53], [151.0, 151.63], [152.0, 176.22], [179.0, 179.64]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.21, 29.91, 31.1, 30.37, 32.52, 0.0, 29.88, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 69.33], ["throbbing", 7.7], ["hum", 2.65]], [["music", 61.71], ["burst, pop", 4.65], ["bang", 3.09]], [["music", 68.67], ["speech", 9.08], ["didgeridoo", 5.02]], [["music", 48.88], ["groan", 10.76], ["buzz", 5.35]], [["music", 34.46], ["trombone", 33.17], ["brass instrument", 8.23]], null, [["music", 81.24], ["buzz", 2.43], ["cacophony", 1.67]], null], "duration": [-0.09, -0.09, 31.49, 25.06, 16.87, 11.89, 13.08, 3.53, 0.63, 24.22, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/idxHUQY4aDA_filtered.json b/annotations_filtered/idxHUQY4aDA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..697e426ca9a910c189c1d00538678f0c9b913858 --- /dev/null +++ b/annotations_filtered/idxHUQY4aDA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.73], [7.0, 8.23], [11.0, 12.8], [13.0, 14.82], [20.0, 20.61], [22.0, 23.68], [24.0, 24.63], [27.0, 27.08], [31.0, 30.91], [39.0, 39.06], [41.0, 41.79], [48.0, 48.37], [64.0, 64.42], [69.0, 70.26], [71.0, 72.39], [84.0, 83.93], [93.0, 96.28], [97.0, 98.36], [99.0, 98.86], [99.0, 99.57], [101.0, 101.21], [102.0, 103.13], [106.0, 106.68], [115.0, 115.35]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [42.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["mains hum", 35.06], ["hum", 15.93], ["music", 11.16]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.73, 1.23, 1.8, 1.82, 0.61, 1.68, 0.63, 0.08, -0.09, 0.06, 0.79, 0.37, 0.42, 1.26, 1.39, -0.07, 3.28, 1.36, -0.14, 0.57, 0.21, 1.13, 0.68, 0.35]} \ No newline at end of file diff --git a/annotations_filtered/ie7XVOuzf2U_filtered.json b/annotations_filtered/ie7XVOuzf2U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca1d9ab2a4b26fea2e8051d50f45f2a1fc84b157 --- /dev/null +++ b/annotations_filtered/ie7XVOuzf2U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 7.75], [8.0, 10.35], [20.0, 31.77], [33.0, 34.3], [37.0, 38.87], [39.0, 40.2], [41.0, 45.01], [46.0, 49.35], [52.0, 54.06], [56.0, 57.99], [59.0, 58.65], [59.0, 60.37], [61.0, 82.0], [83.0, 86.86], [88.0, 91.07], [95.0, 96.35], [98.0, 98.44], [105.0, 110.47], [111.0, 113.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 100.0, 99.99, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 0.0, 0.0, 99.95, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.75, 2.35, 11.77, 1.3, 1.87, 1.2, 4.01, 3.35, 2.06, 1.99, -0.35, 1.37, 21.0, 3.86, 3.07, 1.35, 0.44, 5.47, 2.9]} \ No newline at end of file diff --git a/annotations_filtered/ieVPPV5S0Ps_filtered.json b/annotations_filtered/ieVPPV5S0Ps_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbe48fe6f5ba7b606af0fdebd83b03ee5243d27f --- /dev/null +++ b/annotations_filtered/ieVPPV5S0Ps_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 35.31], [38.0, 41.39], [42.0, 42.45], [42.0, 42.63], [43.0, 84.45], [88.0, 123.82], [126.0, 132.49]], "keep_status": [false, true, false, false, false, false, true], "silence_prob": [0.0, 31.2, 0.0, 0.0, 0.0, 0.0, 31.0], "audiomae_on_audioset": [null, [["wild animals", 25.37], ["roaring cats (lions, tigers)", 19.26], ["animal", 11.88]], null, null, null, null, [["music", 40.9], ["hum", 18.72], ["mains hum", 10.29]]], "duration": [35.31, 3.39, 0.45, 0.63, 41.45, 35.82, 6.49]} \ No newline at end of file diff --git a/annotations_filtered/iedK7wzunWo_filtered.json b/annotations_filtered/iedK7wzunWo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc960fb0a3e8b5a30bdbbd0a9fac4fff7c3d4aed --- /dev/null +++ b/annotations_filtered/iedK7wzunWo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.81], [8.0, 7.92], [9.0, 18.86], [20.0, 20.02], [21.0, 21.54], [26.0, 26.81], [28.0, 28.51], [30.0, 61.11], [63.0, 86.51], [87.0, 87.35], [88.0, 91.23], [92.0, 92.47], [93.0, 93.36], [95.0, 98.66], [99.0, 99.76], [100.0, 102.25], [103.0, 106.46], [108.0, 107.86], [109.0, 109.41], [110.0, 121.61], [122.0, 123.18], [124.0, 124.63], [125.0, 125.41], [126.0, 127.65], [130.0, 130.6], [131.0, 131.97], [133.0, 139.28], [140.0, 153.69], [155.0, 155.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 76.86, 0.0, 0.0, 0.0, 0.0, 0.0, 40.12, 0.0, 99.05, 0.0, 0.0, 99.62, 0.0, 88.83, 99.16, 0.0, 0.0, 99.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 76.86, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 75.28], ["hum", 4.54], ["noise", 2.77]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, -0.08, 9.86, 0.02, 0.54, 0.81, 0.51, 31.11, 23.51, 0.35, 3.23, 0.47, 0.36, 3.66, 0.76, 2.25, 3.46, -0.14, 0.41, 11.61, 1.18, 0.63, 0.41, 1.65, 0.6, 0.97, 6.28, 13.69, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/ielkiD8w-M8_filtered.json b/annotations_filtered/ielkiD8w-M8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..153dcaf0a208443ffb4b53601fc29aaf0eebdf1c --- /dev/null +++ b/annotations_filtered/ielkiD8w-M8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.41], [7.0, 14.28], [17.0, 62.29]], "keep_status": [true, true, false], "silence_prob": [39.43, 44.9, 0.0], "audiomae_on_audioset": [[["hum", 25.36], ["music", 17.24], ["mains hum", 10.88]], [["music", 33.66], ["hum", 23.79], ["mains hum", 6.48]], null], "duration": [2.41, 7.28, 45.29]} \ No newline at end of file diff --git a/annotations_filtered/if34bKbBqXI_filtered.json b/annotations_filtered/if34bKbBqXI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a5f18611957d51647bac413c0f20b5163aae77f --- /dev/null +++ b/annotations_filtered/if34bKbBqXI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.86], [11.0, 15.21], [20.0, 20.88], [22.0, 22.22], [30.0, 31.97], [34.0, 39.5], [41.0, 41.49], [43.0, 45.35], [47.0, 48.83], [51.0, 53.08], [54.0, 55.61], [57.0, 59.26], [63.0, 65.03], [66.0, 66.7], [68.0, 68.0], [70.0, 71.56], [72.0, 73.55], [75.0, 75.1], [77.0, 78.27], [82.0, 83.27], [85.0, 86.63], [88.0, 88.62], [89.0, 90.41], [93.0, 95.94], [97.0, 97.87], [99.0, 100.82], [104.0, 103.86], [107.0, 108.33], [114.0, 114.64], [119.0, 119.8], [122.0, 123.79], [124.0, 125.52], [126.0, 126.94], [128.0, 128.78], [131.0, 132.12], [133.0, 135.11], [137.0, 136.98], [138.0, 137.81], [139.0, 142.01], [144.0, 145.56], [147.0, 147.39], [148.0, 149.88], [151.0, 151.63], [154.0, 155.7], [160.0, 161.33], [166.0, 168.1], [170.0, 170.61], [172.0, 175.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 64.75, 0.0, 0.0, 0.0, 42.08, 0.0, 43.61, 0.0, 59.07, 0.0, 36.47, 35.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.06, 0.0, 0.0, 52.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.8, 0.0, 69.2], "audiomae_on_audioset": [null, null, null, null, null, [["cattle, bovinae", 43.5], ["moo", 31.84], ["livestock, farm animals, working animals", 21.54]], null, [["speech", 51.29], ["hum", 23.83], ["throbbing", 3.53]], null, null, null, [["cattle, bovinae", 41.36], ["moo", 28.22], ["livestock, farm animals, working animals", 25.4]], [["cattle, bovinae", 41.43], ["moo", 29.97], ["livestock, farm animals, working animals", 27.5]], null, null, null, null, null, null, null, null, null, null, [["speech", 48.95], ["music", 25.64], ["synthesizer", 3.16]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.86, 4.21, 0.88, 0.22, 1.97, 5.5, 0.49, 2.35, 1.83, 2.08, 1.61, 2.26, 2.03, 0.7, 0.0, 1.56, 1.55, 0.1, 1.27, 1.27, 1.63, 0.62, 1.41, 2.94, 0.87, 1.82, -0.14, 1.33, 0.64, 0.8, 1.79, 1.52, 0.94, 0.78, 1.12, 2.11, -0.02, -0.19, 3.01, 1.56, 0.39, 1.88, 0.63, 1.7, 1.33, 2.1, 0.61, 3.66]} \ No newline at end of file diff --git a/annotations_filtered/if5npkJHfik_filtered.json b/annotations_filtered/if5npkJHfik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9fee5459e5600f7d258928603e64e977ed332a3f --- /dev/null +++ b/annotations_filtered/if5npkJHfik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.95], [11.0, 13.73], [14.0, 15.21], [16.0, 16.92], [20.0, 21.03], [22.0, 25.44], [26.0, 30.2], [31.0, 32.61], [37.0, 39.48], [40.0, 55.29], [58.0, 61.64], [62.0, 66.92], [68.0, 89.6], [91.0, 93.46], [94.0, 96.97], [102.0, 115.11]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, false, true, true, true], "silence_prob": [0.0, 45.98, 0.0, 0.0, 0.0, 63.85, 35.09, 0.0, 72.75, 48.74, 38.72, 47.46, 53.1, 33.73, 36.19, 33.01], "audiomae_on_audioset": [null, [["hum", 16.82], ["music", 6.44], ["speech", 6.26]], null, null, null, null, [["mains hum", 41.64], ["hum", 30.38], ["speech", 5.63]], null, null, [["hum", 48.91], ["mains hum", 26.89], ["music", 11.24]], [["speech", 31.07], ["hum", 12.96], ["mains hum", 12.2]], [["hum", 48.97], ["throbbing", 17.2], ["mains hum", 15.68]], null, [["music", 33.15], ["theremin", 8.46], ["musical instrument", 5.96]], [["music", 24.17], ["ratchet, pawl", 4.62], ["gears", 4.42]], [["music", 46.87], ["cello", 12.29], ["musical instrument", 8.86]]], "duration": [1.95, 2.73, 1.21, 0.92, 1.03, 3.44, 4.2, 1.61, 2.48, 15.29, 3.64, 4.92, 21.6, 2.46, 2.97, 13.11]} \ No newline at end of file diff --git a/annotations_filtered/ifG_E9BKfuc_filtered.json b/annotations_filtered/ifG_E9BKfuc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a1b7185fcb3954e0c9b7caf72ab5d5ec0c33996 --- /dev/null +++ b/annotations_filtered/ifG_E9BKfuc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.07], [8.0, 9.41], [14.0, 15.63], [16.0, 17.09], [18.0, 19.18], [23.0, 23.46], [27.0, 27.16], [37.0, 38.47], [39.0, 40.14], [41.0, 43.04], [43.0, 44.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.94, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 77.89], ["musical instrument", 5.65], ["guitar", 3.01]], null], "duration": [0.07, 1.41, 1.63, 1.09, 1.18, 0.46, 0.16, 1.47, 1.14, 2.04, 1.69]} \ No newline at end of file diff --git a/annotations_filtered/ifYK21xsVtI_filtered.json b/annotations_filtered/ifYK21xsVtI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23669d2c0c7934e234af2e4979d32e631622269c --- /dev/null +++ b/annotations_filtered/ifYK21xsVtI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.47], [5.0, 5.59], [7.0, 7.62], [9.0, 9.64], [11.0, 11.82], [15.0, 15.38], [18.0, 17.86], [25.0, 29.13]], "keep_status": [false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.82], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 22.02], ["whale vocalization", 10.49], ["fly, housefly", 9.95]]], "duration": [1.47, 0.59, 0.62, 0.64, 0.82, 0.38, -0.14, 4.13]} \ No newline at end of file diff --git a/annotations_filtered/ifkYHEoe6_k_filtered.json b/annotations_filtered/ifkYHEoe6_k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..990db7355741d3f77bffd48e9278ab3251826139 --- /dev/null +++ b/annotations_filtered/ifkYHEoe6_k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.18], [24.0, 24.36], [26.0, 26.27], [31.0, 31.26], [41.0, 41.12], [44.0, 44.91], [47.0, 48.0], [55.0, 56.05], [57.0, 57.59], [60.0, 60.56], [66.0, 66.51], [67.0, 68.13], [69.0, 69.75], [78.0, 78.53], [80.0, 81.5], [83.0, 84.74], [88.0, 88.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.18, 0.36, 0.27, 0.26, 0.12, 0.91, 1.0, 1.05, 0.59, 0.56, 0.51, 1.13, 0.75, 0.53, 1.5, 1.74, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/ig80r0pbEv4_filtered.json b/annotations_filtered/ig80r0pbEv4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e44298197982c76d6b722b4cd24c13fd380a4fa --- /dev/null +++ b/annotations_filtered/ig80r0pbEv4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 36.73], [42.0, 44.68], [45.0, 44.71], [45.0, 44.76], [45.0, 44.85], [51.0, 81.87], [82.0, 81.9], [82.0, 111.82], [116.0, 118.45], [119.0, 122.82]], "keep_status": [false, false, false, false, false, false, false, true, false, true], "silence_prob": [50.26, 84.98, 0.0, 0.0, 0.0, 0.0, 0.0, 46.43, 50.61, 31.96], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 34.28], ["hum", 15.69], ["mains hum", 10.48]], null, [["hum", 20.88], ["mains hum", 20.32], ["music", 20.12]]], "duration": [20.73, 2.68, -0.29, -0.24, -0.15, 30.87, -0.1, 29.82, 2.45, 3.82]} \ No newline at end of file diff --git a/annotations_filtered/igEO_oyUs6U_filtered.json b/annotations_filtered/igEO_oyUs6U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8beded7cc1ee75c349979925bb72d299858a09ca --- /dev/null +++ b/annotations_filtered/igEO_oyUs6U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.21], [18.0, 20.33], [21.0, 22.22], [23.0, 38.79], [40.0, 44.96], [45.0, 64.93], [66.0, 67.66], [69.0, 112.63], [114.0, 116.36]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 56.4, 0.0, 47.27, 45.02, 32.89, 0.0, 0.0, 60.98], "audiomae_on_audioset": [null, null, null, [["hum", 59.01], ["mains hum", 14.43], ["throbbing", 12.66]], [["music", 59.16], ["synthesizer", 6.2], ["hum", 5.65]], [["music", 47.63], ["mains hum", 15.84], ["hum", 10.75]], null, null, null], "duration": [1.21, 2.33, 1.22, 15.79, 4.96, 19.93, 1.66, 43.63, 2.36]} \ No newline at end of file diff --git a/annotations_filtered/iga0_T5B8dU_filtered.json b/annotations_filtered/iga0_T5B8dU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58f9ce3b0d1724ccbe48eb296c535f4c2dc8d2bb --- /dev/null +++ b/annotations_filtered/iga0_T5B8dU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.69], [14.0, 15.4], [24.0, 26.32], [28.0, 29.25], [31.0, 35.01], [38.0, 46.13], [53.0, 55.86], [57.0, 61.2], [63.0, 74.7], [75.0, 74.76], [76.0, 84.05], [87.0, 96.5], [97.0, 97.23], [100.0, 108.41], [109.0, 109.19]], "keep_status": [false, false, false, false, true, false, false, true, true, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 36.17, 0.0, 40.26, 36.32, 35.92, 30.74, 31.86, 0.0, 30.81, 31.96, 0.0, 33.55, 0.0], "audiomae_on_audioset": [null, null, [["didgeridoo", 48.42], ["music", 19.02], ["theremin", 9.64]], null, [["music", 52.3], ["hum", 7.83], ["throbbing", 7.82]], [["mains hum", 50.2], ["hum", 33.81], ["music", 6.02]], [["music", 63.39], ["bleat", 11.12], ["sheep", 6.29]], [["bleat", 29.61], ["sheep", 18.52], ["livestock, farm animals, working animals", 16.68]], [["animal", 30.84], ["horse", 18.52], ["neigh, whinny", 17.52]], null, [["fart", 29.45], ["animal", 16.67], ["livestock, farm animals, working animals", 14.8]], [["animal", 32.76], ["roaring cats (lions, tigers)", 20.25], ["speech", 17.94]], null, [["fart", 19.89], ["speech", 11.96], ["animal", 11.38]], null], "duration": [0.69, 1.4, 2.32, 1.25, 4.01, 8.13, 2.86, 4.2, 11.7, -0.24, 8.05, 9.5, 0.23, 8.41, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/ih9NffWqWgM_filtered.json b/annotations_filtered/ih9NffWqWgM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f98ad11cfd95f455e25a0f0998d44814f1155cd --- /dev/null +++ b/annotations_filtered/ih9NffWqWgM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.75], [11.0, 14.08], [16.0, 17.98], [19.0, 26.54], [27.0, 31.78], [34.0, 37.22], [38.0, 44.79], [48.0, 67.09], [71.0, 133.47], [135.0, 136.19], [137.0, 138.82], [140.0, 141.03], [142.0, 143.02], [145.0, 145.61]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [72.31, 34.83, 0.0, 35.21, 30.73, 34.84, 32.39, 28.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 44.11], ["mains hum", 14.28], ["music", 14.12]], null, [["music", 48.79], ["hum", 20.53], ["mains hum", 7.23]], [["hum", 34.78], ["music", 22.96], ["mains hum", 16.45]], [["hum", 43.1], ["throbbing", 28.36], ["mains hum", 14.16]], [["hum", 54.05], ["throbbing", 25.75], ["mains hum", 17.47]], [["music", 37.19], ["cacophony", 23.9], ["noise", 3.97]], null, null, null, null, null, null], "duration": [2.75, 3.08, 1.98, 7.54, 4.78, 3.22, 6.79, 19.09, 62.47, 1.19, 1.82, 1.03, 1.02, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/ihKHvNOTcwk_filtered.json b/annotations_filtered/ihKHvNOTcwk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..565983128772759741c57c73b829693fdc057b76 --- /dev/null +++ b/annotations_filtered/ihKHvNOTcwk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.94], [16.0, 16.9], [20.0, 22.84], [24.0, 38.5], [40.0, 41.03], [43.0, 65.67], [66.0, 79.83], [80.0, 81.94], [82.0, 86.07], [87.0, 89.29], [95.0, 95.18], [97.0, 97.34], [100.0, 100.38], [102.0, 104.4], [105.0, 105.54], [106.0, 106.66], [115.0, 125.64], [128.0, 137.89], [151.0, 152.04], [153.0, 166.6], [168.0, 168.52]], "keep_status": [true, false, false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [47.66, 0.0, 47.43, 35.8, 0.0, 30.99, 32.75, 0.0, 41.22, 78.89, 0.0, 0.0, 0.0, 91.98, 0.0, 0.0, 33.43, 33.08, 0.0, 34.6, 0.0], "audiomae_on_audioset": [[["music", 61.62], ["soundtrack music", 4.05], ["synthesizer", 3.91]], null, [["fly, housefly", 64.98], ["insect", 16.88], ["mosquito", 14.11]], [["insect", 25.19], ["fly, housefly", 23.34], ["mosquito", 23.11]], null, [["speech", 35.74], ["music", 21.61], ["synthesizer", 5.04]], [["music", 30.95], ["groan", 15.24], ["sound effect", 6.59]], null, [["music", 27.87], ["speech", 11.11], ["animal", 7.12]], null, null, null, null, null, null, null, [["music", 60.76], ["boing", 13.18], ["speech", 4.1]], [["music", 55.28], ["fly, housefly", 11.33], ["insect", 4.67]], null, [["fly, housefly", 25.51], ["music", 22.82], ["fart", 6.77]], null], "duration": [2.94, 0.9, 2.84, 14.5, 1.03, 22.67, 13.83, 1.94, 4.07, 2.29, 0.18, 0.34, 0.38, 2.4, 0.54, 0.66, 10.64, 9.89, 1.04, 13.6, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/ihyRhFcUVto_filtered.json b/annotations_filtered/ihyRhFcUVto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39815f895ee6f2b1b64cb2c0d78c706566e08f86 --- /dev/null +++ b/annotations_filtered/ihyRhFcUVto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.34], [5.0, 5.29], [10.0, 9.98], [11.0, 11.43], [12.0, 13.36], [21.0, 20.68], [22.0, 22.52], [23.0, 26.55], [27.0, 27.55], [28.0, 29.25], [37.0, 38.6], [43.0, 42.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.79, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.34, 0.29, -0.02, 0.43, 1.36, -0.32, 0.52, 3.55, 0.55, 1.25, 1.6, -0.01]} \ No newline at end of file diff --git a/annotations_filtered/iiA0J5rKoE4_filtered.json b/annotations_filtered/iiA0J5rKoE4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4973817273602dbccdb2c733284d868532f6da68 --- /dev/null +++ b/annotations_filtered/iiA0J5rKoE4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.08], [0.0, 0.55], [11.0, 33.15], [38.0, 63.42], [64.0, 74.51], [81.0, 81.8], [82.0, 82.9], [89.0, 94.34], [96.0, 96.53], [97.0, 98.95], [100.0, 108.78]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 31.3, 30.33, 30.29, 0.0, 0.0, 33.75, 0.0, 0.0, 34.57], "audiomae_on_audioset": [null, null, [["music", 55.73], ["theremin", 17.28], ["musical instrument", 7.26]], [["music", 51.44], ["trombone", 20.2], ["brass instrument", 11.8]], [["music", 59.49], ["trombone", 14.04], ["brass instrument", 7.48]], null, null, [["fly, housefly", 14.71], ["whale vocalization", 14.28], ["hum", 10.63]], null, null, [["music", 24.7], ["buzz", 10.18], ["noise", 8.24]]], "duration": [0.08, 0.55, 22.15, 25.42, 10.51, 0.8, 0.9, 5.34, 0.53, 1.95, 8.78]} \ No newline at end of file diff --git a/annotations_filtered/iiMNb99KaYk_filtered.json b/annotations_filtered/iiMNb99KaYk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..881052e4ce3594819e8a07bc18216400b5f88fd8 --- /dev/null +++ b/annotations_filtered/iiMNb99KaYk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 37.18], [40.0, 42.43], [47.0, 86.29]], "keep_status": [true, false, false], "silence_prob": [29.36, 32.82, 0.0], "audiomae_on_audioset": [[["music", 19.56], ["throbbing", 10.18], ["bell", 7.03]], [["music", 63.82], ["throbbing", 12.73], ["hum", 7.41]], null], "duration": [6.18, 2.43, 39.29]} \ No newline at end of file diff --git a/annotations_filtered/iiUiiK9dMPg_filtered.json b/annotations_filtered/iiUiiK9dMPg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/iiUiiK9dMPg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/iioBwO6vnEs_filtered.json b/annotations_filtered/iioBwO6vnEs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b3a1d00a422bbcbba520b3e0016fc283a5a1393 --- /dev/null +++ b/annotations_filtered/iioBwO6vnEs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.44], [22.0, 23.68], [25.0, 25.46], [30.0, 31.99], [36.0, 37.32], [40.0, 42.72], [44.0, 45.49], [47.0, 48.96], [52.0, 57.2], [60.0, 62.04], [63.0, 65.99], [70.0, 69.77], [72.0, 71.78], [74.0, 76.42], [78.0, 81.11], [83.0, 83.76], [88.0, 88.57], [92.0, 95.94], [98.0, 98.46], [109.0, 111.81], [114.0, 123.31], [125.0, 126.18]], "keep_status": [false, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false, false, true, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 38.54, 0.0, 0.0, 50.02, 39.96, 43.85, 0.0, 0.0, 45.3, 57.32, 0.0, 0.0, 43.0, 0.0, 42.76, 38.97, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 21.82], ["music", 17.19], ["mains hum", 11.94]], null, null, null, [["music", 60.83], ["theremin", 4.33], ["didgeridoo", 2.37]], [["music", 44.95], ["singing bowl", 14.5], ["musical instrument", 7.84]], null, null, [["music", 40.57], ["speech", 24.0], ["singing bowl", 8.99]], null, null, null, [["music", 27.53], ["speech", 22.91], ["synthesizer", 8.28]], null, [["music", 46.49], ["whale vocalization", 11.79], ["theremin", 6.65]], [["music", 47.67], ["hum", 9.19], ["mains hum", 7.09]], null], "duration": [0.44, 1.68, 0.46, 1.99, 1.32, 2.72, 1.49, 1.96, 5.2, 2.04, 2.99, -0.23, -0.22, 2.42, 3.11, 0.76, 0.57, 3.94, 0.46, 2.81, 9.31, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/ij0JLKDJOrc_filtered.json b/annotations_filtered/ij0JLKDJOrc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab8be65755a8a056692e4f4191053132b8741084 --- /dev/null +++ b/annotations_filtered/ij0JLKDJOrc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.44], [4.0, 4.62], [5.0, 5.71], [9.0, 9.59], [10.0, 10.79], [20.0, 22.94], [30.0, 30.81], [34.0, 34.25], [35.0, 35.48], [38.0, 53.22], [60.0, 61.79], [92.0, 93.51], [95.0, 95.76]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 42.67, 0.0, 0.0, 0.0, 30.14, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 26.53], ["frog", 13.5], ["inside, small room", 5.07]], null, null, null, [["music", 51.76], ["speech", 18.73], ["tubular bells", 2.95]], null, null, null], "duration": [0.44, 0.62, 0.71, 0.59, 0.79, 2.94, 0.81, 0.25, 0.48, 15.22, 1.79, 1.51, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/ij3HAftwQQ0_filtered.json b/annotations_filtered/ij3HAftwQQ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c825021f95853a0cdc3a50c6689ca92e383618ed --- /dev/null +++ b/annotations_filtered/ij3HAftwQQ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.59], [20.0, 21.12], [24.0, 24.19], [29.0, 29.54], [31.0, 31.8], [51.0, 53.42], [55.0, 57.15], [58.0, 58.53], [62.0, 62.58], [64.0, 70.82], [72.0, 73.47], [78.0, 78.66]], "keep_status": [false, false, false, false, false, true, true, false, false, true, false, false], "silence_prob": [31.81, 0.0, 0.0, 0.0, 0.0, 36.64, 40.34, 0.0, 0.0, 32.32, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 33.5], ["hum", 26.35], ["mains hum", 11.52]], null, null, null, null, [["music", 35.35], ["speech", 12.06], ["musical instrument", 5.02]], [["music", 52.22], ["didgeridoo", 4.71], ["musical instrument", 4.7]], null, null, [["music", 50.81], ["didgeridoo", 6.18], ["percussion", 4.41]], null, null], "duration": [4.59, 1.12, 0.19, 0.54, 0.8, 2.42, 2.15, 0.53, 0.58, 6.82, 1.47, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/ijBU9q7fb3U_filtered.json b/annotations_filtered/ijBU9q7fb3U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10538e3cd8f1af6637d1ab80fb6e2d3121847895 --- /dev/null +++ b/annotations_filtered/ijBU9q7fb3U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.04], [6.0, 8.01], [9.0, 9.95], [10.0, 10.45], [11.0, 13.54], [16.0, 16.48], [21.0, 21.39], [22.0, 22.76], [25.0, 25.51], [27.0, 27.06], [31.0, 31.16], [34.0, 34.79], [36.0, 36.86], [39.0, 39.41], [40.0, 40.69], [42.0, 43.6], [45.0, 45.59], [52.0, 55.11], [55.0, 56.84], [57.0, 57.92], [59.0, 59.75], [61.0, 61.53], [65.0, 65.37], [67.0, 67.53], [69.0, 71.41], [75.0, 75.03], [79.0, 80.15], [85.0, 85.87], [93.0, 96.04], [100.0, 119.5], [122.0, 130.32], [137.0, 137.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, true, true, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 66.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.76, 0.0, 0.0, 0.0, 47.27, 30.51, 29.83, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["boing", 20.91], ["moo", 13.95], ["cattle, bovinae", 13.27]], null, null, null, null, null, null, [["boing", 46.88], ["cattle, bovinae", 10.34], ["moo", 8.23]], null, null, null, [["speech", 19.34], ["explosion", 16.43], ["burst, pop", 12.08]], [["speech", 60.92], ["explosion", 6.62], ["music", 1.94]], [["vehicle", 52.33], ["car", 19.4], ["skidding", 9.43]], null], "duration": [1.04, 2.01, 0.95, 0.45, 2.54, 0.48, 0.39, 0.76, 0.51, 0.06, 0.16, 0.79, 0.86, 0.41, 0.69, 1.6, 0.59, 3.11, 1.84, 0.92, 0.75, 0.53, 0.37, 0.53, 2.41, 0.03, 1.15, 0.87, 3.04, 19.5, 8.32, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/ijXLPE7SB3c_filtered.json b/annotations_filtered/ijXLPE7SB3c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56b0ef256caec7ab32f06bca8a555304ceb6b973 --- /dev/null +++ b/annotations_filtered/ijXLPE7SB3c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 35.94], [37.0, 43.8], [45.0, 45.45], [48.0, 49.55], [51.0, 70.7], [72.0, 78.88]], "keep_status": [true, false, false, false, true, false], "silence_prob": [32.07, 44.2, 0.0, 0.0, 43.51, 39.31], "audiomae_on_audioset": [[["music", 52.09], ["noise", 6.77], ["white noise", 4.23]], [["speech", 57.16], ["music", 18.62], ["fly, housefly", 1.79]], null, null, [["music", 32.8], ["hum", 11.73], ["mains hum", 8.89]], [["music", 30.99], ["speech", 21.32], ["throbbing", 18.94]]], "duration": [2.94, 6.8, 0.45, 1.55, 19.7, 6.88]} \ No newline at end of file diff --git a/annotations_filtered/ijaNlufpcMs_filtered.json b/annotations_filtered/ijaNlufpcMs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..046ab8ee905e0183c1afa0b6f78adcfab16ebc9d --- /dev/null +++ b/annotations_filtered/ijaNlufpcMs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.39], [14.0, 47.06], [54.0, 105.38], [114.0, 126.89], [140.0, 140.51]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.71, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 82.74], ["cacophony", 5.61], ["musical instrument", 1.06]], null], "duration": [1.39, 33.06, 51.38, 12.89, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/ijrCSknWjeI_filtered.json b/annotations_filtered/ijrCSknWjeI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7d9bae3366532b6838a3b5097a0a48a38c19dea --- /dev/null +++ b/annotations_filtered/ijrCSknWjeI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[67.0, 67.17], [67.0, 76.54], [77.0, 76.64], [77.0, 81.94], [82.0, 114.64]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 38.72, 0.0, 36.87, 0.0], "audiomae_on_audioset": [null, [["music", 64.17], ["throbbing", 8.05], ["hum", 6.83]], null, [["music", 39.42], ["throbbing", 18.33], ["hum", 7.04]], null], "duration": [0.17, 9.54, -0.36, 4.94, 32.64]} \ No newline at end of file diff --git a/annotations_filtered/ik-n-L9UNTY_filtered.json b/annotations_filtered/ik-n-L9UNTY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd3517c4842e8a982b37c2922f58bf0d112ce4ad --- /dev/null +++ b/annotations_filtered/ik-n-L9UNTY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.77], [30.0, 30.37], [31.0, 118.86], [120.0, 119.89], [120.0, 120.53], [121.0, 136.41]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.73], "audiomae_on_audioset": [null, null, null, null, null, [["music", 79.57], ["musical instrument", 3.61], ["didgeridoo", 2.56]]], "duration": [0.77, 0.37, 87.86, -0.11, 0.53, 15.41]} \ No newline at end of file diff --git a/annotations_filtered/ikWTYTomQI4_filtered.json b/annotations_filtered/ikWTYTomQI4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0e10f163df54e9a8fcce0b92727747a42878bad --- /dev/null +++ b/annotations_filtered/ikWTYTomQI4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.88], [7.0, 12.19], [22.0, 22.25], [23.0, 24.06], [25.0, 30.37], [35.0, 58.5], [59.0, 59.44], [61.0, 61.84], [63.0, 63.41], [65.0, 65.6], [74.0, 78.29], [78.0, 78.38], [79.0, 79.76], [81.0, 81.5], [82.0, 94.15], [102.0, 102.98], [108.0, 118.12], [119.0, 122.45], [126.0, 127.04], [130.0, 130.42], [132.0, 132.97], [137.0, 138.4], [143.0, 144.36], [150.0, 152.54], [154.0, 154.36], [157.0, 157.2], [161.0, 161.08], [163.0, 164.29], [168.0, 171.46], [172.0, 178.68]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.15, 0.0, 0.0, 32.05, 30.98, 0.0, 0.0, 0.0, 0.0, 32.7, 0.0, 0.0, 0.0, 38.31, 0.0, 67.63, 95.37, 0.0, 0.0, 0.0, 0.0, 0.0, 98.93, 0.0, 0.0, 0.0, 0.0, 69.34, 98.59], "audiomae_on_audioset": [null, [["music", 30.2], ["musical instrument", 15.6], ["theremin", 14.95]], null, null, [["music", 38.03], ["didgeridoo", 24.33], ["theremin", 13.24]], [["music", 48.43], ["brass instrument", 16.49], ["trombone", 8.76]], null, null, null, null, [["music", 74.7], ["synthesizer", 5.25], ["musical instrument", 4.74]], null, null, null, [["music", 55.31], ["didgeridoo", 12.15], ["musical instrument", 7.88]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.88, 5.19, 0.25, 1.06, 5.37, 23.5, 0.44, 0.84, 0.41, 0.6, 4.29, 0.38, 0.76, 0.5, 12.15, 0.98, 10.12, 3.45, 1.04, 0.42, 0.97, 1.4, 1.36, 2.54, 0.36, 0.2, 0.08, 1.29, 3.46, 6.68]} \ No newline at end of file diff --git a/annotations_filtered/ik_WAfUpVKQ_filtered.json b/annotations_filtered/ik_WAfUpVKQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91bb2461593728dea4be301b285fc0cacf115d06 --- /dev/null +++ b/annotations_filtered/ik_WAfUpVKQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.67], [16.0, 17.24], [31.0, 34.01], [49.0, 59.34], [62.0, 67.07], [73.0, 73.28], [80.0, 80.6], [83.0, 83.44], [87.0, 92.23], [105.0, 105.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.68, 33.53, 35.19, 0.0, 0.0, 0.0, 40.75, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 45.46], ["synthesizer", 22.07], ["cacophony", 6.86]], [["sidetone", 41.63], ["speech", 31.36], ["music", 8.31]], null, null, null, [["noise", 29.61], ["music", 24.87], ["sidetone", 16.43]], null], "duration": [0.67, 1.24, 3.01, 10.34, 5.07, 0.28, 0.6, 0.44, 5.23, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/ikcKKvKkf4Y_filtered.json b/annotations_filtered/ikcKKvKkf4Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f87ca9e826e28891676e168b3857b125af398d4 --- /dev/null +++ b/annotations_filtered/ikcKKvKkf4Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.93], [12.0, 11.77], [17.0, 18.23], [19.0, 21.29], [22.0, 22.59], [24.0, 25.19], [26.0, 26.55], [37.0, 39.07], [40.0, 42.26], [44.0, 47.76], [52.0, 60.42], [61.0, 62.83], [63.0, 63.73], [65.0, 65.03], [67.0, 67.31], [70.0, 72.67], [73.0, 73.33], [81.0, 82.27], [83.0, 85.02], [91.0, 90.96], [105.0, 105.21], [107.0, 108.43], [119.0, 119.28], [121.0, 125.27], [140.0, 140.56], [151.0, 151.43], [153.0, 152.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 100.0, 53.34, 58.13, 0.0, 0.0, 0.0, 0.0, 80.11, 0.0, 0.0, 55.46, 0.0, 0.0, 0.0, 0.0, 29.15, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 50.63], ["cattle, bovinae", 7.37], ["livestock, farm animals, working animals", 7.35]], null, null, null], "duration": [-0.07, -0.23, 1.23, 2.29, 0.59, 1.19, 0.55, 2.07, 2.26, 3.76, 8.42, 1.83, 0.73, 0.03, 0.31, 2.67, 0.33, 1.27, 2.02, -0.04, 0.21, 1.43, 0.28, 4.27, 0.56, 0.43, -0.02]} \ No newline at end of file diff --git a/annotations_filtered/ikfmhFpbWJk_filtered.json b/annotations_filtered/ikfmhFpbWJk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa2f3992be9ee44180c7284facda9e4ebd27728a --- /dev/null +++ b/annotations_filtered/ikfmhFpbWJk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.38], [2.0, 2.93], [4.0, 5.8], [6.0, 7.72], [9.0, 10.02], [15.0, 17.41], [18.0, 20.65], [21.0, 22.03], [22.0, 38.16], [45.0, 44.52], [46.0, 45.91], [46.0, 45.98], [47.0, 52.52], [56.0, 57.87], [58.0, 60.25], [62.0, 67.27], [68.0, 70.19], [71.0, 73.75], [78.0, 80.65], [83.0, 93.87], [94.0, 95.39], [97.0, 97.41], [101.0, 103.22], [105.0, 105.68], [108.0, 110.64], [112.0, 113.31], [115.0, 117.14], [120.0, 120.53], [121.0, 125.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 97.43, 0.0, 96.29, 0.0, 0.0, 0.0, 92.97, 0.0, 98.27, 99.96, 99.99, 99.85, 71.0, 86.82, 0.0, 0.0, 99.98, 0.0, 99.26, 0.0, 100.0, 0.0, 99.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.38, 0.93, 1.8, 1.72, 1.02, 2.41, 2.65, 1.03, 16.16, -0.48, -0.09, -0.02, 5.52, 1.87, 2.25, 5.27, 2.19, 2.75, 2.65, 10.87, 1.39, 0.41, 2.22, 0.68, 2.64, 1.31, 2.14, 0.53, 4.64]} \ No newline at end of file diff --git a/annotations_filtered/ikqDLmNc678_filtered.json b/annotations_filtered/ikqDLmNc678_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1b0d06aef731a8402333aec93d2662bc6428778 --- /dev/null +++ b/annotations_filtered/ikqDLmNc678_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 25.14], [36.0, 39.58], [45.0, 45.77], [52.0, 62.82], [69.0, 74.43], [75.0, 83.27], [85.0, 85.24], [87.0, 88.06], [92.0, 92.25], [93.0, 93.19], [99.0, 99.72], [100.0, 102.46], [103.0, 113.78], [121.0, 134.65], [137.0, 143.26], [144.0, 144.85], [146.0, 146.65], [148.0, 154.8]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.18, 81.17, 0.0, 34.81, 50.71, 39.24, 0.0, 0.0, 0.0, 0.0, 0.0, 84.98, 99.87, 98.93, 97.33, 0.0, 0.0, 97.22], "audiomae_on_audioset": [[["music", 43.95], ["fly, housefly", 4.17], ["clip-clop", 3.91]], null, null, [["speech", 51.4], ["vehicle", 11.56], ["car", 4.96]], null, [["speech", 40.19], ["explosion", 26.3], ["burst, pop", 5.05]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.14, 3.58, 0.77, 10.82, 5.43, 8.27, 0.24, 1.06, 0.25, 0.19, 0.72, 2.46, 10.78, 13.65, 6.26, 0.85, 0.65, 6.8]} \ No newline at end of file diff --git a/annotations_filtered/ikqLKMZ86d8_filtered.json b/annotations_filtered/ikqLKMZ86d8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6227bb7c4d57674862f81e567ad386f8e063a173 --- /dev/null +++ b/annotations_filtered/ikqLKMZ86d8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.05], [14.0, 22.13], [22.0, 23.13], [26.0, 26.23], [27.0, 27.41], [38.0, 39.43], [39.0, 39.46], [39.0, 41.99], [45.0, 48.42], [51.0, 51.92], [53.0, 53.16], [54.0, 55.54], [57.0, 60.34], [63.0, 66.5], [67.0, 69.36], [71.0, 74.21], [75.0, 74.85], [75.0, 83.22], [87.0, 87.35], [90.0, 90.17], [91.0, 94.85], [101.0, 106.08], [110.0, 115.03], [119.0, 118.79], [119.0, 119.97], [120.0, 120.95], [121.0, 121.69], [128.0, 128.24]], "keep_status": [true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, true, true, true, false, false, false, false, false], "silence_prob": [40.12, 33.26, 0.0, 0.0, 0.0, 0.0, 0.0, 38.9, 48.19, 0.0, 0.0, 0.0, 98.51, 50.11, 89.72, 47.27, 0.0, 33.48, 0.0, 0.0, 34.27, 33.37, 32.11, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["fly, housefly", 17.75], ["mosquito", 12.7], ["speech", 12.46]], [["music", 28.86], ["speech", 12.66], ["animal", 8.67]], null, null, null, null, null, [["music", 50.55], ["speech", 22.48], ["boing", 16.66]], [["music", 47.77], ["frog", 7.83], ["animal", 6.13]], null, null, null, null, null, null, [["stomach rumble", 13.96], ["hum", 9.79], ["moo", 6.08]], null, [["speech", 83.53], ["screaming", 2.06], ["crying, sobbing", 1.19]], null, null, [["speech", 60.44], ["boing", 5.41], ["sidetone", 3.9]], [["animal", 32.49], ["domestic animals, pets", 12.24], ["dog", 10.53]], [["speech", 22.34], ["livestock, farm animals, working animals", 13.89], ["sidetone", 11.02]], null, null, null, null, null], "duration": [2.05, 8.13, 1.13, 0.23, 0.41, 1.43, 0.46, 2.99, 3.42, 0.92, 0.16, 1.54, 3.34, 3.5, 2.36, 3.21, -0.15, 8.22, 0.35, 0.17, 3.85, 5.08, 5.03, -0.21, 0.97, 0.95, 0.69, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/iktC8imMBnw_filtered.json b/annotations_filtered/iktC8imMBnw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e69a55ad3d3be917da02e32253e1a4b111ebd19 --- /dev/null +++ b/annotations_filtered/iktC8imMBnw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.78], [3.0, 31.28], [33.0, 37.32], [39.0, 39.36], [39.0, 39.58], [41.0, 42.63], [51.0, 54.5], [59.0, 61.86], [63.0, 63.26], [68.0, 68.64], [70.0, 74.88], [79.0, 79.89], [84.0, 85.85], [89.0, 99.4], [100.0, 112.53], [115.0, 117.05], [120.0, 120.7]], "keep_status": [false, true, true, false, false, false, false, true, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 29.95, 36.15, 0.0, 0.0, 0.0, 31.39, 39.88, 0.0, 0.0, 43.79, 0.0, 0.0, 30.96, 28.89, 35.72, 0.0], "audiomae_on_audioset": [null, [["music", 19.54], ["speech", 18.89], ["throbbing", 8.41]], [["frog", 16.62], ["croak", 14.75], ["music", 14.13]], null, null, null, [["music", 37.93], ["speech", 30.35], ["grunt", 7.04]], [["music", 19.58], ["frog", 17.23], ["croak", 16.02]], null, null, [["music", 75.92], ["didgeridoo", 8.3], ["musical instrument", 4.47]], null, null, [["music", 45.5], ["hum", 14.52], ["throbbing", 6.3]], [["music", 36.17], ["throbbing", 9.42], ["hum", 7.78]], [["hum", 45.52], ["throbbing", 40.96], ["music", 4.82]], null], "duration": [0.78, 28.28, 4.32, 0.36, 0.58, 1.63, 3.5, 2.86, 0.26, 0.64, 4.88, 0.89, 1.85, 10.4, 12.53, 2.05, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/il4NFf0V_HQ_filtered.json b/annotations_filtered/il4NFf0V_HQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dec61a282cb20a2c627c9a704759a14df85fdfee --- /dev/null +++ b/annotations_filtered/il4NFf0V_HQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.06], [10.0, 13.0], [14.0, 15.04], [17.0, 19.31], [21.0, 21.61], [24.0, 25.88], [28.0, 27.97], [30.0, 36.66], [38.0, 40.36], [67.0, 67.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.05, 0.0, 45.52, 0.0, 0.0, 0.0, 33.53, 51.23, 0.0], "audiomae_on_audioset": [null, [["hammer", 53.41], ["clang", 9.1], ["speech", 7.8]], null, [["fly, housefly", 54.77], ["insect", 26.24], ["bee, wasp, etc.", 15.14]], null, null, null, [["fly, housefly", 58.74], ["insect", 12.82], ["bee, wasp, etc.", 6.09]], null, null], "duration": [0.06, 3.0, 1.04, 2.31, 0.61, 1.88, -0.03, 6.66, 2.36, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/ilCjx9gigWI_filtered.json b/annotations_filtered/ilCjx9gigWI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b7d2f28939730f239b471708aeef219a2d4c9f4 --- /dev/null +++ b/annotations_filtered/ilCjx9gigWI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 25.32], [28.0, 27.75], [29.0, 32.86], [35.0, 38.18], [39.0, 40.83], [42.0, 44.32], [46.0, 47.43], [51.0, 53.59], [59.0, 58.83], [62.0, 62.09], [63.0, 63.54], [66.0, 67.53], [69.0, 69.04], [70.0, 70.7], [72.0, 72.55], [74.0, 74.28], [76.0, 76.32], [84.0, 85.09], [94.0, 96.33]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [44.57, 0.0, 97.11, 99.92, 0.0, 54.3, 0.0, 66.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.1], "audiomae_on_audioset": [[["music", 38.48], ["theremin", 24.81], ["didgeridoo", 4.85]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.32, -0.25, 3.86, 3.18, 1.83, 2.32, 1.43, 2.59, -0.17, 0.09, 0.54, 1.53, 0.04, 0.7, 0.55, 0.28, 0.32, 1.09, 2.33]} \ No newline at end of file diff --git a/annotations_filtered/ilG8mzbHNNI_filtered.json b/annotations_filtered/ilG8mzbHNNI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85fa6b5edf3e8a0c81127d91f6b4685cd36cb774 --- /dev/null +++ b/annotations_filtered/ilG8mzbHNNI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.37], [25.0, 26.2], [28.0, 34.91], [37.0, 36.9], [43.0, 44.25], [46.0, 53.11], [55.0, 83.03], [84.0, 96.96], [98.0, 98.46], [100.0, 100.72], [102.0, 106.12], [107.0, 117.68], [120.0, 120.68], [122.0, 122.37], [124.0, 131.52], [133.0, 136.05], [138.0, 137.56], [140.0, 141.42], [143.0, 144.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 95.64, 0.0, 0.0, 65.55, 36.22, 81.35, 0.0, 0.0, 94.07, 76.2, 0.0, 0.0, 90.08, 99.52, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 43.94], ["mains hum", 16.63], ["music", 15.68]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.37, 1.2, 6.91, -0.1, 1.25, 7.11, 28.03, 12.96, 0.46, 0.72, 4.12, 10.68, 0.68, 0.37, 7.52, 3.05, -0.44, 1.42, 1.32]} \ No newline at end of file diff --git a/annotations_filtered/ilR3_PaGoJA_filtered.json b/annotations_filtered/ilR3_PaGoJA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f56ad7ae3c5aeecfb3adb5c077ad853144e31dd --- /dev/null +++ b/annotations_filtered/ilR3_PaGoJA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 46.23], [51.0, 84.15], [86.0, 110.69], [112.0, 113.17], [114.0, 130.2]], "keep_status": [true, false, false, false, false], "silence_prob": [30.71, 0.0, 52.86, 0.0, 45.4], "audiomae_on_audioset": [[["throbbing", 20.29], ["hum", 18.45], ["music", 12.43]], null, null, null, [["music", 66.02], ["synthesizer", 6.73], ["ambient music", 6.52]]], "duration": [25.23, 33.15, 24.69, 1.17, 16.2]} \ No newline at end of file diff --git a/annotations_filtered/ilRq_PR6oi4_filtered.json b/annotations_filtered/ilRq_PR6oi4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17ee91601ccaadf047fff8e27cb1ee3c3957d6c8 --- /dev/null +++ b/annotations_filtered/ilRq_PR6oi4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 71.52], [72.0, 75.34], [76.0, 78.63], [81.0, 83.51], [87.0, 89.45], [91.0, 128.78]], "keep_status": [true, true, true, true, true, false], "silence_prob": [30.42, 35.19, 37.67, 42.74, 42.08, 0.0], "audiomae_on_audioset": [[["music", 40.87], ["synthesizer", 16.83], ["musical instrument", 12.14]], [["music", 19.38], ["mains hum", 16.45], ["hum", 15.17]], [["music", 37.59], ["synthesizer", 16.13], ["hum", 12.05]], [["music", 41.9], ["hum", 8.39], ["mains hum", 7.02]], [["fly, housefly", 15.88], ["music", 14.19], ["insect", 11.89]], null], "duration": [26.52, 3.34, 2.63, 2.51, 2.45, 37.78]} \ No newline at end of file diff --git a/annotations_filtered/ilV5Qt01eyc_filtered.json b/annotations_filtered/ilV5Qt01eyc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e227ee953ceda6cbc3b0892c926fa96c0ee350f5 --- /dev/null +++ b/annotations_filtered/ilV5Qt01eyc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 55.88]], "keep_status": [false], "silence_prob": [29.35], "audiomae_on_audioset": [[["vehicle", 33.93], ["car", 22.3], ["race car, auto racing", 21.08]]], "duration": [8.88]} \ No newline at end of file diff --git a/annotations_filtered/ilXtCX0-CkE_filtered.json b/annotations_filtered/ilXtCX0-CkE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58235276692975de656e0a89d03b5c8ffda9dfe9 --- /dev/null +++ b/annotations_filtered/ilXtCX0-CkE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.34], [11.0, 11.65], [13.0, 13.14], [14.0, 14.3], [16.0, 16.48], [17.0, 18.12], [20.0, 24.53], [26.0, 26.81], [32.0, 41.07], [44.0, 45.28], [46.0, 46.62], [49.0, 51.6], [52.0, 58.14], [60.0, 63.68], [64.0, 70.02], [71.0, 72.37], [77.0, 77.65], [78.0, 79.96], [81.0, 81.21], [82.0, 84.84], [90.0, 90.34], [91.0, 91.61], [92.0, 109.83], [111.0, 111.52], [112.0, 114.54], [125.0, 128.85], [129.0, 131.14], [132.0, 134.01], [135.0, 138.54], [139.0, 139.38]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [47.16, 0.0, 0.0, 0.0, 0.0, 0.0, 98.44, 0.0, 99.99, 0.0, 0.0, 92.97, 82.97, 100.0, 98.44, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 84.98, 0.0, 95.78, 67.89, 63.64, 49.09, 69.2, 0.0], "audiomae_on_audioset": [[["thunk", 47.07], ["hum", 6.89], ["breaking", 6.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 42.46], ["music", 19.83], ["whale vocalization", 11.18]], null, null], "duration": [7.34, 0.65, 0.14, 0.3, 0.48, 1.12, 4.53, 0.81, 9.07, 1.28, 0.62, 2.6, 6.14, 3.68, 6.02, 1.37, 0.65, 1.96, 0.21, 2.84, 0.34, 0.61, 17.83, 0.52, 2.54, 3.85, 2.14, 2.01, 3.54, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/ilZqZaSUC0Y_filtered.json b/annotations_filtered/ilZqZaSUC0Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d37fc3bcdb5f0be401743c40c7fe3d48a0c02819 --- /dev/null +++ b/annotations_filtered/ilZqZaSUC0Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 28.17], [29.0, 32.39], [33.0, 45.06], [47.0, 57.48], [62.0, 65.69], [70.0, 78.21], [79.0, 81.97], [84.0, 86.9], [88.0, 91.69], [95.0, 96.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 100.0, 99.88, 100.0, 99.95, 93.13, 94.81, 99.76, 99.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [5.17, 3.39, 12.06, 10.48, 3.69, 8.21, 2.97, 2.9, 3.69, 1.92]} \ No newline at end of file diff --git a/annotations_filtered/ilrpqagxBf4_filtered.json b/annotations_filtered/ilrpqagxBf4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60b6dda92e3fe1c6f73c902f2c4877bf926fd471 --- /dev/null +++ b/annotations_filtered/ilrpqagxBf4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 16.95], [19.0, 28.07], [29.0, 30.4], [32.0, 50.13], [51.0, 51.75], [54.0, 61.21]], "keep_status": [false, false, false, false, false, true], "silence_prob": [33.58, 29.97, 0.0, 31.97, 0.0, 31.25], "audiomae_on_audioset": [[["music", 88.35], ["musical instrument", 2.39], ["didgeridoo", 1.85]], [["speech", 43.48], ["music", 43.32], ["buzz", 2.1]], null, [["music", 59.12], ["speech", 9.51], ["throbbing", 5.51]], null, [["music", 49.59], ["throbbing", 6.9], ["hum", 6.05]]], "duration": [12.95, 9.07, 1.4, 18.13, 0.75, 7.21]} \ No newline at end of file diff --git a/annotations_filtered/iltOTKedsM0_filtered.json b/annotations_filtered/iltOTKedsM0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bec839c05461b88229bc7229526fe782919a7d4d --- /dev/null +++ b/annotations_filtered/iltOTKedsM0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.73], [3.0, 4.18], [6.0, 6.99], [8.0, 10.42], [17.0, 17.58], [21.0, 21.2], [23.0, 26.92], [28.0, 30.91], [32.0, 33.05], [33.0, 34.16], [36.0, 38.33], [40.0, 64.3], [65.0, 82.75], [89.0, 114.25], [116.0, 122.59], [123.0, 124.02], [125.0, 126.81]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, true, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 46.36, 0.0, 0.0, 98.86, 95.64, 0.0, 0.0, 99.8, 32.04, 31.99, 31.62, 41.56, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["sidetone", 26.17], ["speech", 25.65], ["throbbing", 12.4]], null, null, null, null, null, null, null, [["gunshot, gunfire", 22.63], ["speech", 22.58], ["whack, thwack", 7.38]], [["music", 31.51], ["speech", 13.45], ["animal", 13.12]], [["music", 36.17], ["groan", 20.75], ["speech", 19.46]], [["music", 49.25], ["synthesizer", 10.97], ["musical instrument", 7.47]], null, null], "duration": [0.73, 1.18, 0.99, 2.42, 0.58, 0.2, 3.92, 2.91, 1.05, 1.16, 2.33, 24.3, 17.75, 25.25, 6.59, 1.02, 1.81]} \ No newline at end of file diff --git a/annotations_filtered/im1ZK1WNBZs_filtered.json b/annotations_filtered/im1ZK1WNBZs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..93a6cb599bdc131cf2bfe0bf9d618a42d8e249f7 --- /dev/null +++ b/annotations_filtered/im1ZK1WNBZs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 17.14], [18.0, 77.94], [80.0, 89.97], [90.0, 90.05], [90.0, 96.09], [100.0, 108.33], [111.0, 126.69]], "keep_status": [true, false, false, false, true, false, false], "silence_prob": [29.82, 0.0, 38.37, 0.0, 31.4, 33.05, 30.8], "audiomae_on_audioset": [[["music", 15.78], ["explosion", 15.35], ["burst, pop", 8.29]], null, [["throbbing", 56.3], ["hum", 17.84], ["music", 12.47]], null, [["hum", 33.96], ["throbbing", 18.41], ["mains hum", 9.02]], [["speech", 41.14], ["music", 29.01], ["throbbing", 6.74]], [["music", 40.62], ["speech", 32.58], ["hum", 3.27]]], "duration": [6.14, 59.94, 9.97, 0.05, 6.09, 8.33, 15.69]} \ No newline at end of file diff --git a/annotations_filtered/imcPspMbcL0_filtered.json b/annotations_filtered/imcPspMbcL0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a789f8ef1ebe3dbb16dee30a40ae5b21e9570ad2 --- /dev/null +++ b/annotations_filtered/imcPspMbcL0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.65], [15.0, 15.35], [22.0, 22.64], [26.0, 26.47], [31.0, 36.05], [42.0, 43.09], [45.0, 46.11], [52.0, 52.93], [61.0, 65.15], [71.0, 83.34], [91.0, 96.06], [102.0, 102.0], [102.0, 102.66], [107.0, 123.94], [127.0, 138.6], [142.0, 146.04]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.23, 0.0, 0.0, 0.0, 61.08, 31.29, 35.76, 0.0, 0.0, 32.23, 32.45, 36.09], "audiomae_on_audioset": [null, null, null, null, [["mains hum", 43.45], ["hum", 36.48], ["throbbing", 3.25]], null, null, null, null, [["music", 39.88], ["throbbing", 13.81], ["hum", 13.72]], [["music", 32.0], ["throbbing", 25.44], ["hum", 12.05]], null, null, [["buzz", 45.42], ["music", 15.69], ["speech", 5.52]], [["breaking", 64.25], ["music", 7.16], ["buzz", 5.05]], [["whale vocalization", 35.63], ["crowd", 11.6], ["music", 8.5]]], "duration": [0.65, 0.35, 0.64, 0.47, 5.05, 1.09, 1.11, 0.93, 4.15, 12.34, 5.06, 0.0, 0.66, 16.94, 11.6, 4.04]} \ No newline at end of file diff --git a/annotations_filtered/imyD8loUM-g_filtered.json b/annotations_filtered/imyD8loUM-g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5766a2da132f77a5de56adab65c343cbc7dc0fe7 --- /dev/null +++ b/annotations_filtered/imyD8loUM-g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.25], [3.0, 3.65], [5.0, 7.97], [9.0, 9.68], [15.0, 14.81], [17.0, 30.91], [33.0, 41.4], [42.0, 43.16], [47.0, 49.65], [52.0, 52.64], [65.0, 75.05], [77.0, 83.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 64.07, 0.0, 0.0, 67.38, 51.5, 0.0, 44.55, 0.0, 40.97, 37.93], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["hum", 34.38], ["mains hum", 23.32], ["music", 17.98]], null, [["hum", 56.93], ["mains hum", 15.54], ["music", 6.68]], [["wind instrument, woodwind instrument", 31.74], ["music", 22.81], ["hum", 5.09]]], "duration": [0.25, 0.65, 2.97, 0.68, -0.19, 13.91, 8.4, 1.16, 2.65, 0.64, 10.05, 6.17]} \ No newline at end of file diff --git a/annotations_filtered/in-1BIg_Mec_filtered.json b/annotations_filtered/in-1BIg_Mec_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38b1b4aedcd248142c811dcef6a977cddcf59193 --- /dev/null +++ b/annotations_filtered/in-1BIg_Mec_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 22.0], [23.0, 23.82], [24.0, 29.12], [31.0, 40.24], [42.0, 42.04], [43.0, 45.91], [47.0, 62.19], [64.0, 64.89], [66.0, 66.7], [70.0, 69.69], [70.0, 71.29], [72.0, 72.91], [79.0, 82.31], [85.0, 85.04], [86.0, 88.42], [90.0, 98.86], [99.0, 117.0], [118.0, 122.98], [127.0, 133.98], [134.0, 134.01], [134.0, 141.34], [143.0, 175.31], [176.0, 177.5]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [60.89, 0.0, 50.21, 55.46, 0.0, 44.63, 59.42, 0.0, 0.0, 0.0, 0.0, 0.0, 77.2, 0.0, 42.3, 50.97, 40.43, 52.27, 30.7, 0.0, 34.03, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 30.67], ["radio", 6.28], ["honk", 4.26]], null, null, null, null, null, null, null, null, [["speech", 58.82], ["sidetone", 30.09], ["whale vocalization", 1.7]], null, [["hum", 15.54], ["mains hum", 14.74], ["electric shaver, electric razor", 13.28]], null, [["speech", 50.37], ["music", 26.26], ["outside, urban or manmade", 1.58]], null, [["music", 53.72], ["speech", 13.35], ["theremin", 12.33]], null, null], "duration": [4.0, 0.82, 5.12, 9.24, 0.04, 2.91, 15.19, 0.89, 0.7, -0.31, 1.29, 0.91, 3.31, 0.04, 2.42, 8.86, 18.0, 4.98, 6.98, 0.01, 7.34, 32.31, 1.5]} \ No newline at end of file diff --git a/annotations_filtered/in5f7RMtnoU_filtered.json b/annotations_filtered/in5f7RMtnoU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b436b08008938ef686039b521853eb49dfa14446 --- /dev/null +++ b/annotations_filtered/in5f7RMtnoU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.81], [17.0, 30.1], [32.0, 32.59], [33.0, 34.03], [35.0, 40.95], [42.0, 46.79], [48.0, 50.94], [54.0, 54.94], [56.0, 56.32], [57.0, 57.33], [65.0, 70.93], [77.0, 79.71], [81.0, 81.06], [81.0, 81.46], [82.0, 84.89], [85.0, 85.14], [86.0, 87.74], [89.0, 90.34], [91.0, 91.07], [96.0, 96.28], [97.0, 97.02], [97.0, 97.36], [101.0, 101.6], [103.0, 104.52], [105.0, 106.57], [109.0, 110.2], [111.0, 112.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [71.72, 53.65, 0.0, 0.0, 96.42, 81.35, 62.07, 0.0, 0.0, 0.0, 65.55, 90.08, 0.0, 0.0, 57.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.81, 13.1, 0.59, 1.03, 5.95, 4.79, 2.94, 0.94, 0.32, 0.33, 5.93, 2.71, 0.06, 0.46, 2.89, 0.14, 1.74, 1.34, 0.07, 0.28, 0.02, 0.36, 0.6, 1.52, 1.57, 1.2, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/inAlpz8a0aU_filtered.json b/annotations_filtered/inAlpz8a0aU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd06aacceeb2a0395b383ac81aaa0f1d4dbcef4f --- /dev/null +++ b/annotations_filtered/inAlpz8a0aU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.78], [3.0, 3.64], [5.0, 4.94], [19.0, 24.95], [27.0, 29.62], [31.0, 31.97], [34.0, 34.72], [41.0, 41.98], [44.0, 49.89], [53.0, 55.21], [57.0, 57.03], [57.0, 59.41], [60.0, 60.64], [64.0, 67.49], [69.0, 83.0], [84.0, 95.1], [96.0, 97.56], [103.0, 102.95], [106.0, 106.66], [108.0, 108.51], [110.0, 110.47], [114.0, 114.52], [119.0, 119.2], [120.0, 121.95], [128.0, 128.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.21, 99.97, 0.0, 0.0, 0.0, 81.53, 70.02, 0.0, 34.86, 0.0, 85.72, 42.39, 57.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 21.18], ["speech", 8.04], ["ding", 7.59]], null, null, [["music", 44.87], ["didgeridoo", 25.89], ["speech", 3.1]], null, null, null, null, null, null, null, null, null, null], "duration": [1.78, 0.64, -0.06, 5.95, 2.62, 0.97, 0.72, 0.98, 5.89, 2.21, 0.03, 2.41, 0.64, 3.49, 14.0, 11.1, 1.56, -0.05, 0.66, 0.51, 0.47, 0.52, 0.2, 1.95, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/inDZp80Sq6U_filtered.json b/annotations_filtered/inDZp80Sq6U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a0125cca1a9b30c9c2fcd94b25c49e96df63023 --- /dev/null +++ b/annotations_filtered/inDZp80Sq6U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.1], [4.0, 5.48], [8.0, 8.75], [11.0, 11.48], [17.0, 17.29], [19.0, 19.85], [24.0, 24.68], [26.0, 27.5], [29.0, 30.11], [37.0, 38.4], [40.0, 40.78], [47.0, 46.94], [54.0, 55.71], [57.0, 57.33], [61.0, 61.67], [65.0, 64.86], [68.0, 68.07], [69.0, 69.53], [71.0, 74.73], [76.0, 76.05], [76.0, 76.59], [77.0, 78.9], [81.0, 81.9], [84.0, 87.45], [91.0, 95.69], [97.0, 97.21], [98.0, 98.0], [100.0, 100.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 92.15, 85.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.1, 1.48, 0.75, 0.48, 0.29, 0.85, 0.68, 1.5, 1.11, 1.4, 0.78, -0.06, 1.71, 0.33, 0.67, -0.14, 0.07, 0.53, 3.73, 0.05, 0.59, 1.9, 0.9, 3.45, 4.69, 0.21, 0.0, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/inrI2qvps58_filtered.json b/annotations_filtered/inrI2qvps58_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8ea0fb2d5123e119182fb94fd3b4f87450af705 --- /dev/null +++ b/annotations_filtered/inrI2qvps58_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.45], [7.0, 11.94], [15.0, 16.34], [17.0, 17.54], [18.0, 19.13], [20.0, 23.58], [34.0, 36.9], [38.0, 38.48], [41.0, 41.34], [43.0, 48.46], [50.0, 50.75], [53.0, 53.15], [56.0, 56.44], [60.0, 60.67], [65.0, 65.67], [66.0, 68.84], [70.0, 70.55], [71.0, 76.27], [86.0, 95.23], [96.0, 97.98], [99.0, 101.38]], "keep_status": [true, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [39.34, 42.88, 0.0, 0.0, 0.0, 41.03, 37.77, 0.0, 0.0, 98.99, 0.0, 0.0, 0.0, 0.0, 0.0, 62.27, 0.0, 43.18, 35.16, 0.0, 56.33], "audiomae_on_audioset": [[["music", 27.25], ["speech", 27.09], ["synthesizer", 6.73]], [["music", 36.18], ["speech", 13.93], ["musical instrument", 4.25]], null, null, null, [["speech", 54.86], ["quack", 16.86], ["duck", 11.39]], [["sidetone", 30.01], ["speech", 23.72], ["hum", 6.75]], null, null, null, null, null, null, null, null, null, null, [["hum", 37.18], ["speech", 25.96], ["mains hum", 10.86]], [["speech", 34.38], ["music", 14.27], ["buzz", 7.21]], null, null], "duration": [2.45, 4.94, 1.34, 0.54, 1.13, 3.58, 2.9, 0.48, 0.34, 5.46, 0.75, 0.15, 0.44, 0.67, 0.67, 2.84, 0.55, 5.27, 9.23, 1.98, 2.38]} \ No newline at end of file diff --git a/annotations_filtered/io-hA6pxffU_filtered.json b/annotations_filtered/io-hA6pxffU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35a4b238719209beaf6720af3808d4a5c53581d7 --- /dev/null +++ b/annotations_filtered/io-hA6pxffU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.47], [3.0, 2.54], [11.0, 12.02], [14.0, 14.62], [17.0, 18.12], [27.0, 27.4], [28.0, 28.98], [30.0, 30.92], [33.0, 33.42], [37.0, 37.4], [38.0, 38.82], [41.0, 43.14], [46.0, 48.05], [49.0, 49.27], [56.0, 55.76], [56.0, 57.35], [59.0, 59.46], [61.0, 61.38], [65.0, 66.65], [84.0, 84.1], [90.0, 91.64], [93.0, 93.46], [101.0, 102.54], [107.0, 109.78], [111.0, 110.86], [114.0, 113.9], [121.0, 120.9], [122.0, 121.81], [122.0, 123.57], [134.0, 134.01], [134.0, 139.28], [141.0, 141.99], [147.0, 146.97], [148.0, 148.2], [151.0, 151.17], [152.0, 152.46], [154.0, 155.12], [159.0, 159.36], [164.0, 168.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.85, 58.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.87], "audiomae_on_audioset": [[["music", 49.45], ["boing", 20.46], ["speech", 10.39]], null, null, null, null, null, null, null, null, null, null, [["music", 27.75], ["speech", 17.69], ["synthesizer", 5.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 39.06], ["insect", 22.68], ["mosquito", 12.52]], null, null, null, null, null, null, null, [["cattle, bovinae", 28.39], ["moo", 25.62], ["speech", 19.27]]], "duration": [2.47, -0.46, 1.02, 0.62, 1.12, 0.4, 0.98, 0.92, 0.42, 0.4, 0.82, 2.14, 2.05, 0.27, -0.24, 1.35, 0.46, 0.38, 1.65, 0.1, 1.64, 0.46, 1.54, 2.78, -0.14, -0.1, -0.1, -0.19, 1.57, 0.01, 5.28, 0.99, -0.03, 0.2, 0.17, 0.46, 1.12, 0.36, 4.74]} \ No newline at end of file diff --git a/annotations_filtered/ioE_djgs810_filtered.json b/annotations_filtered/ioE_djgs810_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f68ddd956f01a9b25db6b3beb2877cf2003d105b --- /dev/null +++ b/annotations_filtered/ioE_djgs810_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 26.47], [28.0, 156.12]], "keep_status": [false, false], "silence_prob": [30.22, 0.0], "audiomae_on_audioset": [[["music", 62.44], ["throbbing", 7.92], ["whack, thwack", 4.59]], null], "duration": [16.47, 128.12]} \ No newline at end of file diff --git a/annotations_filtered/ioKNba1RRys_filtered.json b/annotations_filtered/ioKNba1RRys_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5549cce47d20e381400f554c12b97bad601b219a --- /dev/null +++ b/annotations_filtered/ioKNba1RRys_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 26.25], [29.0, 29.69], [31.0, 31.4], [32.0, 49.0], [51.0, 50.95], [57.0, 59.27], [63.0, 64.5], [66.0, 68.81], [69.0, 70.7], [74.0, 163.86]], "keep_status": [false, false, false, true, false, false, false, false, false, false], "silence_prob": [28.69, 0.0, 0.0, 28.7, 0.0, 54.56, 0.0, 62.89, 0.0, 0.0], "audiomae_on_audioset": [[["music", 57.34], ["explosion", 8.27], ["boom", 4.47]], null, null, [["hum", 25.82], ["mains hum", 21.57], ["music", 12.49]], null, null, null, null, null, null], "duration": [6.25, 0.69, 0.4, 17.0, -0.05, 2.27, 1.5, 2.81, 1.7, 89.86]} \ No newline at end of file diff --git a/annotations_filtered/ioQQ3gbY0vY_filtered.json b/annotations_filtered/ioQQ3gbY0vY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/ioQQ3gbY0vY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/ioTMlrCoU2E_filtered.json b/annotations_filtered/ioTMlrCoU2E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af6da9c9d764c9b85c085656282105d40ea08cc8 --- /dev/null +++ b/annotations_filtered/ioTMlrCoU2E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.11], [9.0, 9.54], [14.0, 15.21], [18.0, 19.53], [22.0, 23.09], [24.0, 26.54], [29.0, 30.92], [32.0, 33.83], [35.0, 38.47], [39.0, 40.53], [41.0, 41.71], [42.0, 42.94], [44.0, 63.8], [64.0, 71.52], [74.0, 76.2], [78.0, 80.47], [83.0, 83.25], [85.0, 87.59], [88.0, 87.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 83.88, 0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 29.94, 29.62, 48.23, 28.83, 0.0, 37.03, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["fireworks", 20.89], ["music", 20.42], ["speech", 16.62]], [["speech", 46.41], ["explosion", 13.71], ["burst, pop", 9.24]], [["tick-tock", 7.17], ["hum", 6.76], ["speech", 5.48]], [["speech", 81.53], ["speech synthesizer", 6.83], ["male speech, man speaking", 2.49]], null, [["hum", 14.09], ["throbbing", 10.64], ["noise", 8.64]], null], "duration": [1.11, 0.54, 1.21, 1.53, 1.09, 2.54, 1.92, 1.83, 3.47, 1.53, 0.71, 0.94, 19.8, 7.52, 2.2, 2.47, 0.25, 2.59, -0.16]} \ No newline at end of file diff --git a/annotations_filtered/ioUedV29CQE_filtered.json b/annotations_filtered/ioUedV29CQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2369a0cddb0e854a937d3fa46d9e62c5ffe8aa7b --- /dev/null +++ b/annotations_filtered/ioUedV29CQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.47], [8.0, 14.52], [16.0, 79.54], [80.0, 88.37], [89.0, 90.36], [91.0, 102.39]], "keep_status": [false, false, false, true, false, true], "silence_prob": [0.0, 56.1, 0.0, 34.2, 0.0, 37.63], "audiomae_on_audioset": [null, null, null, [["hum", 26.31], ["music", 15.28], ["throbbing", 14.86]], null, [["music", 50.86], ["sonar", 9.64], ["hum", 6.95]]], "duration": [1.47, 6.52, 63.54, 8.37, 1.36, 11.39]} \ No newline at end of file diff --git a/annotations_filtered/ioXW5Fg_q_g_filtered.json b/annotations_filtered/ioXW5Fg_q_g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c1381b857b93291bc55ff861b74ea420a74f947 --- /dev/null +++ b/annotations_filtered/ioXW5Fg_q_g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.82], [22.0, 22.13], [28.0, 29.0], [33.0, 34.67], [40.0, 48.84], [51.0, 52.44], [54.0, 53.92], [58.0, 62.21], [71.0, 75.49], [83.0, 90.71], [91.0, 101.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 33.74, 0.0, 0.0, 32.08, 37.21, 33.82, 32.11], "audiomae_on_audioset": [null, null, null, null, [["music", 79.6], ["yodeling", 8.92], ["singing", 2.0]], null, null, [["music", 80.07], ["theremin", 10.0], ["singing", 2.17]], [["music", 86.09], ["opera", 2.2], ["theremin", 2.13]], [["music", 90.9], ["singing", 2.26], ["humming", 1.03]], [["music", 85.41], ["opera", 5.45], ["classical music", 2.58]]], "duration": [0.82, 0.13, 1.0, 1.67, 8.84, 1.44, -0.08, 4.21, 4.49, 7.71, 10.7]} \ No newline at end of file diff --git a/annotations_filtered/iojZt-Ht4Nc_filtered.json b/annotations_filtered/iojZt-Ht4Nc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6bdfc6624d144b87374cac2ab8b2788c2b1ef1d3 --- /dev/null +++ b/annotations_filtered/iojZt-Ht4Nc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 10.34], [15.0, 16.82], [18.0, 21.63], [24.0, 24.61], [26.0, 26.0], [29.0, 30.3], [31.0, 31.33], [33.0, 34.42], [35.0, 36.26], [39.0, 42.3], [43.0, 46.41], [50.0, 52.27], [53.0, 55.16], [61.0, 62.6], [65.0, 71.64], [76.0, 93.34], [95.0, 97.06], [100.0, 103.05], [105.0, 114.45], [115.0, 116.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [67.76, 0.0, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52, 99.97, 99.78, 99.56, 0.0, 94.37, 94.81, 99.91, 99.1, 82.61, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.34, 1.82, 3.63, 0.61, 0.0, 1.3, 0.33, 1.42, 1.26, 3.3, 3.41, 2.27, 2.16, 1.6, 6.64, 17.34, 2.06, 3.05, 9.45, 1.72]} \ No newline at end of file diff --git a/annotations_filtered/iotRit7KMDc_filtered.json b/annotations_filtered/iotRit7KMDc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c003d9e6b09ef5e9914529c65bbd0e91822e2564 --- /dev/null +++ b/annotations_filtered/iotRit7KMDc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.24], [9.0, 8.58], [12.0, 11.82], [13.0, 13.46], [15.0, 15.23], [19.0, 19.79], [26.0, 27.77], [30.0, 35.82], [38.0, 45.2], [48.0, 48.96], [50.0, 50.8], [58.0, 58.4], [59.0, 63.12], [66.0, 67.95]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.17, 31.09, 0.0, 0.0, 0.0, 55.96, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["tuning fork", 15.28], ["thunk", 12.77], ["doorbell", 8.93]], [["music", 65.36], ["speech", 9.92], ["bell", 2.6]], null, null, null, null, null], "duration": [1.24, -0.42, -0.18, 0.46, 0.23, 0.79, 1.77, 5.82, 7.2, 0.96, 0.8, 0.4, 4.12, 1.95]} \ No newline at end of file diff --git a/annotations_filtered/ioznxKkY_IE_filtered.json b/annotations_filtered/ioznxKkY_IE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6232e46271c1e1fd87353d9126c54798e814b2b7 --- /dev/null +++ b/annotations_filtered/ioznxKkY_IE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.57], [5.0, 7.23], [8.0, 9.31], [10.0, 11.37], [12.0, 13.66], [15.0, 16.6], [17.0, 19.2], [21.0, 22.98], [27.0, 27.77], [28.0, 30.89], [31.0, 36.96], [38.0, 41.3], [42.0, 43.09], [44.0, 46.77], [47.0, 47.85], [51.0, 52.52], [54.0, 54.72], [58.0, 61.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 83.34, 0.0, 0.0, 64.86, 92.97, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.57, 2.23, 1.31, 1.37, 1.66, 1.6, 2.2, 1.98, 0.77, 2.89, 5.96, 3.3, 1.09, 2.77, 0.85, 1.52, 0.72, 3.08]} \ No newline at end of file diff --git a/annotations_filtered/ip1igmoPSD8_filtered.json b/annotations_filtered/ip1igmoPSD8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a3ad34abbed78b72f3f56b7bd469efedbe922de --- /dev/null +++ b/annotations_filtered/ip1igmoPSD8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.6], [4.0, 6.35], [8.0, 10.13], [11.0, 11.79], [13.0, 14.25], [16.0, 16.83], [18.0, 19.67], [22.0, 23.73], [31.0, 32.43], [34.0, 35.36], [41.0, 41.1], [42.0, 41.72], [44.0, 48.69], [60.0, 60.94], [67.0, 67.73], [71.0, 75.0], [77.0, 79.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 57.48, 64.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.07, 0.0, 0.0, 34.01, 29.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["throbbing", 32.77], ["music", 27.12], ["hum", 23.59]], null, null, [["throbbing", 28.4], ["music", 25.63], ["hum", 16.46]], [["music", 53.62], ["didgeridoo", 6.96], ["theremin", 3.55]]], "duration": [0.6, 2.35, 2.13, 0.79, 1.25, 0.83, 1.67, 1.73, 1.43, 1.36, 0.1, -0.28, 4.69, 0.94, 0.73, 4.0, 2.91]} \ No newline at end of file diff --git a/annotations_filtered/ipb0Bfg_FTs_filtered.json b/annotations_filtered/ipb0Bfg_FTs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1e9e042d4666fa468cad848c080706f5ca3153e --- /dev/null +++ b/annotations_filtered/ipb0Bfg_FTs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.08], [5.0, 10.23], [12.0, 12.9], [14.0, 16.01], [18.0, 20.51], [23.0, 40.22], [43.0, 43.8], [44.0, 56.34], [57.0, 58.04], [60.0, 71.96], [75.0, 75.36], [76.0, 76.89], [79.0, 79.91], [82.0, 84.03], [86.0, 125.2]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [66.63, 61.27, 0.0, 36.99, 68.67, 69.74, 0.0, 34.74, 0.0, 45.85, 0.0, 0.0, 0.0, 54.97, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 15.24], ["noise", 8.07], ["whale vocalization", 6.42]], null, null, null, [["speech", 38.82], ["music", 21.62], ["thump, thud", 5.16]], null, [["music", 61.56], ["speech", 12.63], ["didgeridoo", 12.43]], null, null, null, null, null], "duration": [2.08, 5.23, 0.9, 2.01, 2.51, 17.22, 0.8, 12.34, 1.04, 11.96, 0.36, 0.89, 0.91, 2.03, 39.2]} \ No newline at end of file diff --git a/annotations_filtered/ipc4KfTrRZs_filtered.json b/annotations_filtered/ipc4KfTrRZs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6af5b2c16b456cc7ff5a402b7b43444581d981d4 --- /dev/null +++ b/annotations_filtered/ipc4KfTrRZs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.46], [1.0, 2.4], [17.0, 17.76], [26.0, 26.52], [27.0, 27.99], [29.0, 29.64], [31.0, 32.32], [36.0, 38.18], [39.0, 60.66], [63.0, 66.33], [69.0, 76.33], [80.0, 80.27], [88.0, 89.68], [91.0, 91.94], [101.0, 111.89], [113.0, 120.93], [122.0, 122.99], [124.0, 126.59], [128.0, 128.16], [129.0, 129.84], [134.0, 135.14], [137.0, 143.56], [146.0, 146.08], [147.0, 148.42], [150.0, 152.76], [154.0, 154.85], [155.0, 165.81], [166.0, 166.45]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.61, 64.07, 44.29, 29.76, 0.0, 0.0, 0.0, 30.45, 59.68, 0.0, 65.44, 0.0, 0.0, 0.0, 31.87, 0.0, 0.0, 33.59, 0.0, 29.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 46.43], ["throbbing", 11.35], ["hum", 5.76]], [["music", 66.47], ["speech", 5.99], ["buzz", 2.81]], null, null, null, [["hum", 20.62], ["speech", 16.77], ["music", 10.03]], null, null, null, null, null, null, [["mains hum", 29.26], ["hum", 20.5], ["fly, housefly", 16.77]], null, null, [["sidetone", 78.31], ["noise", 6.32], ["speech", 2.28]], null, [["hum", 39.73], ["throbbing", 24.95], ["mains hum", 8.25]], null], "duration": [0.46, 1.4, 0.76, 0.52, 0.99, 0.64, 1.32, 2.18, 21.66, 3.33, 7.33, 0.27, 1.68, 0.94, 10.89, 7.93, 0.99, 2.59, 0.16, 0.84, 1.14, 6.56, 0.08, 1.42, 2.76, 0.85, 10.81, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/ipkF3xkP63M_filtered.json b/annotations_filtered/ipkF3xkP63M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b118208b950f60a5fe5cc38223d1e577a09a59e --- /dev/null +++ b/annotations_filtered/ipkF3xkP63M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.1], [5.0, 5.78], [7.0, 7.2], [9.0, 10.22], [12.0, 12.9], [15.0, 15.03], [15.0, 17.9], [33.0, 33.88], [44.0, 45.79], [48.0, 52.47], [54.0, 54.8], [56.0, 57.16], [58.0, 59.53], [61.0, 61.79], [65.0, 66.02], [67.0, 68.23], [70.0, 70.34], [71.0, 74.29], [76.0, 76.99], [82.0, 83.47], [85.0, 90.8], [92.0, 94.86], [99.0, 98.98], [103.0, 102.98], [113.0, 114.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.81, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.84, 0.0, 0.0, 67.13, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.1, 0.78, 0.2, 1.22, 0.9, 0.03, 2.9, 0.88, 1.79, 4.47, 0.8, 1.16, 1.53, 0.79, 1.02, 1.23, 0.34, 3.29, 0.99, 1.47, 5.8, 2.86, -0.02, -0.02, 1.24]} \ No newline at end of file diff --git a/annotations_filtered/iqLDCIZ1DIs_filtered.json b/annotations_filtered/iqLDCIZ1DIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..717d3ad70fadd7499d23b3da460a0621d67d7c32 --- /dev/null +++ b/annotations_filtered/iqLDCIZ1DIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 6.72], [11.0, 12.45], [32.0, 35.19], [37.0, 37.57], [41.0, 41.4], [44.0, 44.79], [46.0, 78.97], [81.0, 92.11], [95.0, 103.37], [106.0, 114.81], [118.0, 126.0], [127.0, 129.07]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [34.22, 0.0, 38.33, 0.0, 0.0, 0.0, 0.0, 29.52, 33.02, 30.5, 29.71, 38.84], "audiomae_on_audioset": [[["throbbing", 47.84], ["hum", 31.36], ["heart sounds, heartbeat", 6.74]], null, [["hum", 40.25], ["whale vocalization", 22.73], ["throbbing", 16.18]], null, null, null, null, [["music", 58.09], ["throbbing", 10.48], ["speech", 6.54]], [["speech", 31.83], ["noise", 30.0], ["music", 11.23]], [["music", 23.14], ["didgeridoo", 20.47], ["noise", 13.66]], [["music", 48.23], ["sidetone", 12.05], ["speech", 7.45]], [["speech", 21.88], ["hum", 10.39], ["throbbing", 6.85]]], "duration": [6.72, 1.45, 3.19, 0.57, 0.4, 0.79, 32.97, 11.11, 8.37, 8.81, 8.0, 2.07]} \ No newline at end of file diff --git a/annotations_filtered/iqZmwwUvgVU_filtered.json b/annotations_filtered/iqZmwwUvgVU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae92d0c63c40719998526ce597cdb51498713472 --- /dev/null +++ b/annotations_filtered/iqZmwwUvgVU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.02], [16.0, 17.2], [60.0, 60.57], [68.0, 74.09], [75.0, 75.46], [77.0, 82.44], [83.0, 91.39], [93.0, 101.63], [107.0, 109.65], [115.0, 120.01], [126.0, 127.13], [130.0, 131.08], [140.0, 142.48]], "keep_status": [true, false, false, false, false, true, true, true, true, false, false, false, true], "silence_prob": [28.76, 0.0, 0.0, 28.62, 0.0, 28.66, 29.29, 29.2, 29.08, 29.42, 0.0, 0.0, 28.78], "audiomae_on_audioset": [[["whale vocalization", 25.54], ["speech", 17.68], ["music", 7.46]], null, null, [["fly, housefly", 35.32], ["mosquito", 30.96], ["insect", 13.8]], null, [["vehicle", 16.27], ["speech", 15.77], ["outside, rural or natural", 4.03]], [["speech", 50.53], ["music", 6.07], ["groan", 5.82]], [["speech", 38.28], ["music", 22.12], ["explosion", 4.92]], [["groan", 54.19], ["speech", 4.42], ["music", 4.33]], [["music", 57.7], ["theremin", 12.51], ["mosquito", 5.57]], null, null, [["animal", 19.99], ["roaring cats (lions, tigers)", 11.84], ["wild animals", 10.4]]], "duration": [2.02, 1.2, 0.57, 6.09, 0.46, 5.44, 8.39, 8.63, 2.65, 5.01, 1.13, 1.08, 2.48]} \ No newline at end of file diff --git a/annotations_filtered/iqyFc90L3zw_filtered.json b/annotations_filtered/iqyFc90L3zw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58e6b95351a41369dfa881ee96f752f173de58ea --- /dev/null +++ b/annotations_filtered/iqyFc90L3zw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.87], [10.0, 13.27], [15.0, 17.09], [20.0, 20.39], [22.0, 23.46], [27.0, 30.0], [32.0, 32.16], [34.0, 35.67], [42.0, 43.29], [49.0, 49.27], [61.0, 62.18], [64.0, 66.18], [73.0, 74.07], [75.0, 76.96], [82.0, 81.87], [83.0, 84.99], [85.0, 86.95], [89.0, 91.99], [97.0, 100.57], [103.0, 103.99], [105.0, 117.05], [117.0, 118.79], [123.0, 122.93], [125.0, 125.69], [129.0, 131.72], [147.0, 150.55], [152.0, 153.45], [155.0, 156.84]], "keep_status": [false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.26, 49.27, 0.0, 0.0, 40.02, 0.0, 0.0, 0.0, 0.0, 0.0, 80.82, 0.0, 0.0, 0.0, 0.0, 0.0, 40.84, 50.91, 0.0, 50.31, 0.0, 0.0, 0.0, 56.63, 41.5, 0.0, 0.0], "audiomae_on_audioset": [null, [["fart", 82.81], ["groan", 4.27], ["sound effect", 2.8]], [["fly, housefly", 13.1], ["speech", 10.93], ["mosquito", 8.05]], null, null, [["tuning fork", 38.45], ["hum", 4.81], ["music", 4.79]], null, null, null, null, null, null, null, null, null, null, null, [["noise", 47.66], ["coin (dropping)", 22.5], ["effects unit", 4.7]], null, null, null, null, null, null, null, [["sidetone", 44.18], ["speech", 21.97], ["noise", 6.63]], null, null], "duration": [0.87, 3.27, 2.09, 0.39, 1.46, 3.0, 0.16, 1.67, 1.29, 0.27, 1.18, 2.18, 1.07, 1.96, -0.13, 1.99, 1.95, 2.99, 3.57, 0.99, 12.05, 1.79, -0.07, 0.69, 2.72, 3.55, 1.45, 1.84]} \ No newline at end of file diff --git a/annotations_filtered/ir1sVy9JLyo_filtered.json b/annotations_filtered/ir1sVy9JLyo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a655786dc58112ba0b154eb0dcf6d1277364ae14 --- /dev/null +++ b/annotations_filtered/ir1sVy9JLyo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[52.0, 59.48], [60.0, 60.83], [62.0, 64.13], [66.0, 67.61], [68.0, 68.59], [72.0, 72.82], [75.0, 77.89], [78.0, 81.36], [82.0, 88.32], [98.0, 103.86], [105.0, 105.97], [112.0, 112.26], [115.0, 117.02]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [32.91, 0.0, 51.88, 0.0, 0.0, 0.0, 82.07, 50.06, 36.94, 29.94, 0.0, 0.0, 38.71], "audiomae_on_audioset": [[["music", 32.82], ["speech", 30.72], ["breaking", 5.12]], null, null, null, null, null, null, null, [["hum", 35.76], ["music", 20.78], ["mains hum", 18.23]], [["gong", 23.86], ["boing", 17.06], ["speech", 6.95]], null, null, [["hum", 41.59], ["throbbing", 18.94], ["music", 13.56]]], "duration": [7.48, 0.83, 2.13, 1.61, 0.59, 0.82, 2.89, 3.36, 6.32, 5.86, 0.97, 0.26, 2.02]} \ No newline at end of file diff --git a/annotations_filtered/irCUvLD1t5U_filtered.json b/annotations_filtered/irCUvLD1t5U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6f15758ff638722a0d15ed2dab51f9c97b16bf7 --- /dev/null +++ b/annotations_filtered/irCUvLD1t5U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 46.16], [48.0, 55.81], [57.0, 59.26], [62.0, 62.9], [64.0, 64.5], [65.0, 65.97], [67.0, 67.88], [69.0, 70.36], [73.0, 73.01], [75.0, 75.39], [77.0, 77.5], [82.0, 81.95], [83.0, 83.54], [96.0, 97.97], [101.0, 102.54], [143.0, 147.53], [169.0, 170.43], [174.0, 185.43], [187.0, 187.66]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.99, 64.18, 45.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.17, 0.0, 34.22, 0.0], "audiomae_on_audioset": [[["vehicle", 15.43], ["hum", 15.31], ["aircraft", 8.6]], null, [["speech", 24.54], ["dial tone", 10.26], ["fly, housefly", 9.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 58.26], ["eruption", 8.96], ["whack, thwack", 7.11]], null], "duration": [2.16, 7.81, 2.26, 0.9, 0.5, 0.97, 0.88, 1.36, 0.01, 0.39, 0.5, -0.05, 0.54, 1.97, 1.54, 4.53, 1.43, 11.43, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/irQ89Ny0HkI_filtered.json b/annotations_filtered/irQ89Ny0HkI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db5c10384170e78fb7efc94d5ce162d208622f35 --- /dev/null +++ b/annotations_filtered/irQ89Ny0HkI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 29.67], [35.0, 45.99], [54.0, 62.02], [66.0, 70.66], [71.0, 71.32], [72.0, 72.76]], "keep_status": [false, false, true, false, false, false], "silence_prob": [0.0, 35.27, 47.78, 35.02, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 38.03], ["sidetone", 20.17], ["speech", 13.31]], [["music", 34.71], ["speech", 16.93], ["mains hum", 11.54]], [["music", 56.13], ["theremin", 9.79], ["musical instrument", 7.2]], null, null], "duration": [0.67, 10.99, 8.02, 4.66, 0.32, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/irglCpn_Hs8_filtered.json b/annotations_filtered/irglCpn_Hs8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01106428ca57171ce37f5d764b5b4630ecaf3df4 --- /dev/null +++ b/annotations_filtered/irglCpn_Hs8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 19.38], [20.0, 24.81], [26.0, 26.54], [29.0, 30.21], [32.0, 32.95], [36.0, 43.63], [45.0, 46.47], [48.0, 49.11], [50.0, 51.31], [53.0, 74.12], [74.0, 81.18], [81.0, 100.01], [101.0, 111.47], [112.0, 117.85], [119.0, 120.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [32.32, 31.45, 0.0, 0.0, 0.0, 32.65, 0.0, 0.0, 0.0, 33.18, 32.79, 32.64, 31.68, 55.25, 0.0], "audiomae_on_audioset": [[["sidetone", 47.41], ["music", 19.56], ["speech", 9.46]], [["speech", 59.67], ["music", 21.23], ["musical instrument", 3.9]], null, null, null, [["speech", 52.52], ["music", 20.03], ["hum", 5.82]], null, null, null, [["music", 43.36], ["hum", 22.48], ["throbbing", 9.62]], [["sidetone", 40.73], ["speech", 19.62], ["hum", 15.79]], [["speech", 33.5], ["music", 14.37], ["didgeridoo", 8.74]], [["speech", 52.26], ["hum", 14.0], ["throbbing", 5.26]], null, null], "duration": [6.38, 4.81, 0.54, 1.21, 0.95, 7.63, 1.47, 1.11, 1.31, 21.12, 7.18, 19.01, 10.47, 5.85, 1.51]} \ No newline at end of file diff --git a/annotations_filtered/irglc0zZbvA_filtered.json b/annotations_filtered/irglc0zZbvA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6231c2252e5af4997a51b1698b7ec3ccbcdf8d5 --- /dev/null +++ b/annotations_filtered/irglc0zZbvA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.04], [5.0, 5.36], [7.0, 11.4], [12.0, 13.91], [19.0, 20.34], [21.0, 21.79], [25.0, 25.3], [26.0, 26.42], [27.0, 27.11], [29.0, 29.25], [32.0, 39.82], [41.0, 46.3], [47.0, 48.25], [52.0, 52.68], [54.0, 56.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 66.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.67, 49.27, 0.0, 0.0, 75.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 57.56], ["alarm clock", 8.27], ["buzzer", 6.92]], [["music", 38.39], ["hum", 8.72], ["sidetone", 8.39]], null, null, null], "duration": [1.04, 0.36, 4.4, 1.91, 1.34, 0.79, 0.3, 0.42, 0.11, 0.25, 7.82, 5.3, 1.25, 0.68, 2.88]} \ No newline at end of file diff --git a/annotations_filtered/irhRobBI3BE_filtered.json b/annotations_filtered/irhRobBI3BE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1818367e94eeb9b23f0b856b3caa93122014d74b --- /dev/null +++ b/annotations_filtered/irhRobBI3BE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.71], [9.0, 10.13], [15.0, 20.51], [51.0, 50.87], [51.0, 52.52], [59.0, 111.67], [114.0, 127.55], [129.0, 130.67], [131.0, 156.41]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [59.24, 0.0, 68.02, 0.0, 0.0, 0.0, 30.65, 0.0, 31.88], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 61.98], ["hum", 17.12], ["mains hum", 7.65]], null, [["music", 51.01], ["speech", 34.5], ["synthesizer", 1.3]]], "duration": [2.71, 1.13, 5.51, -0.13, 1.52, 52.67, 13.55, 1.67, 25.41]} \ No newline at end of file diff --git a/annotations_filtered/irkGAhW7wlQ_filtered.json b/annotations_filtered/irkGAhW7wlQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cbd1fd88d5e83ebe1687196d71eecef3ffc58dd --- /dev/null +++ b/annotations_filtered/irkGAhW7wlQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.29], [12.0, 12.33], [13.0, 14.99], [17.0, 17.85], [23.0, 23.8], [29.0, 29.17], [31.0, 57.2], [58.0, 59.16], [60.0, 74.21], [75.0, 76.77], [83.0, 83.54], [86.0, 86.59], [95.0, 98.81], [104.0, 108.57], [110.0, 110.84], [112.0, 113.02], [114.0, 119.01], [121.0, 122.37], [123.0, 123.85], [125.0, 125.41], [126.0, 127.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.63, 0.0, 84.8, 0.0, 0.0, 0.0, 99.78, 87.92, 0.0, 0.0, 76.37, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.29, 0.33, 1.99, 0.85, 0.8, 0.17, 26.2, 1.16, 14.21, 1.77, 0.54, 0.59, 3.81, 4.57, 0.84, 1.02, 5.01, 1.37, 0.85, 0.41, 1.5]} \ No newline at end of file diff --git a/annotations_filtered/irnb55gfwNc_filtered.json b/annotations_filtered/irnb55gfwNc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..173e413e20ddaf38b0ca10fef43c4a52a3c9ac52 --- /dev/null +++ b/annotations_filtered/irnb55gfwNc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.4], [16.0, 43.88], [46.0, 46.57], [47.0, 50.4], [51.0, 61.37], [65.0, 76.22], [79.0, 82.43], [84.0, 84.87], [86.0, 111.82], [114.0, 115.65], [117.0, 118.99], [125.0, 126.47]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 47.08, 0.0, 49.27, 32.25, 34.99, 34.81, 0.0, 48.52, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 77.95], ["hum", 2.93], ["mains hum", 2.17]], null, [["music", 25.93], ["mains hum", 15.09], ["hum", 8.79]], [["music", 53.31], ["synthesizer", 9.77], ["gong", 5.23]], [["music", 58.0], ["synthesizer", 10.2], ["throbbing", 6.69]], [["music", 44.25], ["throbbing", 13.41], ["synthesizer", 13.23]], null, [["hum", 40.95], ["music", 16.11], ["mains hum", 14.62]], null, null, null], "duration": [0.4, 27.88, 0.57, 3.4, 10.37, 11.22, 3.43, 0.87, 25.82, 1.65, 1.99, 1.47]} \ No newline at end of file diff --git a/annotations_filtered/irnju0G-lBg_filtered.json b/annotations_filtered/irnju0G-lBg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..590191f59a028aee525c9d1415a0587f50d2a2ec --- /dev/null +++ b/annotations_filtered/irnju0G-lBg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.45], [15.0, 61.32], [62.0, 70.23], [71.0, 71.91], [73.0, 131.68], [136.0, 136.8], [139.0, 144.51], [146.0, 153.4], [154.0, 157.1], [161.0, 170.95], [171.0, 206.88], [208.0, 208.62], [214.0, 217.11], [219.0, 221.31], [222.0, 223.38], [224.0, 224.65], [226.0, 226.15], [227.0, 228.5], [232.0, 234.66], [237.0, 238.28], [243.0, 243.77]], "keep_status": [true, false, true, false, false, false, true, true, true, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [30.8, 0.0, 30.92, 0.0, 0.0, 0.0, 31.24, 33.76, 42.67, 85.72, 0.0, 0.0, 88.1, 46.09, 0.0, 0.0, 0.0, 0.0, 28.96, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 29.89], ["music", 16.57], ["sidetone", 5.28]], null, [["music", 41.79], ["speech", 10.65], ["foghorn", 6.82]], null, null, null, [["music", 25.97], ["theremin", 22.9], ["synthesizer", 13.3]], [["music", 23.02], ["whale vocalization", 17.33], ["synthesizer", 8.59]], [["music", 49.97], ["pulse", 7.52], ["didgeridoo", 5.14]], null, null, null, null, [["speech", 32.76], ["whale vocalization", 16.94], ["sine wave", 8.19]], null, null, null, null, [["moo", 12.76], ["cattle, bovinae", 9.61], ["livestock, farm animals, working animals", 7.25]], null, null], "duration": [2.45, 46.32, 8.23, 0.91, 58.68, 0.8, 5.51, 7.4, 3.1, 9.95, 35.88, 0.62, 3.11, 2.31, 1.38, 0.65, 0.15, 1.5, 2.66, 1.28, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/iropsnsCEjA_filtered.json b/annotations_filtered/iropsnsCEjA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..767df24d427f7c60279b62d38b815658bb59d058 --- /dev/null +++ b/annotations_filtered/iropsnsCEjA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.7], [20.0, 51.29], [52.0, 51.81], [60.0, 91.69], [122.0, 122.2], [124.0, 123.77], [125.0, 125.09], [131.0, 131.79], [133.0, 172.64], [176.0, 176.74], [178.0, 178.73], [192.0, 192.5], [202.0, 202.32], [205.0, 208.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [61.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.86], ["speech", 15.68], ["foghorn", 14.04]]], "duration": [3.7, 31.29, -0.19, 31.69, 0.2, -0.23, 0.09, 0.79, 39.64, 0.74, 0.73, 0.5, 0.32, 3.08]} \ No newline at end of file diff --git a/annotations_filtered/irr4b40Ok7E_filtered.json b/annotations_filtered/irr4b40Ok7E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/irr4b40Ok7E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/is4ZtB0U7Vo_filtered.json b/annotations_filtered/is4ZtB0U7Vo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8abda3a737a041e823d2314c4787662a4c030f1 --- /dev/null +++ b/annotations_filtered/is4ZtB0U7Vo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 26.45], [28.0, 29.71], [31.0, 31.45], [38.0, 51.41], [67.0, 88.8], [93.0, 115.75], [117.0, 127.74], [129.0, 129.95], [131.0, 156.96], [157.0, 157.03], [157.0, 205.14], [206.0, 207.76], [209.0, 209.97], [211.0, 214.66]], "keep_status": [true, false, false, true, true, true, false, false, false, false, false, false, false, true], "silence_prob": [28.95, 0.0, 0.0, 29.27, 28.73, 28.63, 29.22, 0.0, 29.06, 0.0, 0.0, 0.0, 0.0, 32.5], "audiomae_on_audioset": [[["music", 32.08], ["vehicle", 7.03], ["race car, auto racing", 3.49]], null, null, [["music", 39.1], ["explosion", 8.01], ["speech", 6.49]], [["music", 26.51], ["speech", 21.96], ["hum", 7.57]], [["music", 45.48], ["speech", 12.31], ["hum", 3.16]], [["speech", 43.16], ["music", 34.4], ["throbbing", 6.04]], null, [["speech", 57.83], ["music", 13.57], ["explosion", 7.86]], null, null, null, null, [["speech", 19.81], ["music", 15.43], ["hum", 15.12]]], "duration": [9.45, 1.71, 0.45, 13.41, 21.8, 22.75, 10.74, 0.95, 25.96, 0.03, 48.14, 1.76, 0.97, 3.66]} \ No newline at end of file diff --git a/annotations_filtered/isBwMtlWLeE_filtered.json b/annotations_filtered/isBwMtlWLeE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48880e8b9741d10af9355e74a2ee25764c174e52 --- /dev/null +++ b/annotations_filtered/isBwMtlWLeE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 21.39], [25.0, 24.85], [29.0, 34.01], [35.0, 35.04], [36.0, 44.42], [46.0, 47.04], [47.0, 50.45], [51.0, 61.69], [63.0, 63.24], [65.0, 65.91], [68.0, 68.15], [72.0, 72.82], [79.0, 79.2], [80.0, 80.23], [85.0, 85.5], [89.0, 89.8], [92.0, 92.43], [95.0, 95.49], [97.0, 98.64], [99.0, 99.59], [100.0, 100.89], [104.0, 104.89], [109.0, 109.36], [110.0, 110.89], [114.0, 114.54], [118.0, 118.66], [120.0, 122.12], [123.0, 123.13], [124.0, 124.95], [125.0, 125.98], [127.0, 127.48], [128.0, 129.27], [130.0, 133.68], [135.0, 135.26], [139.0, 140.39], [144.0, 145.91], [148.0, 148.71]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [31.41, 0.0, 54.5, 0.0, 51.02, 0.0, 37.55, 84.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.91, 0.0, 0.0, 0.0, 0.0, 0.0, 36.06, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 33.07], ["electric shaver, electric razor", 18.35], ["music", 12.0]], null, null, null, null, null, [["speech", 39.94], ["sidetone", 31.08], ["chirp tone", 4.58]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 49.33], ["speech", 18.77], ["whale vocalization", 7.71]], null, null, null, null, null, [["speech", 22.1], ["fly, housefly", 14.78], ["hum", 9.12]], null, null, null, null], "duration": [9.39, -0.15, 5.01, 0.04, 8.42, 1.04, 3.45, 10.69, 0.24, 0.91, 0.15, 0.82, 0.2, 0.23, 0.5, 0.8, 0.43, 0.49, 1.64, 0.59, 0.89, 0.89, 0.36, 0.89, 0.54, 0.66, 2.12, 0.13, 0.95, 0.98, 0.48, 1.27, 3.68, 0.26, 1.39, 1.91, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/isFVKJA4E-k_filtered.json b/annotations_filtered/isFVKJA4E-k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59e9268b9c7476419285ac6fe173f4738805d630 --- /dev/null +++ b/annotations_filtered/isFVKJA4E-k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.16], [15.0, 16.01], [20.0, 20.61], [33.0, 34.06], [36.0, 36.68], [37.0, 38.85], [59.0, 59.22], [60.0, 60.08], [63.0, 63.31], [64.0, 65.1], [66.0, 66.02], [68.0, 69.13], [75.0, 76.89], [79.0, 85.28], [86.0, 86.81], [87.0, 104.63], [105.0, 104.67], [106.0, 107.22], [108.0, 108.99], [111.0, 112.38], [113.0, 113.81], [114.0, 114.0], [114.0, 119.58], [121.0, 131.4], [133.0, 133.95], [136.0, 137.3], [139.0, 139.9], [141.0, 141.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.72, 0.0, 77.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 66.39, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 27.71], ["cattle, bovinae", 13.82], ["moo", 13.23]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 1.01, 0.61, 1.06, 0.68, 1.85, 0.22, 0.08, 0.31, 1.1, 0.02, 1.13, 1.89, 6.28, 0.81, 17.63, -0.33, 1.22, 0.99, 1.38, 0.81, 0.0, 5.58, 10.4, 0.95, 1.3, 0.9, 0.4]} \ No newline at end of file diff --git a/annotations_filtered/isct-XNu38E_filtered.json b/annotations_filtered/isct-XNu38E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30fca7df9443da7de8059c28dfebb3b0c0dd663f --- /dev/null +++ b/annotations_filtered/isct-XNu38E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.28], [11.0, 12.58], [14.0, 41.49], [42.0, 54.14], [55.0, 57.0], [58.0, 65.74], [67.0, 76.18], [79.0, 79.59], [82.0, 82.44], [86.0, 85.89], [90.0, 93.19], [94.0, 95.25], [97.0, 99.42], [104.0, 106.47], [107.0, 110.1], [111.0, 115.37], [125.0, 128.53], [132.0, 171.41], [172.0, 182.41], [183.0, 183.95], [187.0, 190.58], [191.0, 191.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 91.47, 95.91, 99.97, 99.62, 91.98, 0.0, 0.0, 0.0, 64.75, 0.0, 97.73, 96.04, 87.55, 99.87, 38.35, 0.0, 34.73, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["throbbing", 16.84], ["hum", 9.83], ["music", 6.65]], null, [["whack, thwack", 33.44], ["speech", 32.91], ["music", 8.18]], null, null, null], "duration": [1.28, 1.58, 27.49, 12.14, 2.0, 7.74, 9.18, 0.59, 0.44, -0.11, 3.19, 1.25, 2.42, 2.47, 3.1, 4.37, 3.53, 39.41, 10.41, 0.95, 3.58, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/iseaUTEhwzY_filtered.json b/annotations_filtered/iseaUTEhwzY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fba9b09e0a9e54751845e258af9de0eecd3d5e4c --- /dev/null +++ b/annotations_filtered/iseaUTEhwzY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.99], [16.0, 16.95], [19.0, 19.08], [30.0, 31.04], [33.0, 34.72], [35.0, 36.32]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.99, 0.95, 0.08, 1.04, 1.72, 1.32]} \ No newline at end of file diff --git a/annotations_filtered/isgx4Srs9t8_filtered.json b/annotations_filtered/isgx4Srs9t8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f675f82d5450c44b1deac0e5a84537f78e6fb36 --- /dev/null +++ b/annotations_filtered/isgx4Srs9t8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.51], [6.0, 6.03], [8.0, 8.19], [11.0, 12.31], [13.0, 14.12], [18.0, 19.33], [21.0, 21.27], [23.0, 24.22], [26.0, 26.38], [28.0, 30.03], [31.0, 31.95], [32.0, 33.17], [35.0, 36.54], [37.0, 43.58], [44.0, 44.88], [46.0, 46.55], [50.0, 51.11], [52.0, 52.68], [55.0, 59.59], [61.0, 67.12], [69.0, 69.38], [70.0, 70.58], [72.0, 72.76], [75.0, 75.3], [78.0, 80.94], [82.0, 87.52], [89.0, 90.15], [92.0, 91.81], [92.0, 93.82], [96.0, 100.72], [102.0, 104.09], [108.0, 108.36], [112.0, 113.76], [115.0, 117.66], [121.0, 121.2], [122.0, 124.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 97.33, 0.0, 0.0, 0.0, 0.0, 100.0, 99.92, 0.0, 0.0, 0.0, 98.73, 98.36, 0.0, 0.0, 99.93, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.51, 0.03, 0.19, 1.31, 1.12, 1.33, 0.27, 1.22, 0.38, 2.03, 0.95, 1.17, 1.54, 6.58, 0.88, 0.55, 1.11, 0.68, 4.59, 6.12, 0.38, 0.58, 0.76, 0.3, 2.94, 5.52, 1.15, -0.19, 1.82, 4.72, 2.09, 0.36, 1.76, 2.66, 0.2, 2.53]} \ No newline at end of file diff --git a/annotations_filtered/iswgTDjihrU_filtered.json b/annotations_filtered/iswgTDjihrU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bd9bc5dc5d9d21e8162a759fddf5f2c5f8c3a37 --- /dev/null +++ b/annotations_filtered/iswgTDjihrU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 53.25], [64.0, 81.57], [90.0, 118.0], [118.0, 152.78], [155.0, 167.95], [170.0, 181.99], [182.0, 189.31]], "keep_status": [false, true, false, false, true, true, false], "silence_prob": [28.73, 28.52, 28.74, 0.0, 28.75, 28.56, 29.76], "audiomae_on_audioset": [[["music", 62.4], ["throbbing", 18.08], ["hum", 6.56]], [["music", 34.13], ["siren", 19.71], ["vehicle", 6.7]], [["music", 50.66], ["throbbing", 28.29], ["hum", 10.56]], null, [["music", 18.31], ["hum", 17.38], ["buzz", 15.27]], [["speech", 34.3], ["music", 18.7], ["burst, pop", 3.45]], [["speech", 59.24], ["music", 16.88], ["explosion", 5.47]]], "duration": [29.25, 17.57, 28.0, 34.78, 12.95, 11.99, 7.31]} \ No newline at end of file diff --git a/annotations_filtered/isyFunAeYnQ_filtered.json b/annotations_filtered/isyFunAeYnQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09d6346872aa90b86956dd32c6bdc874ba3748aa --- /dev/null +++ b/annotations_filtered/isyFunAeYnQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.93], [4.0, 4.51], [9.0, 9.0], [11.0, 11.28], [19.0, 26.22], [28.0, 27.94], [30.0, 30.21], [34.0, 34.72], [36.0, 36.41], [38.0, 41.05], [42.0, 43.28], [44.0, 43.92], [49.0, 81.87], [93.0, 93.66], [96.0, 97.97], [100.0, 100.36]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.51, 0.0, 0.0, 0.0, 0.0, 37.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 20.07], ["music", 17.53], ["crowd", 11.32]], null, null, null, null, [["music", 16.29], ["hum", 12.17], ["mains hum", 11.93]], null, null, null, null, null, null], "duration": [0.93, 0.51, 0.0, 0.28, 7.22, -0.06, 0.21, 0.72, 0.41, 3.05, 1.28, -0.08, 32.87, 0.66, 1.97, 0.36]} \ No newline at end of file diff --git a/annotations_filtered/itHVWrhsRSc_filtered.json b/annotations_filtered/itHVWrhsRSc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d359fda9401cbbdc1fad922d8a3b869c8b129eb5 --- /dev/null +++ b/annotations_filtered/itHVWrhsRSc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.9], [7.0, 16.9], [22.0, 24.06], [28.0, 29.17], [32.0, 36.02], [38.0, 39.87], [43.0, 45.25], [51.0, 54.57], [56.0, 57.52], [59.0, 61.08], [62.0, 65.64], [70.0, 71.02], [74.0, 75.84], [76.0, 77.01], [79.0, 79.24], [82.0, 87.3], [89.0, 89.11], [90.0, 92.45], [106.0, 108.53], [109.0, 109.14], [109.0, 111.91], [113.0, 115.89], [119.0, 122.42], [124.0, 125.42], [131.0, 132.33]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [39.24, 99.48, 65.2, 0.0, 98.1, 0.0, 44.75, 99.98, 0.0, 89.9, 32.71, 0.0, 0.0, 0.0, 0.0, 60.42, 0.0, 66.15, 41.03, 0.0, 41.56, 60.7, 41.87, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 66.79], ["sidetone", 8.88], ["hum", 2.23]], null, null, null, null, null, [["speech", 19.8], ["music", 4.91], ["echo", 3.45]], null, null, null, [["cattle, bovinae", 26.72], ["moo", 20.56], ["livestock, farm animals, working animals", 15.02]], null, null, null, null, null, null, null, [["music", 21.7], ["crow", 18.62], ["frog", 16.69]], null, [["speech", 30.84], ["music", 26.94], ["buzzer", 5.42]], null, [["speech", 36.34], ["chirp tone", 26.53], ["busy signal", 8.77]], null, null], "duration": [2.9, 9.9, 2.06, 1.17, 4.02, 1.87, 2.25, 3.57, 1.52, 2.08, 3.64, 1.02, 1.84, 1.01, 0.24, 5.3, 0.11, 2.45, 2.53, 0.14, 2.91, 2.89, 3.42, 1.42, 1.33]} \ No newline at end of file diff --git a/annotations_filtered/itIDxKxfGJI_filtered.json b/annotations_filtered/itIDxKxfGJI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..efb409924f27ca82392ea29a87a070fbd6e135a9 --- /dev/null +++ b/annotations_filtered/itIDxKxfGJI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.19], [9.0, 9.75], [13.0, 14.89], [16.0, 16.36], [17.0, 18.32], [19.0, 20.29], [21.0, 67.46], [68.0, 70.39], [74.0, 74.17], [75.0, 87.96], [89.0, 105.17]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.77, 0.0, 32.73, 40.41], "audiomae_on_audioset": [[["fart", 20.5], ["throbbing", 8.68], ["speech", 6.41]], null, null, null, null, null, null, [["music", 65.05], ["didgeridoo", 10.54], ["musical instrument", 3.51]], null, [["music", 53.13], ["speech", 25.4], ["guitar", 4.05]], [["music", 49.55], ["thunk", 28.39], ["theremin", 8.85]]], "duration": [3.19, 0.75, 1.89, 0.36, 1.32, 1.29, 46.46, 2.39, 0.17, 12.96, 16.17]} \ No newline at end of file diff --git a/annotations_filtered/it_WqpOBfWI_filtered.json b/annotations_filtered/it_WqpOBfWI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb8bc76ed8db713ef1c2d526fb9e5705833022c0 --- /dev/null +++ b/annotations_filtered/it_WqpOBfWI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.06], [14.0, 14.08], [18.0, 19.2], [20.0, 21.64], [23.0, 24.19], [26.0, 29.57], [30.0, 31.02], [31.0, 32.39], [35.0, 36.64], [37.0, 37.03], [37.0, 37.25], [38.0, 40.14], [46.0, 49.18], [61.0, 61.57], [71.0, 71.74], [72.0, 73.9], [74.0, 77.04], [79.0, 79.74], [83.0, 85.4], [92.0, 97.11], [99.0, 99.71], [101.0, 102.2], [107.0, 107.2], [108.0, 150.6], [151.0, 158.45], [160.0, 161.15], [178.0, 180.4]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 34.79, 0.0, 0.0, 0.0, 0.0, 0.0, 90.43, 41.87, 0.0, 0.0, 0.0, 68.8, 0.0, 79.94, 48.91, 0.0, 0.0, 0.0, 0.0, 31.73, 0.0, 55.81], "audiomae_on_audioset": [null, null, null, null, null, [["music", 35.37], ["moo", 11.33], ["cattle, bovinae", 11.27]], null, null, null, null, null, null, [["music", 42.46], ["speech", 18.27], ["synthesizer", 8.27]], null, null, null, null, null, null, [["throbbing", 52.72], ["music", 23.34], ["hum", 15.77]], null, null, null, null, [["music", 87.98], ["speech", 2.35], ["musical instrument", 0.65]], null, null], "duration": [1.06, 0.08, 1.2, 1.64, 1.19, 3.57, 1.02, 1.39, 1.64, 0.03, 0.25, 2.14, 3.18, 0.57, 0.74, 1.9, 3.04, 0.74, 2.4, 5.11, 0.71, 1.2, 0.2, 42.6, 7.45, 1.15, 2.4]} \ No newline at end of file diff --git a/annotations_filtered/itdD328hLuQ_filtered.json b/annotations_filtered/itdD328hLuQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46bd513c7257dffc70591c9ce7333bacfa59e438 --- /dev/null +++ b/annotations_filtered/itdD328hLuQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.01], [13.0, 13.9], [15.0, 18.28], [34.0, 39.07], [44.0, 43.8], [44.0, 44.04], [47.0, 52.46], [55.0, 55.78], [58.0, 64.67], [66.0, 66.55], [71.0, 70.93], [77.0, 78.07], [80.0, 80.49]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.76, 42.39, 0.0, 0.0, 50.41, 0.0, 32.31, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["boing", 54.52], ["quack", 8.27], ["speech", 5.9]], [["noise", 29.09], ["crushing", 17.4], ["hum", 4.87]], null, null, null, null, [["speech", 69.09], ["beatboxing", 7.84], ["fart", 5.24]], null, null, null, null], "duration": [1.01, 0.9, 3.28, 5.07, -0.2, 0.04, 5.46, 0.78, 6.67, 0.55, -0.07, 1.07, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/iuKNXP9LcSg_filtered.json b/annotations_filtered/iuKNXP9LcSg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17f84c879081aec5b5840478c3a35965ffb95232 --- /dev/null +++ b/annotations_filtered/iuKNXP9LcSg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.76], [28.0, 29.67], [30.0, 31.08], [43.0, 43.83], [57.0, 57.32], [60.0, 59.83], [62.0, 62.48], [67.0, 68.71], [74.0, 76.32], [82.0, 83.73], [85.0, 84.86], [90.0, 92.43], [96.0, 96.65], [100.0, 100.23], [102.0, 102.91], [104.0, 106.19], [107.0, 108.26], [110.0, 110.49], [116.0, 123.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.34, 0.0, 0.0, 45.98, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 36.49], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 19.93], ["noise", 4.05], ["inside, small room", 4.04]], null, null, null, null, null, null, [["noise", 87.75], ["music", 2.25], ["synthesizer", 1.36]]], "duration": [1.76, 1.67, 1.08, 0.83, 0.32, -0.17, 0.48, 1.71, 2.32, 1.73, -0.14, 2.43, 0.65, 0.23, 0.91, 2.19, 1.26, 0.49, 7.33]} \ No newline at end of file diff --git a/annotations_filtered/iuL2loyB1bk_filtered.json b/annotations_filtered/iuL2loyB1bk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99e801e3ee8476c65dc6cfe796f1a0922cc6ceed --- /dev/null +++ b/annotations_filtered/iuL2loyB1bk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.38], [12.0, 14.94], [15.0, 21.49], [27.0, 28.19], [29.0, 29.46], [38.0, 38.5], [41.0, 40.93], [50.0, 50.31], [54.0, 54.67], [69.0, 69.65], [75.0, 76.99], [90.0, 90.61], [94.0, 95.37]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.98, 98.86, 46.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 36.68], ["thunk", 19.96], ["synthesizer", 5.73]], null, null, null, null, null, null, null, null, null, null], "duration": [3.38, 2.94, 6.49, 1.19, 0.46, 0.5, -0.07, 0.31, 0.67, 0.65, 1.99, 0.61, 1.37]} \ No newline at end of file diff --git a/annotations_filtered/iuPDl6n2vO0_filtered.json b/annotations_filtered/iuPDl6n2vO0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64c3f20e83333e381de0e222d99a8bc6004a6223 --- /dev/null +++ b/annotations_filtered/iuPDl6n2vO0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.99], [12.0, 13.09], [15.0, 16.6], [17.0, 17.78], [18.0, 19.92], [21.0, 21.47], [23.0, 26.47], [28.0, 28.8], [32.0, 32.12], [35.0, 36.19], [43.0, 43.87], [47.0, 51.63], [52.0, 52.54], [60.0, 60.47], [62.0, 62.04], [62.0, 64.02], [65.0, 66.87], [68.0, 71.9], [73.0, 74.24], [76.0, 76.92], [85.0, 86.58], [88.0, 89.73], [92.0, 92.91], [97.0, 97.19], [99.0, 99.0], [104.0, 105.48], [109.0, 112.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [41.28, 0.0, 0.0, 0.0, 0.0, 0.0, 53.53, 0.0, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 0.0, 68.54, 0.0, 77.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52], "audiomae_on_audioset": [[["music", 74.06], ["musical instrument", 4.02], ["speech", 3.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.99, 1.09, 1.6, 0.78, 1.92, 0.47, 3.47, 0.8, 0.12, 1.19, 0.87, 4.63, 0.54, 0.47, 0.04, 2.02, 1.87, 3.9, 1.24, 0.92, 1.58, 1.73, 0.91, 0.19, 0.0, 1.48, 3.21]} \ No newline at end of file diff --git a/annotations_filtered/iv1eE7qxDXA_filtered.json b/annotations_filtered/iv1eE7qxDXA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf369387624866e3765c78e04b73cbe99a88388f --- /dev/null +++ b/annotations_filtered/iv1eE7qxDXA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.66], [7.0, 38.5], [40.0, 39.6], [53.0, 55.81], [56.0, 56.32], [59.0, 70.5], [82.0, 82.61], [89.0, 98.14], [101.0, 103.38], [118.0, 118.37], [118.0, 120.5]], "keep_status": [false, false, false, false, false, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 51.66, 0.0, 42.51, 0.0, 42.91, 48.74, 0.0, 52.22], "audiomae_on_audioset": [null, null, null, null, null, [["music", 22.52], ["speech", 20.83], ["fly, housefly", 11.91]], null, [["music", 38.93], ["wild animals", 10.62], ["speech", 8.2]], [["music", 39.7], ["speech", 11.97], ["throbbing", 6.07]], null, null], "duration": [0.66, 31.5, -0.4, 2.81, 0.32, 11.5, 0.61, 9.14, 2.38, 0.37, 2.5]} \ No newline at end of file diff --git a/annotations_filtered/iv2j0CJkzbM_filtered.json b/annotations_filtered/iv2j0CJkzbM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa7ddc8ab6765ac3178b92b099afb4f8283c2124 --- /dev/null +++ b/annotations_filtered/iv2j0CJkzbM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.52], [19.0, 30.32], [31.0, 31.89], [33.0, 35.02], [38.0, 38.64], [45.0, 46.06], [49.0, 61.48], [63.0, 64.03], [68.0, 69.31], [70.0, 70.87], [74.0, 77.14], [80.0, 85.09], [89.0, 88.53], [89.0, 92.03], [95.0, 94.81], [95.0, 95.67], [100.0, 100.08], [102.0, 109.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [74.76, 81.35, 0.0, 90.25, 0.0, 0.0, 85.9, 0.0, 0.0, 0.0, 52.51, 83.16, 0.0, 93.6, 0.0, 0.0, 0.0, 36.74], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 15.98], ["music", 13.07], ["mains hum", 8.17]]], "duration": [3.52, 11.32, 0.89, 2.02, 0.64, 1.06, 12.48, 1.03, 1.31, 0.87, 3.14, 5.09, -0.47, 3.03, -0.19, 0.67, 0.08, 7.12]} \ No newline at end of file diff --git a/annotations_filtered/ivG26TnBWGI_filtered.json b/annotations_filtered/ivG26TnBWGI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18308e37d1f6d22994505ffe26b685222a5f3717 --- /dev/null +++ b/annotations_filtered/ivG26TnBWGI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.85], [10.0, 20.73], [22.0, 24.24], [27.0, 30.7], [32.0, 32.26], [34.0, 41.15], [43.0, 44.27], [45.0, 52.71], [58.0, 58.67], [59.0, 63.15], [66.0, 71.07], [71.0, 71.68], [74.0, 82.95], [84.0, 84.57], [86.0, 97.14], [106.0, 123.52]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [33.05, 29.86, 30.06, 31.35, 0.0, 29.5, 0.0, 29.18, 0.0, 34.22, 30.0, 0.0, 30.37, 0.0, 29.61, 29.28], "audiomae_on_audioset": [[["music", 37.84], ["speech", 37.49], ["throbbing", 8.06]], [["music", 27.45], ["speech", 24.49], ["fly, housefly", 3.64]], [["music", 38.06], ["speech", 10.47], ["vehicle", 7.57]], [["music", 35.23], ["hum", 17.8], ["mains hum", 17.5]], null, [["music", 41.13], ["speech", 40.05], ["theremin", 1.77]], null, [["music", 42.25], ["didgeridoo", 21.36], ["theremin", 9.6]], null, [["music", 69.77], ["speech", 5.97], ["electronic music", 3.25]], [["music", 49.43], ["thunk", 12.9], ["whack, thwack", 9.84]], null, [["speech", 29.95], ["mains hum", 13.25], ["animal", 10.46]], null, [["music", 65.19], ["throbbing", 4.34], ["musical instrument", 2.29]], [["fly, housefly", 40.62], ["insect", 37.16], ["mosquito", 16.52]]], "duration": [3.85, 10.73, 2.24, 3.7, 0.26, 7.15, 1.27, 7.71, 0.67, 4.15, 5.07, 0.68, 8.95, 0.57, 11.14, 17.52]} \ No newline at end of file diff --git a/annotations_filtered/ivGfI_8TE9I_filtered.json b/annotations_filtered/ivGfI_8TE9I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d2ae835d0b41ad844ebb6ae42afd471a4564e2a --- /dev/null +++ b/annotations_filtered/ivGfI_8TE9I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 14.81], [17.0, 17.63], [18.0, 20.63], [24.0, 25.0], [28.0, 28.63], [30.0, 30.48], [33.0, 33.86], [39.0, 50.53], [52.0, 53.11], [64.0, 65.3], [66.0, 66.87], [77.0, 82.75], [85.0, 85.78], [87.0, 90.02], [91.0, 97.16], [98.0, 119.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [77.36, 0.0, 60.32, 0.0, 0.0, 0.0, 0.0, 98.36, 0.0, 0.0, 0.0, 99.31, 0.0, 99.48, 96.54, 90.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.81, 0.63, 2.63, 1.0, 0.63, 0.48, 0.86, 11.53, 1.11, 1.3, 0.87, 5.75, 0.78, 3.02, 6.16, 21.5]} \ No newline at end of file diff --git a/annotations_filtered/ivZaXeAv5X4_filtered.json b/annotations_filtered/ivZaXeAv5X4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c55b319903838e3d42ed1e566b61dc12788dcaf --- /dev/null +++ b/annotations_filtered/ivZaXeAv5X4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.44], [10.0, 14.71], [17.0, 16.77], [19.0, 19.35], [20.0, 45.27], [48.0, 48.64], [50.0, 59.9], [62.0, 98.66], [102.0, 103.54], [105.0, 111.75], [115.0, 118.34], [119.0, 119.52], [121.0, 121.78], [124.0, 124.43], [126.0, 133.07], [137.0, 142.65], [146.0, 151.82], [153.0, 159.21]], "keep_status": [false, true, false, false, true, false, false, false, false, true, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 34.77, 0.0, 0.0, 34.82, 0.0, 34.32, 0.0, 0.0, 32.93, 32.01, 0.0, 0.0, 0.0, 61.37, 48.19, 73.97, 54.7], "audiomae_on_audioset": [null, [["speech", 32.15], ["music", 25.42], ["foghorn", 8.39]], null, null, [["music", 25.51], ["buzz", 16.85], ["speech", 8.72]], null, [["music", 70.03], ["scary music", 11.25], ["mains hum", 2.99]], null, null, [["music", 26.54], ["hum", 13.24], ["mains hum", 8.74]], [["thunk", 13.97], ["fly, housefly", 8.93], ["mosquito", 5.85]], null, null, null, null, [["music", 16.79], ["livestock, farm animals, working animals", 12.27], ["cattle, bovinae", 11.89]], null, null], "duration": [1.44, 4.71, -0.23, 0.35, 25.27, 0.64, 9.9, 36.66, 1.54, 6.75, 3.34, 0.52, 0.78, 0.43, 7.07, 5.65, 5.82, 6.21]} \ No newline at end of file diff --git a/annotations_filtered/iv_Q51lofKM_filtered.json b/annotations_filtered/iv_Q51lofKM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ecd9f5b4d0977f8073d2e6dcd32e8617b425b1e --- /dev/null +++ b/annotations_filtered/iv_Q51lofKM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.47], [16.0, 16.77], [17.0, 17.78], [20.0, 22.27], [29.0, 29.57], [30.0, 36.53], [40.0, 40.86], [41.0, 41.5], [45.0, 48.0], [48.0, 48.03], [48.0, 48.07], [49.0, 48.71], [54.0, 55.54], [57.0, 58.46], [71.0, 71.44], [79.0, 80.35], [95.0, 95.2], [96.0, 96.3], [97.0, 97.75], [98.0, 98.24], [101.0, 104.58], [110.0, 111.03], [112.0, 115.52], [116.0, 116.04], [118.0, 117.68], [130.0, 133.52], [134.0, 134.62], [145.0, 145.17], [148.0, 148.36]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [42.39, 0.0, 0.0, 46.09, 0.0, 39.96, 0.0, 0.0, 35.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.07, 0.0, 42.67, 0.0, 0.0, 35.3, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 48.01], ["thunk", 31.35], ["breaking", 3.38]], null, null, [["speech", 29.54], ["music", 18.66], ["noise", 5.76]], null, [["music", 40.74], ["speech", 35.31], ["sidetone", 2.39]], null, null, [["speech", 53.35], ["music", 16.3], ["speech synthesizer", 6.57]], null, null, null, null, null, null, null, null, null, null, null, [["music", 53.78], ["throbbing", 5.97], ["hum", 3.77]], null, [["music", 60.01], ["throbbing", 17.12], ["hum", 5.68]], null, null, [["cattle, bovinae", 26.92], ["music", 21.48], ["moo", 19.27]], null, null, null], "duration": [3.47, 0.77, 0.78, 2.27, 0.57, 6.53, 0.86, 0.5, 3.0, 0.03, 0.07, -0.29, 1.54, 1.46, 0.44, 1.35, 0.2, 0.3, 0.75, 0.24, 3.58, 1.03, 3.52, 0.04, -0.32, 3.52, 0.62, 0.17, 0.36]} \ No newline at end of file diff --git a/annotations_filtered/ivmjSqQ_7aw_filtered.json b/annotations_filtered/ivmjSqQ_7aw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7de25e560eb699a2c6411a666a92fd54ed2c2d6 --- /dev/null +++ b/annotations_filtered/ivmjSqQ_7aw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.0], [5.0, 6.32], [8.0, 8.56], [20.0, 19.87], [22.0, 24.33], [27.0, 27.01], [29.0, 29.96], [36.0, 35.97], [37.0, 37.2], [42.0, 43.14], [50.0, 50.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 80.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 1.32, 0.56, -0.13, 2.33, 0.01, 0.96, -0.03, 0.2, 1.14, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/ivzvZlKaKAs_filtered.json b/annotations_filtered/ivzvZlKaKAs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b767b01268e16cc04e0a527b8cb86f935841e009 --- /dev/null +++ b/annotations_filtered/ivzvZlKaKAs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.8], [9.0, 10.45], [26.0, 29.62], [33.0, 33.35], [39.0, 39.61], [40.0, 40.15], [57.0, 57.72], [66.0, 66.23], [67.0, 67.76], [70.0, 72.28], [77.0, 77.89], [78.0, 78.44], [80.0, 81.43], [83.0, 89.75], [90.0, 90.95], [92.0, 92.23], [93.0, 94.71], [95.0, 100.97], [104.0, 104.46], [110.0, 111.5], [114.0, 116.77], [118.0, 119.87], [122.0, 123.8], [127.0, 126.99], [128.0, 129.68], [133.0, 133.76], [138.0, 138.28], [141.0, 143.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 86.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.7, 0.0, 0.0, 0.0, 82.97, 0.0, 0.0, 0.0, 87.37, 0.0, 0.0, 71.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 70.58], ["didgeridoo", 5.64], ["musical instrument", 2.91]]], "duration": [-0.2, 1.45, 3.62, 0.35, 0.61, 0.15, 0.72, 0.23, 0.76, 2.28, 0.89, 0.44, 1.43, 6.75, 0.95, 0.23, 1.71, 5.97, 0.46, 1.5, 2.77, 1.87, 1.8, -0.01, 1.68, 0.76, 0.28, 2.19]} \ No newline at end of file diff --git a/annotations_filtered/iw-0Y6HWb9Q_filtered.json b/annotations_filtered/iw-0Y6HWb9Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33451406383d552e601f69be10390a8a38b061f3 --- /dev/null +++ b/annotations_filtered/iw-0Y6HWb9Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.16], [8.0, 10.32], [12.0, 13.15], [17.0, 17.9], [19.0, 24.02], [25.0, 25.61], [27.0, 27.7], [30.0, 31.29], [32.0, 32.66], [33.0, 33.89], [35.0, 35.56], [38.0, 38.47], [39.0, 39.75], [44.0, 44.98], [45.0, 47.61], [48.0, 51.34], [52.0, 55.0], [62.0, 64.05], [67.0, 113.44], [114.0, 114.79], [115.0, 120.65], [122.0, 123.74], [124.0, 127.25], [128.0, 128.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [91.47, 67.51, 0.0, 0.0, 82.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.16, 81.89, 29.52, 61.27, 0.0, 0.0, 30.76, 0.0, 35.08, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 42.25], ["hum", 13.46], ["music", 7.81]], null, [["speech", 34.28], ["music", 18.98], ["thump, thud", 12.16]], null, null, null, [["explosion", 44.66], ["speech", 23.58], ["burst, pop", 13.68]], null, [["speech", 68.16], ["groan", 7.35], ["animal", 2.87]], null], "duration": [4.16, 2.32, 1.15, 0.9, 5.02, 0.61, 0.7, 1.29, 0.66, 0.89, 0.56, 0.47, 0.75, 0.98, 2.61, 3.34, 3.0, 2.05, 46.44, 0.79, 5.65, 1.74, 3.25, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/iwAciIQDE4A_filtered.json b/annotations_filtered/iwAciIQDE4A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72a08ab452b9826b29a5eac83ea203fe58c4a18b --- /dev/null +++ b/annotations_filtered/iwAciIQDE4A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.97], [15.0, 14.89], [16.0, 18.47], [26.0, 28.48], [29.0, 30.13], [39.0, 40.2], [57.0, 57.84], [62.0, 61.82], [64.0, 65.31], [71.0, 71.12], [76.0, 76.54], [78.0, 80.33], [81.0, 83.05], [84.0, 85.53], [89.0, 89.04], [92.0, 93.07], [98.0, 98.04], [100.0, 100.62], [102.0, 102.46], [108.0, 108.8], [122.0, 126.96], [129.0, 129.64], [130.0, 132.65], [135.0, 135.28]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 44.99, 38.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.91, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 23.56], ["music", 19.43], ["didgeridoo", 9.45]], [["thunk", 57.68], ["music", 16.59], ["throbbing", 8.17]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 23.93], ["music", 5.46], ["boing", 4.41]], null, null, null], "duration": [0.97, -0.11, 2.47, 2.48, 1.13, 1.2, 0.84, -0.18, 1.31, 0.12, 0.54, 2.33, 2.05, 1.53, 0.04, 1.07, 0.04, 0.62, 0.46, 0.8, 4.96, 0.64, 2.65, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/iwGU5hY6stw_filtered.json b/annotations_filtered/iwGU5hY6stw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..806ca80c4619f0edd5fafcb73e57e3bb9ad0ea6a --- /dev/null +++ b/annotations_filtered/iwGU5hY6stw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.54], [13.0, 15.48], [19.0, 19.77], [23.0, 24.06], [31.0, 32.34], [42.0, 72.57], [73.0, 78.04], [78.0, 89.99], [95.0, 120.72], [121.0, 126.3], [128.0, 129.76], [130.0, 130.35], [131.0, 132.06], [132.0, 134.27]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, true], "silence_prob": [0.0, 30.78, 0.0, 0.0, 0.0, 0.0, 28.97, 29.06, 29.01, 27.93, 0.0, 0.0, 0.0, 28.2], "audiomae_on_audioset": [null, [["music", 55.17], ["mains hum", 10.64], ["hum", 9.38]], null, null, null, null, [["music", 36.66], ["theremin", 17.07], ["didgeridoo", 12.62]], [["music", 53.56], ["hum", 7.22], ["throbbing", 4.64]], [["music", 51.08], ["didgeridoo", 16.89], ["hum", 10.73]], [["livestock, farm animals, working animals", 51.7], ["cattle, bovinae", 38.16], ["moo", 7.14]], null, null, null, [["rumble", 20.11], ["fly, housefly", 17.94], ["insect", 12.93]]], "duration": [1.54, 2.48, 0.77, 1.06, 1.34, 30.57, 5.04, 11.99, 25.72, 5.3, 1.76, 0.35, 1.06, 2.27]} \ No newline at end of file diff --git a/annotations_filtered/iwXsuJXUau4_filtered.json b/annotations_filtered/iwXsuJXUau4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0500d29174add10ab4c13fcf8b3b296708e43e1 --- /dev/null +++ b/annotations_filtered/iwXsuJXUau4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.31], [7.0, 7.74], [10.0, 10.27], [11.0, 13.27], [14.0, 15.97], [24.0, 24.51], [26.0, 26.1], [27.0, 41.44], [43.0, 46.97], [48.0, 48.74], [50.0, 52.89], [55.0, 55.93], [57.0, 60.51], [65.0, 65.67], [66.0, 68.52], [69.0, 76.35], [77.0, 89.83], [91.0, 94.61], [98.0, 99.81], [106.0, 109.48], [111.0, 111.64], [114.0, 118.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 100.0, 0.0, 100.0, 0.0, 100.0, 100.0, 100.0, 94.52, 0.0, 99.96, 0.0, 99.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.31, 0.74, 0.27, 2.27, 1.97, 0.51, 0.1, 14.44, 3.97, 0.74, 2.89, 0.93, 3.51, 0.67, 2.52, 7.35, 12.83, 3.61, 1.81, 3.48, 0.64, 4.12]} \ No newline at end of file diff --git a/annotations_filtered/iwfU4ei5gWE_filtered.json b/annotations_filtered/iwfU4ei5gWE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5efab507d829ff804adcae443664ec2575267b5 --- /dev/null +++ b/annotations_filtered/iwfU4ei5gWE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.83], [23.0, 23.06], [28.0, 28.78], [36.0, 37.37], [39.0, 39.01], [41.0, 41.86], [48.0, 48.19], [49.0, 49.33], [52.0, 53.08], [56.0, 56.86], [58.0, 58.33], [66.0, 67.27], [72.0, 86.98], [88.0, 88.72], [90.0, 90.66], [95.0, 95.25], [100.0, 100.23], [111.0, 114.39], [119.0, 119.28], [121.0, 121.12], [122.0, 128.63], [130.0, 130.44], [137.0, 137.24], [141.0, 140.93], [144.0, 145.03], [150.0, 150.33], [157.0, 157.49], [159.0, 159.19], [162.0, 162.04], [163.0, 163.71], [164.0, 165.05], [167.0, 167.29], [171.0, 171.44], [178.0, 179.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.3, 0.0, 0.0, 0.0, 0.0, 45.36, 0.0, 0.0, 56.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.17], ["speech", 12.07], ["animal", 8.81]], null, null, null, null, [["speech", 59.93], ["music", 6.49], ["didgeridoo", 2.02]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.17, 0.06, 0.78, 1.37, 0.01, 0.86, 0.19, 0.33, 1.08, 0.86, 0.33, 1.27, 14.98, 0.72, 0.66, 0.25, 0.23, 3.39, 0.28, 0.12, 6.63, 0.44, 0.24, -0.07, 1.03, 0.33, 0.49, 0.19, 0.04, 0.71, 1.05, 0.29, 0.44, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/iwxe2sIgQL0_filtered.json b/annotations_filtered/iwxe2sIgQL0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c278db80deb9879b50f54fbfb03eada121d16121 --- /dev/null +++ b/annotations_filtered/iwxe2sIgQL0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.26], [5.0, 7.6], [17.0, 18.17], [24.0, 24.19], [30.0, 31.35], [37.0, 36.76], [41.0, 41.42], [49.0, 48.84], [50.0, 51.51], [52.0, 53.91], [55.0, 56.05], [57.0, 57.77], [59.0, 60.12], [62.0, 63.49], [66.0, 67.64], [69.0, 70.51], [75.0, 76.47]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 49.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["fly, housefly", 16.81], ["insect", 10.74], ["crushing", 6.05]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.26, 2.6, 1.17, 0.19, 1.35, -0.24, 0.42, -0.16, 1.51, 1.91, 1.05, 0.77, 1.12, 1.49, 1.64, 1.51, 1.47]} \ No newline at end of file diff --git a/annotations_filtered/ixYWkDAPPzA_filtered.json b/annotations_filtered/ixYWkDAPPzA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9254ddb5e48fed9e314684b9217b2c4c3edf057e --- /dev/null +++ b/annotations_filtered/ixYWkDAPPzA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.09], [26.0, 26.64], [28.0, 28.36], [32.0, 32.8], [45.0, 46.63], [47.0, 48.63], [51.0, 51.43], [53.0, 53.81], [57.0, 65.57], [68.0, 68.69], [73.0, 105.49], [111.0, 129.37], [135.0, 151.28], [152.0, 153.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.85, 0.0, 0.0, 48.27, 41.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 47.12], ["speech", 21.5], ["theremin", 8.39]], null, null, [["music", 39.65], ["synthesizer", 16.84], ["keyboard (musical)", 7.84]], [["music", 41.01], ["speech", 21.19], ["ambient music", 9.41]], null], "duration": [0.09, 0.64, 0.36, 0.8, 1.63, 1.63, 0.43, 0.81, 8.57, 0.69, 32.49, 18.37, 16.28, 1.76]} \ No newline at end of file diff --git a/annotations_filtered/ixbStXcVqW4_filtered.json b/annotations_filtered/ixbStXcVqW4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf5dafa3c80c16b30b79712a0dd31c946cf71acb --- /dev/null +++ b/annotations_filtered/ixbStXcVqW4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 21.15], [25.0, 49.74], [52.0, 57.77], [60.0, 61.32], [64.0, 64.12], [69.0, 87.78], [107.0, 107.5], [111.0, 111.74], [112.0, 127.8]], "keep_status": [true, true, true, false, false, false, false, false, false], "silence_prob": [32.18, 33.94, 37.05, 0.0, 0.0, 31.54, 0.0, 0.0, 34.75], "audiomae_on_audioset": [[["music", 34.56], ["speech", 26.14], ["electric shaver, electric razor", 4.56]], [["music", 35.32], ["speech", 20.18], ["sitar", 5.12]], [["music", 49.25], ["speech", 15.55], ["foghorn", 3.41]], null, null, [["livestock, farm animals, working animals", 31.69], ["moo", 26.7], ["cattle, bovinae", 20.86]], null, null, [["music", 36.94], ["speech", 32.06], ["foghorn", 9.27]]], "duration": [21.15, 24.74, 5.77, 1.32, 0.12, 18.78, 0.5, 0.74, 15.8]} \ No newline at end of file diff --git a/annotations_filtered/ixljWVyPby0_filtered.json b/annotations_filtered/ixljWVyPby0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eaf078cf0008181a17beec59e26d1c212dd901e2 --- /dev/null +++ b/annotations_filtered/ixljWVyPby0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.48], [12.0, 12.46], [14.0, 15.3], [16.0, 16.28], [21.0, 21.42], [29.0, 30.03], [32.0, 33.08], [34.0, 34.62], [36.0, 36.8], [38.0, 39.04], [40.0, 44.41], [47.0, 55.78], [59.0, 62.09], [63.0, 63.78], [65.0, 66.7], [71.0, 72.08], [75.0, 76.03], [77.0, 78.19], [85.0, 85.75], [88.0, 90.86], [93.0, 94.2], [97.0, 97.44], [99.0, 99.54], [102.0, 102.73], [104.0, 120.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.7, 32.23, 30.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.61, 0.0, 0.0, 0.0, 0.0, 30.15], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 28.56], ["hum", 10.74], ["throbbing", 9.23]], [["explosion", 28.5], ["hum", 21.68], ["throbbing", 10.19]], [["synthesizer", 22.64], ["music", 15.57], ["brass instrument", 12.07]], null, null, null, null, null, null, null, null, null, null, null, [["music", 75.32], ["brass instrument", 5.22], ["musical instrument", 4.04]]], "duration": [1.48, 0.46, 1.3, 0.28, 0.42, 1.03, 1.08, 0.62, 0.8, 1.04, 4.41, 8.78, 3.09, 0.78, 1.7, 1.08, 1.03, 1.19, 0.75, 2.86, 1.2, 0.44, 0.54, 0.73, 16.18]} \ No newline at end of file diff --git a/annotations_filtered/iy-SmSGYYBM_filtered.json b/annotations_filtered/iy-SmSGYYBM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13a524713cce6c1fb1fffb67c3f849801ac16f58 --- /dev/null +++ b/annotations_filtered/iy-SmSGYYBM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 33.64], [47.0, 47.22], [51.0, 57.54], [67.0, 99.52], [103.0, 104.18]], "keep_status": [false, false, false, false, false], "silence_prob": [30.84, 0.0, 31.18, 0.0, 0.0], "audiomae_on_audioset": [[["music", 65.1], ["speech", 8.83], ["boing", 5.98]], null, [["music", 80.82], ["boing", 5.03], ["didgeridoo", 2.44]], null, null], "duration": [25.64, 0.22, 6.54, 32.52, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/iyCfFXxNtp8_filtered.json b/annotations_filtered/iyCfFXxNtp8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddc613c9b515fabba574de4311caaf91042aa83d --- /dev/null +++ b/annotations_filtered/iyCfFXxNtp8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.23], [6.0, 6.86], [8.0, 9.36], [10.0, 12.11], [16.0, 17.78], [21.0, 22.38], [25.0, 25.57], [27.0, 28.98], [30.0, 30.33]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 80.64, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.23, 0.86, 1.36, 2.11, 1.78, 1.38, 0.57, 1.98, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/iyHNryKojDY_filtered.json b/annotations_filtered/iyHNryKojDY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5a051a0f567ff97291c8028da9ba64f72f1ae2e --- /dev/null +++ b/annotations_filtered/iyHNryKojDY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.46], [9.0, 10.05], [12.0, 36.96], [42.0, 50.3], [53.0, 58.89], [59.0, 61.1], [63.0, 64.0], [68.0, 71.68], [77.0, 85.21], [93.0, 93.66], [94.0, 96.48], [97.0, 98.49], [101.0, 103.69], [107.0, 123.52], [128.0, 129.2]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [85.54, 0.0, 44.29, 55.81, 58.98, 62.17, 0.0, 42.35, 53.47, 0.0, 55.96, 0.0, 66.03, 47.39, 0.0], "audiomae_on_audioset": [null, null, [["music", 64.91], ["guitar", 9.98], ["bass guitar", 5.02]], null, null, null, null, [["music", 54.56], ["hum", 6.9], ["electronic music", 3.76]], null, null, null, null, null, [["music", 78.17], ["musical instrument", 4.49], ["synthesizer", 2.8]], null], "duration": [5.46, 1.05, 24.96, 8.3, 5.89, 2.1, 1.0, 3.68, 8.21, 0.66, 2.48, 1.49, 2.69, 16.52, 1.2]} \ No newline at end of file diff --git a/annotations_filtered/iz2ro0h_TmQ_filtered.json b/annotations_filtered/iz2ro0h_TmQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c895239727be28eabfc3a93c6f4d722bb13e9f0f --- /dev/null +++ b/annotations_filtered/iz2ro0h_TmQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 50.77], [51.0, 84.92]], "keep_status": [false, false], "silence_prob": [30.58, 0.0], "audiomae_on_audioset": [[["music", 67.45], ["throbbing", 9.56], ["hum", 5.04]], null], "duration": [17.77, 33.92]} \ No newline at end of file diff --git a/annotations_filtered/iz3ETniN1NI_filtered.json b/annotations_filtered/iz3ETniN1NI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da67efc296f07bdebd6b7f71d35f4eea1147b675 --- /dev/null +++ b/annotations_filtered/iz3ETniN1NI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.28], [19.0, 21.3], [22.0, 22.89], [23.0, 25.57], [27.0, 29.1], [31.0, 31.99], [43.0, 46.85], [47.0, 51.44], [53.0, 53.97], [56.0, 57.11], [58.0, 60.69], [62.0, 63.54], [74.0, 74.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 93.29, 0.0, 94.66, 95.91, 0.0, 100.0, 98.93, 0.0, 0.0, 99.93, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.28, 2.3, 0.89, 2.57, 2.1, 0.99, 3.85, 4.44, 0.97, 1.11, 2.69, 1.54, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/iz3l5GLSWJk_filtered.json b/annotations_filtered/iz3l5GLSWJk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5064681b72899dae5bdf0de8b0d071f3bfab2be3 --- /dev/null +++ b/annotations_filtered/iz3l5GLSWJk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.43], [4.0, 5.64], [7.0, 30.0], [30.0, 32.49], [35.0, 35.77], [56.0, 86.31], [87.0, 105.39], [107.0, 127.58], [129.0, 129.41]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [79.41, 0.0, 49.18, 80.46, 0.0, 0.0, 33.34, 32.89, 0.0], "audiomae_on_audioset": [null, null, [["music", 34.67], ["hum", 28.58], ["mains hum", 11.68]], null, null, null, [["hum", 35.64], ["music", 25.46], ["throbbing", 17.15]], [["music", 55.16], ["theremin", 9.77], ["didgeridoo", 7.13]], null], "duration": [2.43, 1.64, 23.0, 2.49, 0.77, 30.31, 18.39, 20.58, 0.41]} \ No newline at end of file diff --git a/annotations_filtered/izLhF-Oodrg_filtered.json b/annotations_filtered/izLhF-Oodrg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86c76a5d9d709ea9a8d7bac94b2432f81929fca4 --- /dev/null +++ b/annotations_filtered/izLhF-Oodrg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.12], [6.0, 8.67], [10.0, 13.04], [14.0, 16.39], [22.0, 23.57], [25.0, 25.68], [28.0, 27.68], [30.0, 30.32], [33.0, 36.02], [45.0, 46.2], [49.0, 48.96], [55.0, 55.68], [57.0, 57.13], [58.0, 59.24], [61.0, 61.92], [66.0, 67.1], [69.0, 71.41], [72.0, 72.0], [73.0, 73.4], [75.0, 76.22], [80.0, 82.19], [86.0, 86.83], [90.0, 91.18], [92.0, 93.45], [99.0, 101.12], [103.0, 103.64], [105.0, 108.58], [112.0, 113.44], [116.0, 119.3], [121.0, 123.9], [125.0, 128.07], [134.0, 140.9], [146.0, 149.08], [151.0, 152.1], [153.0, 154.97], [156.0, 160.37], [161.0, 160.96], [161.0, 165.91], [167.0, 174.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 68.8, 74.44, 73.36, 0.0, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 0.0, 0.0, 0.0, 78.89, 0.0, 0.0, 0.0, 78.38, 0.0, 74.92, 0.0, 76.04, 90.08, 82.43, 95.51, 83.7, 0.0, 0.0, 70.44, 0.0, 65.44, 80.82], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.12, 2.67, 3.04, 2.39, 1.57, 0.68, -0.32, 0.32, 3.02, 1.2, -0.04, 0.68, 0.13, 1.24, 0.92, 1.1, 2.41, 0.0, 0.4, 1.22, 2.19, 0.83, 1.18, 1.45, 2.12, 0.64, 3.58, 1.44, 3.3, 2.9, 3.07, 6.9, 3.08, 1.1, 1.97, 4.37, -0.04, 4.91, 7.51]} \ No newline at end of file diff --git a/annotations_filtered/izP8mDH8XOc_filtered.json b/annotations_filtered/izP8mDH8XOc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2edc67451d09ce229d078533995c7ae844c3e2e --- /dev/null +++ b/annotations_filtered/izP8mDH8XOc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.12], [4.0, 5.64], [7.0, 82.22], [83.0, 121.88], [125.0, 151.7], [152.0, 152.73], [156.0, 156.15], [160.0, 161.42]], "keep_status": [false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 28.95, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 20.62], ["hum", 16.04], ["mains hum", 12.24]], null, null, null], "duration": [0.12, 1.64, 75.22, 38.88, 26.7, 0.73, 0.15, 1.42]} \ No newline at end of file diff --git a/annotations_filtered/izWrKfUUP9o_filtered.json b/annotations_filtered/izWrKfUUP9o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..576c48adad1a481065163f48f667f6ad4110007f --- /dev/null +++ b/annotations_filtered/izWrKfUUP9o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.88], [20.0, 27.18], [31.0, 31.99], [35.0, 37.03], [43.0, 44.39], [47.0, 48.88], [52.0, 57.59], [72.0, 73.53], [78.0, 78.7], [81.0, 82.0], [98.0, 98.79], [101.0, 100.99], [107.0, 108.33], [110.0, 110.73], [112.0, 113.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.36, 30.98, 0.0, 30.06, 0.0, 0.0, 30.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 37.57], ["throbbing", 30.1], ["hum", 4.05]], [["music", 62.13], ["speech", 6.65], ["animal", 2.53]], null, [["music", 37.43], ["speech", 30.61], ["fart", 5.08]], null, null, [["music", 53.98], ["speech", 27.6], ["musical instrument", 3.4]], null, null, null, null, null, null, null, null], "duration": [3.88, 7.18, 0.99, 2.03, 1.39, 1.88, 5.59, 1.53, 0.7, 1.0, 0.79, -0.01, 1.33, 0.73, 1.21]} \ No newline at end of file diff --git a/annotations_filtered/izxDdUcC3Ag_filtered.json b/annotations_filtered/izxDdUcC3Ag_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d86d9588e5c53471a499645eb2559a73579384e5 --- /dev/null +++ b/annotations_filtered/izxDdUcC3Ag_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.15], [21.0, 22.71], [23.0, 23.57], [24.0, 44.58], [45.0, 45.57], [49.0, 64.57], [68.0, 69.25], [73.0, 82.16], [83.0, 88.55], [90.0, 108.62], [109.0, 110.0], [110.0, 111.23], [113.0, 120.11], [122.0, 132.9], [142.0, 142.3]], "keep_status": [false, false, false, false, false, true, false, true, true, true, false, false, true, true, false], "silence_prob": [30.18, 0.0, 0.0, 30.68, 0.0, 46.36, 0.0, 32.55, 40.04, 32.26, 0.0, 0.0, 31.84, 30.52, 0.0], "audiomae_on_audioset": [[["music", 73.21], ["speech", 8.73], ["screaming", 7.18]], null, null, [["music", 41.61], ["speech", 31.59], ["fart", 3.49]], null, [["mains hum", 28.2], ["music", 21.57], ["hum", 19.01]], null, [["music", 28.44], ["groan", 16.39], ["speech", 13.89]], [["music", 37.94], ["electric shaver, electric razor", 10.26], ["speech", 5.29]], [["music", 43.76], ["animal", 9.25], ["speech", 4.4]], null, null, [["whack, thwack", 45.47], ["music", 15.47], ["thunk", 7.73]], [["music", 35.32], ["buzz", 10.87], ["speech", 4.3]], null], "duration": [3.15, 1.71, 0.57, 20.58, 0.57, 15.57, 1.25, 9.16, 5.55, 18.62, 1.0, 1.23, 7.11, 10.9, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/izxkFm060yU_filtered.json b/annotations_filtered/izxkFm060yU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27a545fe8bc9b2ab973bfe8eca234259ce903f18 --- /dev/null +++ b/annotations_filtered/izxkFm060yU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.27], [8.0, 8.24], [13.0, 13.41], [14.0, 15.42], [25.0, 26.08], [31.0, 31.28], [32.0, 35.14], [37.0, 39.75], [40.0, 41.27], [42.0, 43.16], [44.0, 44.81], [46.0, 47.9], [49.0, 49.79], [51.0, 51.16], [52.0, 52.95], [54.0, 70.46], [88.0, 89.56], [91.0, 90.85], [95.0, 95.61], [101.0, 101.38], [108.0, 108.73], [110.0, 110.52], [111.0, 113.26], [114.0, 118.88]], "keep_status": [true, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [38.08, 0.0, 0.0, 0.0, 0.0, 0.0, 40.84, 43.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.16, 39.6], "audiomae_on_audioset": [[["music", 38.72], ["hum", 21.1], ["mains hum", 9.57]], null, null, null, null, null, [["music", 32.42], ["speech", 19.31], ["harp", 3.81]], [["speech", 32.51], ["music", 29.31], ["whale vocalization", 6.37]], null, null, null, null, null, null, null, [["music", 62.24], ["hum", 5.22], ["guitar", 4.96]], null, null, null, null, null, null, [["music", 47.12], ["speech", 12.73], ["guitar", 3.41]], [["music", 47.66], ["speech", 7.45], ["musical instrument", 5.42]]], "duration": [3.27, 0.24, 0.41, 1.42, 1.08, 0.28, 3.14, 2.75, 1.27, 1.16, 0.81, 1.9, 0.79, 0.16, 0.95, 16.46, 1.56, -0.15, 0.61, 0.38, 0.73, 0.52, 2.26, 4.88]} \ No newline at end of file