diff --git a/annotations_filtered/0-0MyjmphsA_filtered.json b/annotations_filtered/0-0MyjmphsA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09abfb7fd286811d5572378d867b24f23f646d3f --- /dev/null +++ b/annotations_filtered/0-0MyjmphsA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 29.22], [31.0, 31.62], [39.0, 49.87], [52.0, 66.21], [67.0, 79.44], [87.0, 87.57], [88.0, 88.74], [94.0, 93.93], [94.0, 93.97]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [34.68, 0.0, 31.74, 32.94, 98.36, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 62.3], ["crowd", 3.99], ["cheering", 3.84]], null, [["speech", 33.18], ["explosion", 20.64], ["artillery fire", 17.56]], [["explosion", 56.22], ["burst, pop", 15.34], ["speech", 7.0]], null, null, null, null, null], "duration": [5.22, 0.62, 10.87, 14.21, 12.44, 0.57, 0.74, -0.07, -0.03]} \ No newline at end of file diff --git a/annotations_filtered/0-81bpcuz44_filtered.json b/annotations_filtered/0-81bpcuz44_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f75b2fd0840254b3820f029c3d3d5b9c9f993e76 --- /dev/null +++ b/annotations_filtered/0-81bpcuz44_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.16], [5.0, 81.45], [85.0, 91.74], [94.0, 97.38], [101.0, 139.5], [140.0, 141.42], [142.0, 162.73]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 64.07, 40.93, 0.0, 0.0, 36.75], "audiomae_on_audioset": [null, null, null, [["music", 59.07], ["didgeridoo", 18.25], ["musical instrument", 7.92]], null, null, [["music", 76.76], ["boing", 5.26], ["didgeridoo", 3.37]]], "duration": [1.16, 76.45, 6.74, 3.38, 38.5, 1.42, 20.73]} \ No newline at end of file diff --git a/annotations_filtered/0-EcLwovpbU_filtered.json b/annotations_filtered/0-EcLwovpbU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4d4ab9697c22e6e0ab2666639b7fff64f4493e2 --- /dev/null +++ b/annotations_filtered/0-EcLwovpbU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 47.04], [48.0, 73.89], [75.0, 95.35], [97.0, 99.5], [100.0, 126.87]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 32.04, 30.73, 32.85, 32.24], "audiomae_on_audioset": [null, [["music", 72.36], ["didgeridoo", 7.21], ["musical instrument", 2.36]], [["music", 46.13], ["didgeridoo", 29.91], ["throbbing", 2.96]], [["music", 53.59], ["speech", 6.78], ["hum", 4.59]], [["hum", 55.11], ["throbbing", 20.92], ["mains hum", 8.2]]], "duration": [0.04, 25.89, 20.35, 2.5, 26.87]} \ No newline at end of file diff --git a/annotations_filtered/0-HM2VCdrC0_filtered.json b/annotations_filtered/0-HM2VCdrC0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b7345624a2e8b6530d21a3ae2ae2abb40e1cb9a --- /dev/null +++ b/annotations_filtered/0-HM2VCdrC0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.72], [13.0, 13.83], [23.0, 23.73], [30.0, 31.18], [32.0, 32.68], [33.0, 33.83], [50.0, 51.24], [53.0, 54.03], [59.0, 59.71], [60.0, 61.05], [68.0, 69.33], [72.0, 72.55], [75.0, 75.96], [82.0, 95.12], [96.0, 98.58], [99.0, 100.58], [104.0, 104.58], [108.0, 109.44], [111.0, 117.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.64, 91.98, 0.0, 0.0, 0.0, 96.04], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, 0.83, 0.73, 1.18, 0.68, 0.83, 1.24, 1.03, 0.71, 1.05, 1.33, 0.55, 0.96, 13.12, 2.58, 1.58, 0.58, 1.44, 6.71]} \ No newline at end of file diff --git a/annotations_filtered/0-Whu5Hlbz8_filtered.json b/annotations_filtered/0-Whu5Hlbz8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ed237ccbad1bb293a1639457c74abace44cb796 --- /dev/null +++ b/annotations_filtered/0-Whu5Hlbz8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.33], [22.0, 30.75], [31.0, 30.79], [33.0, 34.32], [36.0, 36.8], [39.0, 39.41], [40.0, 40.81], [42.0, 43.07], [45.0, 46.38], [48.0, 48.49], [51.0, 52.22], [53.0, 54.21], [57.0, 56.83], [57.0, 59.88], [60.0, 61.48], [64.0, 65.85], [69.0, 71.04], [72.0, 72.62], [74.0, 75.59], [77.0, 77.5], [79.0, 79.2], [80.0, 80.25], [81.0, 82.12], [83.0, 83.67], [84.0, 85.77], [88.0, 88.94], [90.0, 89.88], [92.0, 108.6], [109.0, 117.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 64.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 0.0, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.19, 47.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 68.71], ["fly, housefly", 4.16], ["explosion", 2.49]]], "duration": [0.33, 8.75, -0.21, 1.32, 0.8, 0.41, 0.81, 1.07, 1.38, 0.49, 1.22, 1.21, -0.17, 2.88, 1.48, 1.85, 2.04, 0.62, 1.59, 0.5, 0.2, 0.25, 1.12, 0.67, 1.77, 0.94, -0.12, 16.6, 8.73]} \ No newline at end of file diff --git a/annotations_filtered/0-lcqIuVaR8_filtered.json b/annotations_filtered/0-lcqIuVaR8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f14c2551230df6b35f5ee5f7063fbf3ec2177c6b --- /dev/null +++ b/annotations_filtered/0-lcqIuVaR8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.98], [5.0, 5.36], [6.0, 6.56], [11.0, 11.16], [20.0, 20.63], [22.0, 22.08], [27.0, 27.45], [28.0, 28.86], [45.0, 45.57], [47.0, 46.75], [55.0, 58.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["vehicle", 20.66], ["car", 13.55], ["noise", 7.39]]], "duration": [0.98, 0.36, 0.56, 0.16, 0.63, 0.08, 0.45, 0.86, 0.57, -0.25, 3.83]} \ No newline at end of file diff --git a/annotations_filtered/003kLKX8n3E_filtered.json b/annotations_filtered/003kLKX8n3E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..874dd3b54d5dbcfecaac8dc454d0c2d2077b229f --- /dev/null +++ b/annotations_filtered/003kLKX8n3E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.25], [4.0, 4.38], [5.0, 5.81], [6.0, 11.26], [12.0, 13.05], [14.0, 14.54], [16.0, 32.24], [33.0, 34.59], [37.0, 43.11], [46.0, 48.96], [55.0, 55.9], [57.0, 60.0], [60.0, 61.18], [62.0, 63.81], [66.0, 66.51], [68.0, 76.81], [77.0, 76.96], [77.0, 80.27], [81.0, 87.34], [89.0, 89.53], [90.0, 90.17], [91.0, 91.45], [92.0, 92.25], [93.0, 92.91], [94.0, 95.18], [96.0, 99.49], [100.0, 100.11], [100.0, 101.36], [102.0, 105.44], [106.0, 107.76], [109.0, 112.04], [113.0, 115.4], [117.0, 118.49], [120.0, 120.28], [121.0, 121.44], [122.0, 122.66], [123.0, 123.28], [125.0, 124.88], [125.0, 125.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 60.89, 0.0, 0.0, 40.68, 0.0, 58.13, 75.55, 0.0, 57.4, 0.0, 0.0, 0.0, 51.23, 0.0, 70.86, 53.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.43, 0.0, 0.0, 64.52, 0.0, 56.18, 56.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 64.46], ["didgeridoo", 8.5], ["musical instrument", 5.71]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.04], ["hum", 12.35], ["throbbing", 6.37]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.25, 0.38, 0.81, 5.26, 1.05, 0.54, 16.24, 1.59, 6.11, 2.96, 0.9, 3.0, 1.18, 1.81, 0.51, 8.81, -0.04, 3.27, 6.34, 0.53, 0.17, 0.45, 0.25, -0.09, 1.18, 3.49, 0.11, 1.36, 3.44, 1.76, 3.04, 2.4, 1.49, 0.28, 0.44, 0.66, 0.28, -0.12, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/009tNfQRd4o_filtered.json b/annotations_filtered/009tNfQRd4o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd4f1de1f2d77b4340aa4d854741ff38b2deb720 --- /dev/null +++ b/annotations_filtered/009tNfQRd4o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 17.39], [35.0, 35.51], [54.0, 54.58], [56.0, 56.1], [58.0, 58.48], [63.0, 64.3], [68.0, 68.76], [74.0, 73.84], [77.0, 76.72], [91.0, 90.61], [96.0, 96.09], [98.0, 97.97], [104.0, 104.55], [108.0, 108.28], [112.0, 113.44], [116.0, 116.41], [126.0, 128.97], [130.0, 131.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [32.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.26, 0.0], "audiomae_on_audioset": [[["music", 63.22], ["musical instrument", 6.87], ["clarinet", 4.07]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.69], ["didgeridoo", 8.81], ["theremin", 6.4]], null], "duration": [9.39, 0.51, 0.58, 0.1, 0.48, 1.3, 0.76, -0.16, -0.28, -0.39, 0.09, -0.03, 0.55, 0.28, 1.44, 0.41, 2.97, 1.58]} \ No newline at end of file diff --git a/annotations_filtered/00I2Ofraf4A_filtered.json b/annotations_filtered/00I2Ofraf4A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6df123e279367eff241e442e2cedb3038aae2ab0 --- /dev/null +++ b/annotations_filtered/00I2Ofraf4A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.25], [10.0, 21.51], [22.0, 22.4], [24.0, 24.7], [25.0, 30.84], [32.0, 33.93], [34.0, 35.92], [36.0, 37.25], [40.0, 42.47], [43.0, 47.21], [49.0, 50.43], [53.0, 57.7], [62.0, 62.43], [65.0, 75.15], [78.0, 82.0], [86.0, 92.55], [98.0, 98.39], [99.0, 99.98], [105.0, 106.22], [111.0, 113.86], [114.0, 122.94], [125.0, 140.32], [142.0, 142.25]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [41.2, 28.54, 0.0, 0.0, 35.62, 0.0, 0.0, 0.0, 54.36, 51.44, 0.0, 44.93, 0.0, 52.98, 55.11, 38.32, 0.0, 0.0, 0.0, 47.43, 39.94, 37.8, 0.0], "audiomae_on_audioset": [[["mechanical fan", 18.59], ["mains hum", 14.19], ["hum", 8.8]], [["music", 21.94], ["hum", 10.94], ["throbbing", 9.6]], null, null, [["sidetone", 40.89], ["speech", 37.8], ["music", 6.72]], null, null, null, null, null, null, [["sidetone", 43.6], ["speech", 20.46], ["hum", 6.8]], null, null, null, [["speech", 23.75], ["fly, housefly", 23.68], ["insect", 18.5]], null, null, null, [["speech", 20.82], ["hum", 18.78], ["rumble", 8.39]], [["speech", 64.62], ["music", 11.96], ["sidetone", 6.08]], [["speech", 56.82], ["hum", 16.89], ["sidetone", 7.17]], null], "duration": [2.25, 11.51, 0.4, 0.7, 5.84, 1.93, 1.92, 1.25, 2.47, 4.21, 1.43, 4.7, 0.43, 10.15, 4.0, 6.55, 0.39, 0.98, 1.22, 2.86, 8.94, 15.32, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/00QMS3Ldb20_filtered.json b/annotations_filtered/00QMS3Ldb20_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd3038db201e628e85e91f1bde4d7abd4f71f44a --- /dev/null +++ b/annotations_filtered/00QMS3Ldb20_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 57.5], [58.0, 59.88], [61.0, 64.22], [65.0, 65.91], [67.0, 70.65], [71.0, 73.95], [76.0, 105.14], [106.0, 136.36], [139.0, 156.24], [159.0, 203.03], [204.0, 204.42], [207.0, 209.16], [211.0, 215.13]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, true, false], "silence_prob": [29.2, 0.0, 29.97, 0.0, 29.52, 28.74, 28.53, 0.0, 28.74, 0.0, 0.0, 38.43, 33.42], "audiomae_on_audioset": [[["music", 53.55], ["speech", 21.69], ["hum", 4.38]], null, [["music", 25.39], ["hum", 17.56], ["mains hum", 16.62]], null, [["speech", 45.16], ["music", 44.0], ["musical instrument", 2.37]], [["throbbing", 30.63], ["music", 27.0], ["hum", 21.52]], [["music", 58.26], ["musical instrument", 11.4], ["effects unit", 2.72]], null, [["music", 46.43], ["mains hum", 17.38], ["hum", 5.1]], null, null, [["hum", 37.84], ["mains hum", 18.79], ["throbbing", 5.32]], [["hum", 45.32], ["mains hum", 18.49], ["throbbing", 9.37]]], "duration": [7.5, 1.88, 3.22, 0.91, 3.65, 2.95, 29.14, 30.36, 17.24, 44.03, 0.42, 2.16, 4.13]} \ No newline at end of file diff --git a/annotations_filtered/00rpUGdvcY0_filtered.json b/annotations_filtered/00rpUGdvcY0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ae0336c9c6c0715469ded48b6df95c7cf663cdc --- /dev/null +++ b/annotations_filtered/00rpUGdvcY0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 24.24], [28.0, 30.86], [38.0, 60.07], [61.0, 68.28], [73.0, 77.21], [78.0, 80.38], [88.0, 95.98], [97.0, 100.62]], "keep_status": [false, false, true, false, true, true, false, true], "silence_prob": [31.27, 30.37, 31.14, 31.47, 32.37, 30.23, 31.73, 36.17], "audiomae_on_audioset": [[["music", 63.73], ["smash, crash", 5.77], ["cacophony", 4.25]], [["music", 64.9], ["musical instrument", 5.34], ["smash, crash", 2.89]], [["music", 46.23], ["didgeridoo", 12.01], ["theremin", 10.29]], [["speech", 45.81], ["music", 21.66], ["thunk", 12.73]], [["music", 36.27], ["breaking", 16.28], ["smash, crash", 14.16]], [["music", 34.33], ["breaking", 27.74], ["crack", 4.61]], [["music", 55.63], ["hum", 10.76], ["mains hum", 4.77]], [["music", 51.15], ["fart", 6.72], ["musical instrument", 4.45]]], "duration": [14.24, 2.86, 22.07, 7.28, 4.21, 2.38, 7.98, 3.62]} \ No newline at end of file diff --git a/annotations_filtered/01ClRWyf9I4_filtered.json b/annotations_filtered/01ClRWyf9I4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7aa77b417f825a4fbf30e6763521fcc058a3bee2 --- /dev/null +++ b/annotations_filtered/01ClRWyf9I4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.0], [2.0, 2.79], [5.0, 12.55], [13.0, 18.15], [20.0, 27.84], [29.0, 30.69], [31.0, 31.41], [33.0, 43.26], [49.0, 66.55], [68.0, 71.74], [73.0, 80.43], [81.0, 84.55], [85.0, 92.4], [95.0, 100.79], [104.0, 107.86], [110.0, 110.88], [113.0, 114.18], [122.0, 133.86], [135.0, 136.63], [140.0, 142.37], [144.0, 147.16], [148.0, 150.03], [152.0, 154.04], [157.0, 157.81], [162.0, 165.55], [168.0, 184.4], [186.0, 201.11], [204.0, 209.68], [210.0, 232.68], [234.0, 239.87], [241.0, 253.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.65, 81.71, 99.31, 0.0, 0.0, 83.88, 40.95, 80.82, 91.64, 78.89, 87.19, 89.01, 92.97, 0.0, 0.0, 91.3, 0.0, 75.55, 91.64, 89.01, 93.6, 0.0, 94.81, 83.52, 56.93, 58.64, 39.05, 88.64, 92.64], "audiomae_on_audioset": [null, null, [["music", 72.43], ["plucked string instrument", 2.37], ["guitar", 2.31]], null, null, null, null, null, [["music", 57.53], ["theremin", 18.38], ["whale vocalization", 8.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 82.77], ["scary music", 3.53], ["theremin", 2.28]], null, null], "duration": [1.0, 0.79, 7.55, 5.15, 7.84, 1.69, 0.41, 10.26, 17.55, 3.74, 7.43, 3.55, 7.4, 5.79, 3.86, 0.88, 1.18, 11.86, 1.63, 2.37, 3.16, 2.03, 2.04, 0.81, 3.55, 16.4, 15.11, 5.68, 22.68, 5.87, 12.86]} \ No newline at end of file diff --git a/annotations_filtered/01OfrTMVeD8_filtered.json b/annotations_filtered/01OfrTMVeD8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3068501a9e3522b7cda2ca719f86b1b3b6b38e8 --- /dev/null +++ b/annotations_filtered/01OfrTMVeD8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.06], [6.0, 5.81], [7.0, 8.5], [11.0, 12.55], [14.0, 15.23], [17.0, 17.86], [19.0, 19.18], [20.0, 21.46], [23.0, 24.24], [25.0, 25.52], [27.0, 28.07], [31.0, 31.55], [33.0, 33.47], [36.0, 36.19], [38.0, 37.89], [39.0, 39.07], [41.0, 42.35], [43.0, 43.98], [45.0, 46.18], [48.0, 48.17], [49.0, 49.59], [51.0, 52.42], [53.0, 53.3], [54.0, 55.17], [58.0, 57.96], [60.0, 60.94], [64.0, 64.62], [66.0, 66.36], [68.0, 68.0], [70.0, 70.09], [72.0, 71.68], [74.0, 74.36], [78.0, 78.29], [80.0, 80.28], [83.0, 84.03], [85.0, 85.67], [87.0, 87.13], [89.0, 88.86], [91.0, 91.93], [94.0, 94.53], [96.0, 96.8], [97.0, 97.65], [102.0, 103.55], [105.0, 106.25], [107.0, 107.86], [109.0, 109.27], [110.0, 111.21], [113.0, 114.76], [117.0, 117.34], [119.0, 120.45], [121.0, 121.93], [124.0, 124.31], [126.0, 127.3], [128.0, 128.53], [130.0, 131.13], [134.0, 134.81], [135.0, 135.46], [137.0, 136.95], [140.0, 140.88], [144.0, 144.15], [147.0, 147.33], [152.0, 151.82], [153.0, 154.4], [162.0, 163.16], [164.0, 164.81], [165.0, 165.77], [167.0, 167.27], [169.0, 169.11], [170.0, 169.94], [172.0, 172.15], [174.0, 174.82], [175.0, 175.8], [178.0, 178.92], [180.0, 181.72], [183.0, 187.0], [188.0, 188.64], [191.0, 191.98], [194.0, 195.07], [196.0, 196.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.06, -0.19, 1.5, 1.55, 1.23, 0.86, 0.18, 1.46, 1.24, 0.52, 1.07, 0.55, 0.47, 0.19, -0.11, 0.07, 1.35, 0.98, 1.18, 0.17, 0.59, 1.42, 0.3, 1.17, -0.04, 0.94, 0.62, 0.36, 0.0, 0.09, -0.32, 0.36, 0.29, 0.28, 1.03, 0.67, 0.13, -0.14, 0.93, 0.53, 0.8, 0.65, 1.55, 1.25, 0.86, 0.27, 1.21, 1.76, 0.34, 1.45, 0.93, 0.31, 1.3, 0.53, 1.13, 0.81, 0.46, -0.05, 0.88, 0.15, 0.33, -0.18, 1.4, 1.16, 0.81, 0.77, 0.27, 0.11, -0.06, 0.15, 0.82, 0.8, 0.92, 1.72, 4.0, 0.64, 0.98, 1.07, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/01RWw-3AKaE_filtered.json b/annotations_filtered/01RWw-3AKaE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/01RWw-3AKaE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/01ZWXIY1mcs_filtered.json b/annotations_filtered/01ZWXIY1mcs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5b79802b3627aea8a78c5b108bba02d064d5e42 --- /dev/null +++ b/annotations_filtered/01ZWXIY1mcs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.75], [10.0, 10.69], [11.0, 29.0], [31.0, 31.83], [34.0, 43.8], [46.0, 90.88]], "keep_status": [false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 35.06, 0.0, 33.41, 0.0], "audiomae_on_audioset": [null, null, [["didgeridoo", 50.65], ["music", 12.04], ["throbbing", 6.76]], null, [["music", 47.13], ["gong", 20.76], ["timpani", 7.14]], null], "duration": [0.75, 0.69, 18.0, 0.83, 9.8, 44.88]} \ No newline at end of file diff --git a/annotations_filtered/01ovMSvDohw_filtered.json b/annotations_filtered/01ovMSvDohw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7d7cada691a5c3a9aeaf2c77b2b451948bf52ca --- /dev/null +++ b/annotations_filtered/01ovMSvDohw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 33.02], [35.0, 35.73], [36.0, 65.1], [65.0, 80.08], [81.0, 81.82], [82.0, 86.78], [88.0, 88.28], [89.0, 89.36], [90.0, 92.67], [94.0, 94.14], [94.0, 95.17], [96.0, 96.57], [98.0, 99.74], [102.0, 104.99]], "keep_status": [true, false, true, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [42.11, 0.0, 33.29, 34.92, 0.0, 37.06, 0.0, 0.0, 36.53, 0.0, 0.0, 0.0, 0.0, 51.82], "audiomae_on_audioset": [[["speech", 28.06], ["hum", 17.86], ["music", 9.98]], null, [["music", 48.39], ["speech", 10.94], ["buzz", 4.4]], [["speech", 57.0], ["music", 14.08], ["electric shaver, electric razor", 6.24]], null, [["speech", 20.12], ["hum", 6.43], ["horse", 5.42]], null, null, [["speech", 27.23], ["insect", 11.54], ["bee, wasp, etc.", 11.19]], null, null, null, null, null], "duration": [12.02, 0.73, 29.1, 15.08, 0.82, 4.78, 0.28, 0.36, 2.67, 0.14, 1.17, 0.57, 1.74, 2.99]} \ No newline at end of file diff --git a/annotations_filtered/01qhgR0WsnA_filtered.json b/annotations_filtered/01qhgR0WsnA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7aa6304f1fc33b212a59296f9a346d8afc9a5402 --- /dev/null +++ b/annotations_filtered/01qhgR0WsnA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 38.45], [38.0, 48.96], [52.0, 52.74], [55.0, 92.96], [97.0, 97.78], [100.0, 113.44], [116.0, 141.96]], "keep_status": [false, true, false, false, false, true, true], "silence_prob": [0.0, 32.06, 0.0, 0.0, 0.0, 31.08, 30.85], "audiomae_on_audioset": [null, [["music", 28.72], ["speech", 21.6], ["hum", 18.25]], null, null, null, [["speech", 29.02], ["buzz", 19.39], ["music", 16.9]], [["music", 28.64], ["throbbing", 10.14], ["hum", 9.47]]], "duration": [36.45, 10.96, 0.74, 37.96, 0.78, 13.44, 25.96]} \ No newline at end of file diff --git a/annotations_filtered/02064E1SHtQ_filtered.json b/annotations_filtered/02064E1SHtQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fa3f7cc9fb509a8d70b2bb8054aedb1bcdf781a --- /dev/null +++ b/annotations_filtered/02064E1SHtQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.08], [27.0, 28.63], [31.0, 31.82], [33.0, 34.69], [36.0, 37.05], [40.0, 41.44], [46.0, 48.88], [51.0, 90.36], [94.0, 95.2], [98.0, 98.9], [100.0, 103.47], [104.0, 105.33], [106.0, 106.3], [107.0, 108.77], [109.0, 110.86], [111.0, 115.84], [118.0, 126.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.36, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.98, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.08, 1.63, 0.82, 1.69, 1.05, 1.44, 2.88, 39.36, 1.2, 0.9, 3.47, 1.33, 0.3, 1.77, 1.86, 4.84, 8.4]} \ No newline at end of file diff --git a/annotations_filtered/029Mdp9jYiY_filtered.json b/annotations_filtered/029Mdp9jYiY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49c744263423fffa3453576bec867a950ae39621 --- /dev/null +++ b/annotations_filtered/029Mdp9jYiY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.91], [5.0, 12.24], [14.0, 15.04], [16.0, 16.9], [17.0, 20.87], [21.0, 22.18], [23.0, 26.62], [27.0, 31.65], [34.0, 34.25], [35.0, 36.0], [37.0, 38.18], [39.0, 39.29], [40.0, 42.55], [43.0, 53.43], [55.0, 56.3], [58.0, 65.31], [67.0, 69.67], [71.0, 72.33], [74.0, 80.82], [83.0, 83.39], [84.0, 85.82], [89.0, 89.85], [94.0, 98.25], [99.0, 118.13], [120.0, 133.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 96.04, 0.0, 0.0, 79.76, 0.0, 97.22, 98.99, 0.0, 0.0, 0.0, 0.0, 99.96, 96.77, 0.0, 99.82, 99.36, 0.0, 99.62, 0.0, 0.0, 0.0, 99.62, 91.98, 97.73], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.91, 7.24, 1.04, 0.9, 3.87, 1.18, 3.62, 4.65, 0.25, 1.0, 1.18, 0.29, 2.55, 10.43, 1.3, 7.31, 2.67, 1.33, 6.82, 0.39, 1.82, 0.85, 4.25, 19.13, 13.71]} \ No newline at end of file diff --git a/annotations_filtered/02A2a-aEvmI_filtered.json b/annotations_filtered/02A2a-aEvmI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db7da1e7bfcebe64c30dacd0bbd5642c8dd56900 --- /dev/null +++ b/annotations_filtered/02A2a-aEvmI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.1], [4.0, 4.33], [7.0, 7.33], [16.0, 17.19], [18.0, 18.35], [19.0, 20.8], [22.0, 22.52], [25.0, 28.24], [29.0, 30.43], [31.0, 31.77], [38.0, 43.04], [46.0, 46.63], [47.0, 48.98], [50.0, 49.89], [51.0, 51.58], [54.0, 54.7], [56.0, 55.8], [56.0, 55.98], [70.0, 72.27], [73.0, 73.08], [74.0, 74.61], [75.0, 74.66], [75.0, 75.37], [75.0, 75.57], [79.0, 79.86], [81.0, 80.59], [81.0, 80.65], [81.0, 81.89], [84.0, 84.06], [85.0, 85.01], [86.0, 88.37], [89.0, 88.87], [91.0, 90.81], [91.0, 94.68], [98.0, 98.14], [98.0, 98.17], [98.0, 99.72], [100.0, 101.9], [104.0, 104.46], [108.0, 108.72], [119.0, 119.23], [127.0, 128.43], [130.0, 132.31], [132.0, 132.53], [137.0, 138.79], [157.0, 157.52], [174.0, 174.33], [176.0, 177.13], [180.0, 180.47], [186.0, 186.56], [202.0, 202.04], [204.0, 204.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.78, 0.0, 0.0, 36.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.28, 0.0, 0.0, 31.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 66.46], ["effects unit", 8.58], ["distortion", 4.68]], null, null, [["hum", 37.08], ["mains hum", 24.71], ["music", 11.21]], null, null, null, null, null, null, null, [["music", 21.35], ["whale vocalization", 9.24], ["theremin", 7.88]], null, null, null, null, null, null, null, null, null, null, null, [["radio", 48.02], ["speech", 46.87], ["telephone", 0.95]], null, null, [["radio", 61.6], ["speech", 30.85], ["sidetone", 2.92]], null, null, null, null, null, null, null, null, [["radio", 49.37], ["speech", 39.15], ["sidetone", 6.91]], null, null, null, null, null, null, null, null, null], "duration": [0.1, 0.33, 0.33, 1.19, 0.35, 1.8, 0.52, 3.24, 1.43, 0.77, 5.04, 0.63, 1.98, -0.11, 0.58, 0.7, -0.2, -0.02, 2.27, 0.08, 0.61, -0.34, 0.37, 0.57, 0.86, -0.41, -0.35, 0.89, 0.06, 0.01, 2.37, -0.13, -0.19, 3.68, 0.14, 0.17, 1.72, 1.9, 0.46, 0.72, 0.23, 1.43, 2.31, 0.53, 1.79, 0.52, 0.33, 1.13, 0.47, 0.56, 0.04, 0.2]} \ No newline at end of file diff --git a/annotations_filtered/02AyhONR_DQ_filtered.json b/annotations_filtered/02AyhONR_DQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec3c95032f54146d85087db81e27881cd3a342d1 --- /dev/null +++ b/annotations_filtered/02AyhONR_DQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.04], [7.0, 7.37], [8.0, 8.41], [15.0, 20.33], [28.0, 27.99], [32.0, 32.71], [35.0, 35.46], [37.0, 38.15], [38.0, 40.34], [43.0, 44.59], [45.0, 46.36], [51.0, 58.24], [60.0, 76.01], [76.0, 76.45], [77.0, 100.4], [105.0, 106.52], [113.0, 113.71], [115.0, 115.94], [118.0, 118.44], [119.0, 121.54]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 35.1, 0.0, 0.0, 0.0, 0.0, 42.06, 0.0, 0.0, 42.74, 39.05, 0.0, 31.44, 0.0, 0.0, 0.0, 0.0, 41.36], "audiomae_on_audioset": [null, null, null, [["speech", 47.38], ["music", 24.17], ["animal", 8.14]], null, null, null, null, [["music", 28.5], ["burping, eructation", 22.16], ["effects unit", 14.45]], null, null, [["animal", 38.69], ["music", 23.98], ["dog", 9.46]], [["animal", 24.79], ["ding", 10.85], ["music", 10.73]], null, [["music", 67.66], ["electronic music", 5.3], ["boing", 5.22]], null, null, null, null, [["music", 38.73], ["musical instrument", 6.99], ["effects unit", 6.34]]], "duration": [0.04, 0.37, 0.41, 5.33, -0.01, 0.71, 0.46, 1.15, 2.34, 1.59, 1.36, 7.24, 16.01, 0.45, 23.4, 1.52, 0.71, 0.94, 0.44, 2.54]} \ No newline at end of file diff --git a/annotations_filtered/02DzpeBF4es_filtered.json b/annotations_filtered/02DzpeBF4es_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..534e61aee10a872e4dad382bd01fffb5298c22fe --- /dev/null +++ b/annotations_filtered/02DzpeBF4es_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.16], [4.0, 5.34], [7.0, 7.25], [9.0, 9.73], [13.0, 13.31], [20.0, 21.22], [23.0, 23.65], [25.0, 25.54], [26.0, 26.74], [28.0, 31.56], [32.0, 32.88], [36.0, 36.69], [40.0, 42.33], [48.0, 48.24], [55.0, 56.79], [65.0, 64.91], [66.0, 67.49], [71.0, 71.47], [79.0, 80.7], [84.0, 85.7], [86.0, 92.48], [97.0, 98.37], [101.0, 101.29], [105.0, 106.2], [108.0, 108.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.2, 0.0, 0.0, 85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.52, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 1.34, 0.25, 0.73, 0.31, 1.22, 0.65, 0.54, 0.74, 3.56, 0.88, 0.69, 2.33, 0.24, 1.79, -0.09, 1.49, 0.47, 1.7, 1.7, 6.48, 1.37, 0.29, 1.2, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/02Or-Hx3yqc_filtered.json b/annotations_filtered/02Or-Hx3yqc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f08e073c95b50b4945a14192a91af76417224a0 --- /dev/null +++ b/annotations_filtered/02Or-Hx3yqc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.22], [10.0, 14.27], [15.0, 17.9], [21.0, 21.09], [22.0, 23.67], [26.0, 26.69], [31.0, 31.06], [52.0, 53.22], [57.0, 57.97], [63.0, 76.08], [79.0, 81.58], [83.0, 83.86], [86.0, 98.54], [99.0, 100.62], [101.0, 105.75], [106.0, 109.53], [110.0, 113.27], [114.0, 115.77], [117.0, 117.96], [119.0, 119.8], [120.0, 125.96], [126.0, 126.98]], "keep_status": [false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.5, 30.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.62, 36.17, 0.0, 55.46, 0.0, 59.42, 57.97, 76.37, 0.0, 0.0, 0.0, 46.54, 0.0], "audiomae_on_audioset": [null, [["speech", 49.9], ["music", 13.08], ["hum", 6.32]], [["music", 32.64], ["speech", 12.52], ["bow-wow", 4.51]], null, null, null, null, null, null, [["mains hum", 52.12], ["hum", 21.12], ["speech", 12.05]], [["fart", 17.55], ["music", 11.33], ["creak", 7.07]], null, null, null, null, null, null, null, null, null, [["speech", 56.14], ["mains hum", 10.2], ["telephone", 7.34]], null], "duration": [0.22, 4.27, 2.9, 0.09, 1.67, 0.69, 0.06, 1.22, 0.97, 13.08, 2.58, 0.86, 12.54, 1.62, 4.75, 3.53, 3.27, 1.77, 0.96, 0.8, 5.96, 0.98]} \ No newline at end of file diff --git a/annotations_filtered/03L12Mqkzg8_filtered.json b/annotations_filtered/03L12Mqkzg8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b47e9a8c47a6ab852d9dcae01ec03ff3caf2df1f --- /dev/null +++ b/annotations_filtered/03L12Mqkzg8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 20.16], [23.0, 29.93], [31.0, 32.36], [34.0, 38.26], [39.0, 40.51], [41.0, 56.47], [59.0, 60.39], [62.0, 62.67], [65.0, 64.74], [66.0, 82.46], [84.0, 84.25], [86.0, 87.1], [88.0, 93.85], [96.0, 106.32], [107.0, 108.23], [110.0, 111.89], [115.0, 117.42]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.81, 99.98, 0.0, 48.95, 0.0, 39.12, 0.0, 0.0, 0.0, 33.05, 0.0, 0.0, 44.63, 32.7, 0.0, 0.0, 36.34], "audiomae_on_audioset": [null, null, null, [["music", 33.34], ["speech", 23.71], ["musical instrument", 7.33]], null, [["music", 51.48], ["speech", 7.18], ["musical instrument", 5.96]], null, null, null, [["music", 37.94], ["synthesizer", 28.54], ["hum", 7.21]], null, null, [["music", 65.44], ["synthesizer", 9.84], ["drum machine", 6.67]], [["music", 64.75], ["speech", 9.08], ["throbbing", 3.92]], null, null, [["hum", 32.7], ["mains hum", 25.97], ["music", 13.33]]], "duration": [2.16, 6.93, 1.36, 4.26, 1.51, 15.47, 1.39, 0.67, -0.26, 16.46, 0.25, 1.1, 5.85, 10.32, 1.23, 1.89, 2.42]} \ No newline at end of file diff --git a/annotations_filtered/03NoI9KiZOk_filtered.json b/annotations_filtered/03NoI9KiZOk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..798f30fdd09ad0ee6997faf7bad7b8c5d3a7a9b6 --- /dev/null +++ b/annotations_filtered/03NoI9KiZOk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.86], [9.0, 10.13], [13.0, 14.39], [16.0, 22.18], [26.0, 31.78], [32.0, 34.7], [35.0, 36.15], [36.0, 37.07], [38.0, 39.24], [40.0, 43.01], [45.0, 45.12], [48.0, 48.71], [50.0, 50.48], [52.0, 52.79], [59.0, 62.23], [65.0, 65.75], [73.0, 74.06], [77.0, 76.77], [80.0, 84.38], [86.0, 87.34], [88.0, 91.54], [96.0, 97.06], [99.0, 100.31], [102.0, 102.42], [105.0, 105.7], [107.0, 107.6], [110.0, 110.76], [115.0, 119.2], [119.0, 119.35], [119.0, 119.45], [120.0, 119.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 98.73, 99.94, 0.0, 0.0, 0.0, 97.73, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 81.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.91, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.86, 1.13, 1.39, 6.18, 5.78, 2.7, 1.15, 1.07, 1.24, 3.01, 0.12, 0.71, 0.48, 0.79, 3.23, 0.75, 1.06, -0.23, 4.38, 1.34, 3.54, 1.06, 1.31, 0.42, 0.7, 0.6, 0.76, 4.2, 0.35, 0.45, -0.3]} \ No newline at end of file diff --git a/annotations_filtered/03QHVB_n6N8_filtered.json b/annotations_filtered/03QHVB_n6N8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73d959f43fb115c7f5ea8b169cb7e0fcd71e5f21 --- /dev/null +++ b/annotations_filtered/03QHVB_n6N8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.7], [5.0, 5.64], [7.0, 7.21], [8.0, 8.68], [10.0, 11.35], [15.0, 15.01], [24.0, 25.56], [50.0, 49.91], [51.0, 51.31], [52.0, 52.98], [61.0, 61.87], [62.0, 63.58], [65.0, 66.87], [71.0, 74.33], [79.0, 84.1], [101.0, 104.43], [108.0, 107.81], [110.0, 109.76], [113.0, 115.79], [117.0, 117.49], [118.0, 119.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.4, 44.29, 57.17, 0.0, 0.0, 50.56, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 31.33], ["livestock, farm animals, working animals", 8.76], ["honk", 8.07]], [["music", 51.62], ["didgeridoo", 14.47], ["speech", 10.27]], null, null, null, null, null, null], "duration": [0.7, 0.64, 0.21, 0.68, 1.35, 0.01, 1.56, -0.09, 0.31, 0.98, 0.87, 1.58, 1.87, 3.33, 5.1, 3.43, -0.19, -0.24, 2.79, 0.49, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/03Rl5exupSo_filtered.json b/annotations_filtered/03Rl5exupSo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..deb51660d3badf6a2c1eec16b520359bc103663c --- /dev/null +++ b/annotations_filtered/03Rl5exupSo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 15.03], [16.0, 17.36], [18.0, 19.06], [20.0, 20.87], [24.0, 27.9], [29.0, 30.2], [32.0, 32.14], [37.0, 37.64], [41.0, 40.95], [47.0, 46.85], [48.0, 48.07], [49.0, 49.4], [49.0, 49.45], [64.0, 64.03], [65.0, 65.06], [67.0, 66.87], [68.0, 69.13], [70.0, 71.15], [77.0, 77.01], [78.0, 79.56], [80.0, 80.52], [82.0, 83.03], [86.0, 86.53], [88.0, 88.84], [100.0, 101.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [44.96, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 81.87], ["music", 4.05], ["electric shaver, electric razor", 1.46]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [11.03, 1.36, 1.06, 0.87, 3.9, 1.2, 0.14, 0.64, -0.05, -0.15, 0.07, 0.4, 0.45, 0.03, 0.06, -0.13, 1.13, 1.15, 0.01, 1.56, 0.52, 1.03, 0.53, 0.84, 1.92]} \ No newline at end of file diff --git a/annotations_filtered/03WbdaZCGAA_filtered.json b/annotations_filtered/03WbdaZCGAA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25194b1a59511da1b916b2e91ec32a9b52b9956a --- /dev/null +++ b/annotations_filtered/03WbdaZCGAA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.5], [8.0, 31.95], [33.0, 34.21], [37.0, 49.27], [57.0, 57.28], [58.0, 57.87], [59.0, 67.31], [69.0, 69.25], [72.0, 78.0], [78.0, 78.73], [80.0, 80.01]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 29.55, 0.0, 28.64, 0.0, 0.0, 29.84, 0.0, 28.52, 0.0, 0.0], "audiomae_on_audioset": [null, [["mains hum", 63.04], ["hum", 25.08], ["throbbing", 3.14]], null, [["burst, pop", 22.31], ["explosion", 19.99], ["fireworks", 10.51]], null, null, [["explosion", 35.26], ["speech", 24.99], ["burst, pop", 10.63]], null, [["music", 16.66], ["livestock, farm animals, working animals", 13.5], ["speech", 9.63]], null, null], "duration": [0.5, 23.95, 1.21, 12.27, 0.28, -0.13, 8.31, 0.25, 6.0, 0.73, 0.01]} \ No newline at end of file diff --git a/annotations_filtered/03a-vG6wHDI_filtered.json b/annotations_filtered/03a-vG6wHDI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3ac1c572c3c23b62496cb22a068a74963df6959 --- /dev/null +++ b/annotations_filtered/03a-vG6wHDI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.1], [9.0, 11.16], [12.0, 12.75], [20.0, 21.59], [25.0, 26.08], [26.0, 28.32], [30.0, 30.64], [31.0, 33.56], [35.0, 37.62], [41.0, 42.13], [42.0, 43.14], [43.0, 45.5], [63.0, 83.4], [84.0, 90.26], [92.0, 92.53], [96.0, 96.65], [100.0, 106.81], [113.0, 113.64], [116.0, 116.88], [126.0, 127.47], [134.0, 137.64], [141.0, 142.67], [144.0, 146.8], [148.0, 148.81], [151.0, 151.8], [154.0, 154.75], [159.0, 159.65], [162.0, 164.78], [168.0, 168.4], [171.0, 171.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.67, 0.0, 0.0, 0.0, 53.04, 0.0, 45.78, 89.54, 0.0, 0.0, 56.63, 38.7, 99.93, 0.0, 0.0, 39.78, 0.0, 0.0, 0.0, 81.71, 0.0, 32.03, 0.0, 0.0, 0.0, 0.0, 34.61, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 40.69], ["radio", 29.94], ["scratching (performance technique)", 8.77]], null, null, null, null, null, [["speech", 43.77], ["telephone", 30.2], ["inside, small room", 4.83]], null, null, null, null, [["hum", 46.6], ["mains hum", 10.66], ["throbbing", 5.62]], null, null, null, [["speech", 49.61], ["sidetone", 23.54], ["noise", 4.92]], null, null, null, null, null, [["speech", 68.88], ["thunk", 5.52], ["telephone", 2.75]], null, null, null, null, [["speech", 81.1], ["telephone", 4.22], ["busy signal", 2.94]], null, null], "duration": [0.1, 2.16, 0.75, 1.59, 1.08, 2.32, 0.64, 2.56, 2.62, 1.13, 1.14, 2.5, 20.4, 6.26, 0.53, 0.65, 6.81, 0.64, 0.88, 1.47, 3.64, 1.67, 2.8, 0.81, 0.8, 0.75, 0.65, 2.78, 0.4, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/03jGqiF-0Gg_filtered.json b/annotations_filtered/03jGqiF-0Gg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8b86eaf58a5148e20921cc3fb469ede5575284d --- /dev/null +++ b/annotations_filtered/03jGqiF-0Gg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.4], [6.0, 9.34], [11.0, 16.11], [17.0, 18.6], [21.0, 23.14], [24.0, 25.39], [26.0, 29.05], [33.0, 33.07], [37.0, 37.5], [52.0, 58.02]], "keep_status": [false, true, true, false, true, false, true, false, false, true], "silence_prob": [64.63, 40.26, 46.54, 0.0, 48.91, 0.0, 49.4, 0.0, 0.0, 37.85], "audiomae_on_audioset": [null, [["sidetone", 37.46], ["music", 10.98], ["speech", 10.23]], [["fly, housefly", 26.41], ["insect", 13.93], ["hum", 9.34]], null, [["music", 24.91], ["hum", 12.38], ["throbbing", 6.21]], null, [["hum", 25.63], ["music", 12.27], ["throbbing", 6.23]], null, null, [["mains hum", 23.56], ["hum", 15.96], ["noise", 12.73]]], "duration": [2.4, 3.34, 5.11, 1.6, 2.14, 1.39, 3.05, 0.07, 0.5, 6.02]} \ No newline at end of file diff --git a/annotations_filtered/03uEq5dKcFs_filtered.json b/annotations_filtered/03uEq5dKcFs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad2599b8de1eb9e3e75038b7c243667c15ef68e4 --- /dev/null +++ b/annotations_filtered/03uEq5dKcFs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.47], [15.0, 15.3], [19.0, 27.03], [32.0, 33.52], [34.0, 33.81], [34.0, 34.92], [36.0, 36.19], [38.0, 38.37], [39.0, 39.77], [41.0, 42.13], [47.0, 47.92], [49.0, 49.55], [50.0, 51.26], [52.0, 52.42], [54.0, 53.94], [56.0, 58.01], [59.0, 59.12], [65.0, 65.38], [69.0, 70.78], [73.0, 75.1], [78.0, 78.04], [87.0, 87.03], [89.0, 91.1], [93.0, 93.72], [100.0, 100.38], [106.0, 106.3], [116.0, 118.18], [123.0, 123.87], [125.0, 125.24], [126.0, 144.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 97.54, 0.0, 0.0, 0.0, 99.85, 0.0, 0.0, 92.8], "audiomae_on_audioset": [null, null, [["speech", 90.01], ["radio", 1.0], ["inside, small room", 0.9]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 0.3, 8.03, 1.52, -0.19, 0.92, 0.19, 0.37, 0.77, 1.13, 0.92, 0.55, 1.26, 0.42, -0.06, 2.01, 0.12, 0.38, 1.78, 2.1, 0.04, 0.03, 2.1, 0.72, 0.38, 0.3, 2.18, 0.87, 0.24, 18.0]} \ No newline at end of file diff --git a/annotations_filtered/049R_wOazQI_filtered.json b/annotations_filtered/049R_wOazQI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..547a683cd7c203553a95cbbc29ed8c413697ec2b --- /dev/null +++ b/annotations_filtered/049R_wOazQI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 16.19], [17.0, 17.27], [19.0, 21.86], [23.0, 24.04], [27.0, 27.92], [29.0, 29.62], [30.0, 33.56], [35.0, 35.75], [37.0, 61.16], [62.0, 62.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [63.42, 0.0, 98.01, 0.0, 0.0, 0.0, 100.0, 0.0, 80.46, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [9.19, 0.27, 2.86, 1.04, 0.92, 0.62, 3.56, 0.75, 24.16, 0.26]} \ No newline at end of file diff --git a/annotations_filtered/04BZh6E-Nck_filtered.json b/annotations_filtered/04BZh6E-Nck_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4affe94653dc379d934772c0a3e933f38eaddcb --- /dev/null +++ b/annotations_filtered/04BZh6E-Nck_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.87], [8.0, 9.31], [15.0, 15.6], [17.0, 18.54], [21.0, 21.68], [23.0, 47.9], [50.0, 50.38], [60.0, 62.26], [63.0, 64.47], [65.0, 66.8], [68.0, 77.09], [80.0, 94.54], [96.0, 100.43], [101.0, 101.9], [110.0, 125.56], [126.0, 127.06], [128.0, 136.44], [150.0, 149.67], [153.0, 154.43]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 29.01, 0.0, 45.27, 0.0, 0.0, 28.97, 32.2, 52.45, 0.0, 29.77, 0.0, 29.82, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 38.43], ["music", 17.54], ["mains hum", 6.22]], null, [["music", 78.38], ["video game music", 3.01], ["soundtrack music", 2.47]], null, null, [["music", 62.46], ["synthesizer", 8.26], ["musical instrument", 2.95]], [["throbbing", 43.91], ["hum", 24.76], ["music", 22.28]], null, null, [["music", 53.11], ["speech", 14.69], ["throbbing", 9.0]], null, [["cattle, bovinae", 22.69], ["livestock, farm animals, working animals", 21.94], ["music", 15.8]], null, null], "duration": [0.87, 1.31, 0.6, 1.54, 0.68, 24.9, 0.38, 2.26, 1.47, 1.8, 9.09, 14.54, 4.43, 0.9, 15.56, 1.06, 8.44, -0.33, 1.43]} \ No newline at end of file diff --git a/annotations_filtered/04s96zDt1RE_filtered.json b/annotations_filtered/04s96zDt1RE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e11539c893c6927987968c9b66f0c30e25160a1 --- /dev/null +++ b/annotations_filtered/04s96zDt1RE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.1], [5.0, 6.78], [9.0, 10.17], [11.0, 12.77], [15.0, 14.96], [16.0, 17.29], [19.0, 19.48], [20.0, 40.98], [43.0, 51.68], [53.0, 63.63], [66.0, 82.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.21, 98.99, 63.42, 35.94], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 41.05], ["hum", 17.51], ["throbbing", 12.6]]], "duration": [2.1, 1.78, 1.17, 1.77, -0.04, 1.29, 0.48, 20.98, 8.68, 10.63, 16.36]} \ No newline at end of file diff --git a/annotations_filtered/04uN57jOg-Q_filtered.json b/annotations_filtered/04uN57jOg-Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a74e8f0afa4bd1de29e995537c0e4192785e243 --- /dev/null +++ b/annotations_filtered/04uN57jOg-Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.74], [11.0, 12.39], [13.0, 13.0], [14.0, 14.86], [21.0, 21.69], [29.0, 30.16], [43.0, 43.9], [45.0, 44.59], [45.0, 46.25], [73.0, 74.73], [83.0, 86.44], [96.0, 109.31], [112.0, 113.58], [124.0, 125.79], [130.0, 131.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.98, 89.01, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.74, 1.39, 0.0, 0.86, 0.69, 1.16, 0.9, -0.41, 1.25, 1.73, 3.44, 13.31, 1.58, 1.79, 1.85]} \ No newline at end of file diff --git a/annotations_filtered/04xSMg03sZ0_filtered.json b/annotations_filtered/04xSMg03sZ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6acf2d8cb55a7d9f7a8f9f011f402720a7d5e872 --- /dev/null +++ b/annotations_filtered/04xSMg03sZ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.26], [8.0, 8.29], [11.0, 13.73], [18.0, 25.91], [31.0, 32.29], [33.0, 34.18], [36.0, 46.14], [47.0, 49.3], [51.0, 51.09], [54.0, 55.32], [57.0, 58.13], [59.0, 60.37], [61.0, 61.77], [62.0, 68.47], [70.0, 72.4], [80.0, 82.66], [92.0, 94.31], [96.0, 99.4], [103.0, 104.38], [105.0, 105.33], [108.0, 108.01], [114.0, 114.13], [117.0, 118.29], [122.0, 121.64], [123.0, 122.61], [126.0, 127.92], [132.0, 132.87]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [44.99, 0.0, 41.62, 61.47, 0.0, 0.0, 51.39, 67.89, 0.0, 0.0, 0.0, 0.0, 0.0, 56.4, 61.77, 31.32, 41.34, 34.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 47.85], ["speech", 14.12], ["hum", 8.75]], null, [["speech", 16.31], ["radio", 7.13], ["boing", 6.6]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.43], ["speech", 32.67], ["musical instrument", 3.04]], [["music", 45.38], ["breaking", 27.09], ["glass", 12.11]], [["music", 54.27], ["synthesizer", 12.56], ["speech", 9.18]], null, null, null, null, null, null, null, null, null], "duration": [3.26, 0.29, 2.73, 7.91, 1.29, 1.18, 10.14, 2.3, 0.09, 1.32, 1.13, 1.37, 0.77, 6.47, 2.4, 2.66, 2.31, 3.4, 1.38, 0.33, 0.01, 0.13, 1.29, -0.36, -0.39, 1.92, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/04zHzVrubHk_filtered.json b/annotations_filtered/04zHzVrubHk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..786b2b718de6844214267795a53e27228ebdd678 --- /dev/null +++ b/annotations_filtered/04zHzVrubHk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 48.32], [48.0, 51.92], [53.0, 55.36], [57.0, 58.06], [60.0, 60.88], [62.0, 64.62], [71.0, 72.86], [75.0, 76.74], [77.0, 78.73], [82.0, 82.44], [84.0, 86.61], [88.0, 115.79], [117.0, 118.17], [119.0, 119.64], [121.0, 128.06], [128.0, 130.45], [133.0, 140.44]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [40.16, 35.16, 34.03, 0.0, 0.0, 77.7, 0.0, 0.0, 0.0, 0.0, 85.72, 50.81, 0.0, 0.0, 43.79, 34.15, 43.96], "audiomae_on_audioset": [[["hum", 27.26], ["mains hum", 16.03], ["fly, housefly", 11.92]], [["sidetone", 88.18], ["speech", 4.39], ["music", 2.84]], [["speech", 67.32], ["radio", 12.87], ["shuffling cards", 3.56]], null, null, null, null, null, null, null, null, null, null, null, [["echo", 36.12], ["hum", 8.59], ["fart", 7.84]], [["didgeridoo", 17.74], ["music", 14.5], ["theremin", 8.22]], [["music", 45.07], ["sonar", 12.15], ["synthesizer", 10.98]]], "duration": [20.32, 3.92, 2.36, 1.06, 0.88, 2.62, 1.86, 1.74, 1.73, 0.44, 2.61, 27.79, 1.17, 0.64, 7.06, 2.45, 7.44]} \ No newline at end of file diff --git a/annotations_filtered/05-e-YTw4r8_filtered.json b/annotations_filtered/05-e-YTw4r8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a92af022a71e05b848d798b707fba75fca8752cc --- /dev/null +++ b/annotations_filtered/05-e-YTw4r8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.91], [20.0, 20.85], [22.0, 21.81], [23.0, 24.58], [26.0, 27.9], [29.0, 32.61], [33.0, 37.15], [39.0, 42.01], [43.0, 43.65], [44.0, 62.04], [63.0, 64.64], [66.0, 66.38], [69.0, 69.09], [73.0, 75.74], [77.0, 78.83], [85.0, 85.73], [90.0, 92.87], [97.0, 98.04], [101.0, 101.53], [106.0, 116.06], [117.0, 118.12], [119.0, 125.44], [126.0, 129.47]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 55.67, 95.64, 79.24, 0.0, 43.4, 0.0, 0.0, 0.0, 61.27, 0.0, 0.0, 48.78, 0.0, 0.0, 49.4, 0.0, 50.36, 55.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["vehicle", 19.42], ["car", 18.72], ["race car, auto racing", 8.22]], null, null, null, null, null, null, [["eruption", 16.38], ["hum", 15.3], ["gong", 10.61]], null, null, [["sidetone", 62.19], ["hum", 6.88], ["speech", 6.44]], null, null, null], "duration": [0.91, 0.85, -0.19, 1.58, 1.9, 3.61, 4.15, 3.01, 0.65, 18.04, 1.64, 0.38, 0.09, 2.74, 1.83, 0.73, 2.87, 1.04, 0.53, 10.06, 1.12, 6.44, 3.47]} \ No newline at end of file diff --git a/annotations_filtered/056HlHORCIU_filtered.json b/annotations_filtered/056HlHORCIU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7ef615d6de9348828f9dfb0ba6dabb7308f1525 --- /dev/null +++ b/annotations_filtered/056HlHORCIU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.02], [4.0, 4.58], [7.0, 7.89], [9.0, 10.69], [11.0, 20.46], [21.0, 21.61], [24.0, 28.38], [29.0, 29.3], [32.0, 37.32], [38.0, 48.74]], "keep_status": [false, false, false, false, true, false, true, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.1, 0.0, 30.59, 0.0, 29.99, 29.66], "audiomae_on_audioset": [null, null, null, null, [["hum", 23.75], ["speech", 21.77], ["mains hum", 14.05]], null, [["music", 49.09], ["buzz", 7.38], ["noise", 4.81]], null, [["music", 14.84], ["cacophony", 12.98], ["synthesizer", 10.44]], [["buzz", 32.4], ["vehicle", 14.19], ["music", 7.63]]], "duration": [1.02, 0.58, 0.89, 1.69, 9.46, 0.61, 4.38, 0.3, 5.32, 10.74]} \ No newline at end of file diff --git a/annotations_filtered/05O77oX6bQE_filtered.json b/annotations_filtered/05O77oX6bQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..285fe4eca836f3060cab02a977d6ff45cd5d707f --- /dev/null +++ b/annotations_filtered/05O77oX6bQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.65], [20.0, 20.83], [24.0, 24.06], [67.0, 67.2], [110.0, 117.75], [120.0, 122.94], [124.0, 125.22], [129.0, 130.72], [132.0, 135.9], [137.0, 139.19], [143.0, 155.83]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.98, 96.66, 0.0, 0.0, 80.64, 93.45, 55.89], "audiomae_on_audioset": [null, null, null, null, [["speech", 10.02], ["crowd", 9.26], ["livestock, farm animals, working animals", 6.91]], null, null, null, null, null, null], "duration": [0.65, 0.83, 0.06, 0.2, 7.75, 2.94, 1.22, 1.72, 3.9, 2.19, 12.83]} \ No newline at end of file diff --git a/annotations_filtered/05foBuX_brU_filtered.json b/annotations_filtered/05foBuX_brU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed002d9c4baaa5e71e6325b96e26e66c3573f8f5 --- /dev/null +++ b/annotations_filtered/05foBuX_brU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.48], [13.0, 13.9], [18.0, 18.18], [19.0, 20.09], [20.0, 20.58], [26.0, 26.05], [32.0, 33.03], [34.0, 34.7], [36.0, 36.71], [42.0, 42.57], [43.0, 44.56], [45.0, 46.14], [46.0, 46.7], [65.0, 66.43], [71.0, 72.0], [73.0, 72.96], [75.0, 76.3], [83.0, 82.88], [84.0, 85.04], [86.0, 86.19], [86.0, 86.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 0.9, 0.18, 1.09, 0.58, 0.05, 1.03, 0.7, 0.71, 0.57, 1.56, 1.14, 0.7, 1.43, 1.0, -0.04, 1.3, -0.12, 1.04, 0.19, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/05nQ6FtAaYg_filtered.json b/annotations_filtered/05nQ6FtAaYg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b699f51fcccf50c312f5c60b4b1a97c90a340933 --- /dev/null +++ b/annotations_filtered/05nQ6FtAaYg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.17], [25.0, 24.81], [25.0, 26.05], [27.0, 28.09], [33.0, 33.94], [41.0, 44.44], [46.0, 46.82]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.54, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 75.78], ["musical instrument", 5.3], ["theremin", 2.98]], null], "duration": [0.17, -0.19, 1.05, 1.09, 0.94, 3.44, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/05qid4p_cfw_filtered.json b/annotations_filtered/05qid4p_cfw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fbc3dd4dfa01ae381bf0650f237b1c65a15522e --- /dev/null +++ b/annotations_filtered/05qid4p_cfw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.36], [10.0, 10.23], [12.0, 11.97], [15.0, 16.04], [17.0, 18.57], [21.0, 21.84], [24.0, 26.06], [31.0, 32.93], [38.0, 39.16], [51.0, 51.12], [79.0, 79.57], [89.0, 90.59], [107.0, 106.79], [109.0, 110.4], [136.0, 137.19], [147.0, 148.07], [151.0, 156.1], [160.0, 162.19], [164.0, 168.12], [181.0, 183.51], [184.0, 185.52], [187.0, 192.06], [197.0, 198.56], [202.0, 203.77], [213.0, 212.8], [215.0, 215.0], [223.0, 224.4], [229.0, 230.77], [231.0, 234.67], [238.0, 238.84]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.72, 29.44, 29.05, 31.69, 0.0, 37.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 59.19], ["electronic music", 5.43], ["trance music", 3.77]], null, null, null, null, null, null, null, null, null, [["throbbing", 48.34], ["hum", 38.96], ["music", 6.13]], [["music", 61.62], ["speech", 5.42], ["electronic music", 4.35]], [["music", 70.83], ["electronic music", 5.54], ["static", 3.39]], [["music", 37.68], ["speech", 10.42], ["moo", 4.79]], null, [["music", 67.66], ["whack, thwack", 7.8], ["thunk", 2.1]], null, null, null, null, null, null, [["music", 67.71], ["lullaby", 1.74], ["singing", 1.74]], null], "duration": [0.36, 0.23, -0.03, 1.04, 1.57, 0.84, 2.06, 1.93, 1.16, 0.12, 0.57, 1.59, -0.21, 1.4, 1.19, 1.07, 5.1, 2.19, 4.12, 2.51, 1.52, 5.06, 1.56, 1.77, -0.2, 0.0, 1.4, 1.77, 3.67, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/0668UNhYjXg_filtered.json b/annotations_filtered/0668UNhYjXg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd222c2e278b74061d3844bc9fd5632ee9341910 --- /dev/null +++ b/annotations_filtered/0668UNhYjXg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.04], [25.0, 26.15], [30.0, 30.91], [35.0, 35.87], [36.0, 36.76], [37.0, 37.42], [41.0, 41.99], [45.0, 44.85], [48.0, 55.02], [56.0, 56.22], [57.0, 57.79], [61.0, 95.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 76.81], ["ambient music", 5.4], ["hum", 2.18]], null, null, null], "duration": [1.04, 1.15, 0.91, 0.87, 0.76, 0.42, 0.99, -0.15, 7.02, 0.22, 0.79, 34.3]} \ No newline at end of file diff --git a/annotations_filtered/06B3m6L5fFw_filtered.json b/annotations_filtered/06B3m6L5fFw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8daae6a69e9096f9ca9ec87c6e6ed894336e4bf3 --- /dev/null +++ b/annotations_filtered/06B3m6L5fFw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.42], [10.0, 10.81], [14.0, 13.71], [15.0, 16.28], [18.0, 19.55], [21.0, 23.68], [25.0, 26.81], [28.0, 30.65], [31.0, 35.87], [41.0, 41.5], [43.0, 48.32], [50.0, 54.89], [56.0, 58.68], [62.0, 62.31], [63.0, 67.32], [68.0, 68.55], [70.0, 69.72], [73.0, 72.98], [74.0, 76.23], [77.0, 81.36], [88.0, 90.41], [92.0, 94.04], [95.0, 100.89], [102.0, 105.41], [106.0, 107.82], [108.0, 109.09], [109.0, 110.64], [111.0, 113.36], [114.0, 116.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 86.09, 0.0, 98.36, 70.58, 0.0, 35.58, 96.54, 93.45, 0.0, 36.94, 0.0, 0.0, 0.0, 97.92, 72.01, 66.51, 85.35, 65.44, 47.94, 0.0, 0.0, 0.0, 91.47, 37.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 33.98], ["hum", 14.66], ["mains hum", 3.77]], null, null, null, [["speech", 63.84], ["sidetone", 11.35], ["telephone", 4.85]], null, null, null, null, null, null, null, null, [["speech", 60.16], ["radio", 8.99], ["inside, small room", 3.07]], null, null, null, null, [["speech", 42.19], ["gong", 7.4], ["tuning fork", 7.26]]], "duration": [0.42, 0.81, -0.29, 1.28, 1.55, 2.68, 1.81, 2.65, 4.87, 0.5, 5.32, 4.89, 2.68, 0.31, 4.32, 0.55, -0.28, -0.02, 2.23, 4.36, 2.41, 2.04, 5.89, 3.41, 1.82, 1.09, 1.64, 2.36, 2.63]} \ No newline at end of file diff --git a/annotations_filtered/06DLNzLaTlE_filtered.json b/annotations_filtered/06DLNzLaTlE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3555dedb97bc5e14a17c8728e72d34f116ece2d --- /dev/null +++ b/annotations_filtered/06DLNzLaTlE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.53], [8.0, 8.41], [9.0, 9.66], [14.0, 23.63], [24.0, 34.86], [40.0, 47.85], [49.0, 51.19], [53.0, 53.27], [59.0, 58.94], [60.0, 60.45], [61.0, 61.53], [66.0, 66.36], [68.0, 68.47], [69.0, 70.48], [72.0, 72.32], [75.0, 75.46], [78.0, 79.79], [82.0, 82.41], [84.0, 84.87], [88.0, 88.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.99, 31.5, 33.42, 61.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 56.01], ["synthesizer", 10.4], ["theremin", 5.38]], [["music", 67.78], ["speech", 10.0], ["theremin", 4.21]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 0.41, 0.66, 9.63, 10.86, 7.85, 2.19, 0.27, -0.06, 0.45, 0.53, 0.36, 0.47, 1.48, 0.32, 0.46, 1.79, 0.41, 0.87, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/06Its9LhIHQ_filtered.json b/annotations_filtered/06Its9LhIHQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb52c99c8a41e1963acfb16b15f471a58c50710f --- /dev/null +++ b/annotations_filtered/06Its9LhIHQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 26.91], [28.0, 37.77], [39.0, 68.81], [70.0, 76.72], [78.0, 89.99], [92.0, 97.16], [99.0, 104.04], [107.0, 107.32], [109.0, 118.22], [118.0, 118.39], [118.0, 131.11], [135.0, 145.44]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [28.42, 28.21, 28.92, 29.72, 28.68, 29.33, 30.6, 0.0, 29.54, 0.0, 28.85, 28.54], "audiomae_on_audioset": [[["hum", 16.44], ["speech", 14.18], ["throbbing", 13.85]], [["speech", 37.3], ["vehicle", 23.46], ["boat, water vehicle", 10.19]], [["speech", 64.25], ["music", 10.29], ["hum", 4.25]], [["speech", 74.67], ["music", 16.74], ["hum", 1.28]], [["speech", 61.21], ["music", 10.18], ["hum", 5.67]], [["speech", 64.16], ["music", 9.49], ["synthesizer", 4.09]], [["music", 33.8], ["hum", 21.03], ["throbbing", 19.92]], null, [["music", 42.1], ["whack, thwack", 18.2], ["speech", 8.54]], null, [["speech", 55.26], ["explosion", 12.77], ["burst, pop", 7.2]], [["speech", 50.83], ["eruption", 18.21], ["explosion", 15.18]]], "duration": [13.91, 9.77, 29.81, 6.72, 11.99, 5.16, 5.04, 0.32, 9.22, 0.39, 13.11, 10.44]} \ No newline at end of file diff --git a/annotations_filtered/06L5y4Z9KcE_filtered.json b/annotations_filtered/06L5y4Z9KcE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1de5b19eabc356809923f45f7fe3a66cf70930b3 --- /dev/null +++ b/annotations_filtered/06L5y4Z9KcE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.53], [21.0, 21.15], [28.0, 32.53], [34.0, 44.41], [44.0, 44.51], [45.0, 44.73], [45.0, 48.96], [50.0, 50.31], [52.0, 51.68], [54.0, 54.45], [69.0, 74.07], [75.0, 75.79], [81.0, 81.09], [83.0, 84.23], [86.0, 86.26], [88.0, 89.16], [92.0, 93.58], [95.0, 94.93], [97.0, 109.78], [112.0, 112.38], [113.0, 113.95], [124.0, 125.31], [126.0, 126.39], [128.0, 130.01], [132.0, 133.56], [138.0, 142.47], [145.0, 145.18], [146.0, 146.42], [147.0, 157.22], [158.0, 161.25], [165.0, 167.9], [168.0, 167.95], [169.0, 168.94]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.16, 33.87, 0.0, 0.0, 95.64, 0.0, 0.0, 0.0, 34.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.85, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 31.61, 0.0, 0.0, 33.0, 81.89, 82.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 43.04], ["mosquito", 12.57], ["insect", 12.29]], [["electric shaver, electric razor", 43.47], ["mains hum", 25.92], ["hum", 14.2]], null, null, null, null, null, null, [["music", 63.24], ["effects unit", 9.91], ["guitar", 6.26]], null, null, null, null, null, null, null, [["speech", 31.88], ["mains hum", 14.2], ["hum", 14.01]], null, null, null, null, null, null, [["fart", 17.88], ["music", 13.06], ["explosion", 12.87]], null, null, [["buzz", 50.24], ["fly, housefly", 17.78], ["insect", 10.61]], null, null, null, null], "duration": [1.53, 0.15, 4.53, 10.41, 0.51, -0.27, 3.96, 0.31, -0.32, 0.45, 5.07, 0.79, 0.09, 1.23, 0.26, 1.16, 1.58, -0.07, 12.78, 0.38, 0.95, 1.31, 0.39, 2.01, 1.56, 4.47, 0.18, 0.42, 10.22, 3.25, 2.9, -0.05, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/06lJhEc7zIo_filtered.json b/annotations_filtered/06lJhEc7zIo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6108254577e451b2876a55c9aa22e2cf87ee8cae --- /dev/null +++ b/annotations_filtered/06lJhEc7zIo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 15.62], [16.0, 18.71], [19.0, 20.43], [21.0, 22.28], [23.0, 32.29], [33.0, 35.51], [36.0, 47.26], [48.0, 49.37], [54.0, 54.41], [57.0, 57.54], [60.0, 66.04], [77.0, 76.77], [83.0, 83.78], [90.0, 91.96], [106.0, 107.86], [113.0, 113.68], [117.0, 117.44], [121.0, 120.75], [121.0, 122.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.98, 84.43, 0.0, 0.0, 99.92, 98.59, 84.8, 0.0, 0.0, 0.0, 65.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [10.62, 2.71, 1.43, 1.28, 9.29, 2.51, 11.26, 1.37, 0.41, 0.54, 6.04, -0.23, 0.78, 1.96, 1.86, 0.68, 0.44, -0.25, 1.72]} \ No newline at end of file diff --git a/annotations_filtered/06qgu4XoNL4_filtered.json b/annotations_filtered/06qgu4XoNL4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..119b179c7f49a953464730bf4545850f20fb8a87 --- /dev/null +++ b/annotations_filtered/06qgu4XoNL4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.17], [7.0, 8.36], [9.0, 9.69], [10.0, 11.08], [12.0, 13.22], [15.0, 17.86], [18.0, 19.2], [20.0, 21.98], [22.0, 22.23], [22.0, 24.56], [31.0, 34.21], [39.0, 41.98], [43.0, 51.97], [54.0, 54.51], [61.0, 62.58], [67.0, 69.89], [70.0, 71.22], [74.0, 77.57], [78.0, 78.87], [81.0, 81.87], [83.0, 85.56], [87.0, 87.18], [89.0, 89.94], [91.0, 94.1], [95.0, 95.89], [100.0, 100.26], [101.0, 101.53], [102.0, 102.03], [104.0, 104.6], [117.0, 116.88], [118.0, 118.81], [119.0, 120.04], [121.0, 121.27], [122.0, 129.9], [145.0, 146.42], [147.0, 153.86], [157.0, 157.05], [158.0, 158.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.48, 0.0, 0.0, 0.0, 32.94, 36.32, 32.13, 42.79, 0.0, 0.0, 39.86, 0.0, 42.08, 0.0, 0.0, 47.86, 0.0, 0.0, 45.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.44, 0.0, 41.26, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 83.86], ["musical instrument", 3.73], ["electronic music", 2.81]], null, null, null, [["speech", 41.07], ["music", 39.75], ["sonar", 2.58]], [["livestock, farm animals, working animals", 43.24], ["cattle, bovinae", 31.91], ["moo", 16.67]], [["cattle, bovinae", 22.43], ["speech", 22.12], ["livestock, farm animals, working animals", 17.92]], [["music", 25.76], ["didgeridoo", 19.8], ["speech", 15.61]], null, null, [["speech", 87.55], ["radio", 3.48], ["speech synthesizer", 0.77]], null, [["speech", 38.27], ["music", 14.65], ["boing", 6.65]], null, null, [["heart sounds, heartbeat", 22.74], ["throbbing", 18.96], ["hum", 15.19]], null, null, [["speech", 57.35], ["sidetone", 11.02], ["music", 9.47]], null, null, null, null, null, null, null, null, null, [["music", 71.6], ["guitar", 6.11], ["bass guitar", 5.83]], null, [["music", 28.15], ["hum", 12.62], ["throbbing", 11.28]], null, null], "duration": [1.17, 1.36, 0.69, 1.08, 1.22, 2.86, 1.2, 1.98, 0.23, 2.56, 3.21, 2.98, 8.97, 0.51, 1.58, 2.89, 1.22, 3.57, 0.87, 0.87, 2.56, 0.18, 0.94, 3.1, 0.89, 0.26, 0.53, 0.03, 0.6, -0.12, 0.81, 1.04, 0.27, 7.9, 1.42, 6.86, 0.05, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/06u-a5jmi6o_filtered.json b/annotations_filtered/06u-a5jmi6o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ee6bd08fe900888f8e3f88cde775a5a5414fcc3 --- /dev/null +++ b/annotations_filtered/06u-a5jmi6o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.68], [7.0, 11.94], [19.0, 27.92], [31.0, 37.86], [39.0, 44.71], [46.0, 55.27]], "keep_status": [false, false, false, false, true, false], "silence_prob": [0.0, 99.05, 35.57, 36.05, 35.42, 35.29], "audiomae_on_audioset": [null, null, [["music", 61.22], ["musical instrument", 10.02], ["flamenco", 4.87]], [["music", 70.82], ["singing", 5.31], ["musical instrument", 4.68]], [["music", 52.73], ["singing", 5.44], ["percussion", 5.01]], [["music", 80.77], ["singing", 4.39], ["musical instrument", 2.53]]], "duration": [1.68, 4.94, 8.92, 6.86, 5.71, 9.27]} \ No newline at end of file diff --git a/annotations_filtered/07FdVcspOfQ_filtered.json b/annotations_filtered/07FdVcspOfQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ac8cbf41048bad160776ece1ccf83e50881dcc7 --- /dev/null +++ b/annotations_filtered/07FdVcspOfQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.91], [9.0, 10.13], [11.0, 11.43], [13.0, 13.51], [15.0, 17.41], [19.0, 19.58], [23.0, 23.45], [25.0, 25.41], [28.0, 29.73], [31.0, 32.04], [34.0, 34.38], [36.0, 37.08], [61.0, 62.68], [64.0, 64.18], [66.0, 66.18], [67.0, 67.91], [77.0, 77.28], [78.0, 78.87], [86.0, 86.16], [92.0, 91.93], [93.0, 93.82], [98.0, 97.8], [108.0, 108.16], [120.0, 119.92], [123.0, 123.33], [129.0, 129.56], [135.0, 145.03], [149.0, 159.85], [160.0, 161.42], [163.0, 166.62], [167.0, 168.56], [171.0, 174.56]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 41.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.54, 50.81, 0.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, [["frog", 17.51], ["speech", 13.85], ["croak", 13.11]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 20.72], ["cattle, bovinae", 18.28], ["livestock, farm animals, working animals", 12.42]], null, null, null, null, null], "duration": [1.91, 1.13, 0.43, 0.51, 2.41, 0.58, 0.45, 0.41, 1.73, 1.04, 0.38, 1.08, 1.68, 0.18, 0.18, 0.91, 0.28, 0.87, 0.16, -0.07, 0.82, -0.2, 0.16, -0.08, 0.33, 0.56, 10.03, 10.85, 1.42, 3.62, 1.56, 3.56]} \ No newline at end of file diff --git a/annotations_filtered/07GcBnddoMU_filtered.json b/annotations_filtered/07GcBnddoMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63cbee2fc67730a4ff1715fda124488e6cc0a1bc --- /dev/null +++ b/annotations_filtered/07GcBnddoMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[63.0, 64.29], [65.0, 77.09], [79.0, 88.57], [91.0, 109.56], [112.0, 113.98], [115.0, 124.46], [126.0, 125.59], [126.0, 133.12], [134.0, 134.03], [138.0, 140.93], [142.0, 142.86], [146.0, 146.25], [148.0, 148.29], [152.0, 152.93], [156.0, 166.83]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 49.78, 55.39, 94.66, 0.0, 36.83, 0.0, 82.97, 0.0, 93.6, 0.0, 0.0, 0.0, 0.0, 94.22], "audiomae_on_audioset": [null, [["music", 35.27], ["groan", 4.95], ["animal", 4.06]], null, null, null, [["speech", 52.58], ["whack, thwack", 24.32], ["breaking", 9.51]], null, null, null, null, null, null, null, null, null], "duration": [1.29, 12.09, 9.57, 18.56, 1.98, 9.46, -0.41, 7.12, 0.03, 2.93, 0.86, 0.25, 0.29, 0.93, 10.83]} \ No newline at end of file diff --git a/annotations_filtered/07YuuA_2O9w_filtered.json b/annotations_filtered/07YuuA_2O9w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0f464859599379c0a78c67154b379645c60115b --- /dev/null +++ b/annotations_filtered/07YuuA_2O9w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.73], [13.0, 13.29], [21.0, 22.38], [26.0, 26.01], [29.0, 29.96], [32.0, 32.27], [53.0, 53.25], [58.0, 58.23], [60.0, 60.45], [68.0, 68.52], [73.0, 72.99], [79.0, 79.42], [81.0, 81.03], [87.0, 86.83], [90.0, 90.48], [100.0, 100.26], [102.0, 106.22], [118.0, 118.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [44.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.34, 0.0], "audiomae_on_audioset": [[["hum", 43.48], ["mains hum", 39.32], ["throbbing", 8.37]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["breaking", 22.4], ["dishes, pots, and pans", 11.91], ["smash, crash", 8.9]], null], "duration": [3.73, 0.29, 1.38, 0.01, 0.96, 0.27, 0.25, 0.23, 0.45, 0.52, -0.01, 0.42, 0.03, -0.17, 0.48, 0.26, 4.22, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/07kluxoO8j8_filtered.json b/annotations_filtered/07kluxoO8j8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e086ff25cf4031b6fb1f41cda36ea28a868c189c --- /dev/null +++ b/annotations_filtered/07kluxoO8j8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.32], [12.0, 12.6], [14.0, 14.98], [18.0, 18.22], [32.0, 34.01], [38.0, 40.05], [42.0, 44.39], [46.0, 52.12], [53.0, 64.59], [70.0, 74.21], [75.0, 81.5], [86.0, 98.64], [102.0, 111.92], [114.0, 123.69], [127.0, 126.64], [130.0, 130.92], [136.0, 139.53], [143.0, 143.88], [147.0, 150.72], [151.0, 154.08], [155.0, 157.89], [161.0, 164.81], [167.0, 171.71], [172.0, 184.54], [186.0, 200.04]], "keep_status": [false, false, false, false, false, false, true, true, true, true, true, true, false, false, false, false, false, false, true, true, true, true, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.73, 34.2, 33.72, 35.57, 33.89, 36.59, 35.76, 29.87, 29.42, 29.36, 0.0, 0.0, 30.8, 0.0, 28.7, 28.88, 29.27, 29.01, 30.75, 29.15, 29.25], "audiomae_on_audioset": [null, null, null, null, [["speech", 28.26], ["music", 24.28], ["hum", 21.43]], [["music", 73.34], ["hum", 4.63], ["electronic music", 3.03]], [["speech", 24.28], ["sidetone", 20.96], ["music", 15.12]], [["music", 43.26], ["hum", 15.94], ["noise", 7.85]], [["speech", 37.44], ["music", 18.56], ["hum", 10.47]], [["music", 37.86], ["effects unit", 8.16], ["synthesizer", 6.31]], [["music", 57.0], ["animal", 8.24], ["musical instrument", 4.41]], [["livestock, farm animals, working animals", 31.29], ["cattle, bovinae", 23.17], ["speech", 14.1]], [["music", 75.34], ["speech", 2.23], ["musical instrument", 1.92]], [["music", 39.57], ["hum", 21.75], ["mains hum", 9.2]], null, null, [["hum", 39.25], ["mains hum", 30.73], ["throbbing", 18.51]], null, [["music", 17.25], ["speech", 8.26], ["vehicle", 7.54]], [["music", 20.03], ["rumble", 14.29], ["mains hum", 7.13]], [["music", 32.78], ["whale vocalization", 13.05], ["speech", 8.58]], [["music", 48.44], ["cacophony", 17.03], ["throbbing", 3.41]], [["music", 55.04], ["brass instrument", 6.63], ["trombone", 6.42]], [["music", 34.22], ["throbbing", 11.13], ["hum", 8.52]], [["music", 38.14], ["speech", 22.32], ["throbbing", 4.56]]], "duration": [0.32, 0.6, 0.98, 0.22, 2.01, 2.05, 2.39, 6.12, 11.59, 4.21, 6.5, 12.64, 9.92, 9.69, -0.36, 0.92, 3.53, 0.88, 3.72, 3.08, 2.89, 3.81, 4.71, 12.54, 14.04]} \ No newline at end of file diff --git a/annotations_filtered/080g4Ylkv2M_filtered.json b/annotations_filtered/080g4Ylkv2M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7eddccf5fb9333202cc6f56c140f33728ede8b2d --- /dev/null +++ b/annotations_filtered/080g4Ylkv2M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.35], [6.0, 10.2], [13.0, 26.65], [30.0, 41.94], [44.0, 44.56], [46.0, 48.17], [49.0, 50.84], [52.0, 63.39], [72.0, 76.55], [78.0, 80.35], [81.0, 81.8], [85.0, 84.57], [86.0, 89.82], [92.0, 92.25]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.52, 29.54, 29.42, 0.0, 30.74, 0.0, 34.68, 99.65, 99.87, 0.0, 0.0, 67.51, 0.0], "audiomae_on_audioset": [null, [["music", 42.02], ["theremin", 39.4], ["synthesizer", 4.93]], [["hum", 32.83], ["music", 28.76], ["mains hum", 19.53]], [["music", 45.6], ["whale vocalization", 20.24], ["theremin", 9.84]], null, [["speech", 22.69], ["cattle, bovinae", 16.39], ["moo", 15.2]], null, [["music", 56.87], ["effects unit", 11.47], ["guitar", 7.71]], null, null, null, null, null, null], "duration": [0.35, 4.2, 13.65, 11.94, 0.56, 2.17, 1.84, 11.39, 4.55, 2.35, 0.8, -0.43, 3.82, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/081zoKkdEYA_filtered.json b/annotations_filtered/081zoKkdEYA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1464e4db0bedd445d5a2388468347c3fdd6cac0 --- /dev/null +++ b/annotations_filtered/081zoKkdEYA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[98.0, 101.24], [102.0, 111.79], [115.0, 128.63], [129.0, 129.52]], "keep_status": [true, false, true, false], "silence_prob": [28.89, 29.53, 36.4, 0.0], "audiomae_on_audioset": [[["music", 17.28], ["speech", 9.63], ["rumble", 8.01]], [["music", 66.13], ["speech", 3.56], ["throbbing", 3.48]], [["hum", 21.18], ["speech", 12.96], ["groan", 11.95]], null], "duration": [3.24, 9.79, 13.63, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/088CLxgnr8w_filtered.json b/annotations_filtered/088CLxgnr8w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1550ad1855fe0025a3cada787b66ba55ed9f5ad6 --- /dev/null +++ b/annotations_filtered/088CLxgnr8w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.54], [5.0, 5.66], [10.0, 11.47], [12.0, 15.58], [16.0, 18.39], [19.0, 20.88], [22.0, 23.36], [24.0, 25.66], [27.0, 31.51], [33.0, 34.75], [37.0, 37.54], [46.0, 46.3], [55.0, 65.37], [72.0, 73.28], [76.0, 76.76], [105.0, 109.17], [113.0, 114.4], [117.0, 117.56], [121.0, 126.77], [129.0, 141.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 52.1, 54.43, 0.0, 0.0, 0.0, 54.9, 0.0, 0.0, 0.0, 56.63, 0.0, 0.0, 54.56, 0.0, 0.0, 57.89, 54.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.54, 0.66, 1.47, 3.58, 2.39, 1.88, 1.36, 1.66, 4.51, 1.75, 0.54, 0.3, 10.37, 1.28, 0.76, 4.17, 1.4, 0.56, 5.77, 12.51]} \ No newline at end of file diff --git a/annotations_filtered/08NzJRNAFGc_filtered.json b/annotations_filtered/08NzJRNAFGc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e80e9a4e5b715823bfa635b671450977fda8ee1 --- /dev/null +++ b/annotations_filtered/08NzJRNAFGc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 19.82], [20.0, 23.9], [28.0, 28.53], [31.0, 32.37], [34.0, 34.82], [35.0, 35.94], [36.0, 37.94], [38.0, 40.59], [41.0, 42.03], [43.0, 44.31], [46.0, 49.33], [51.0, 53.54], [56.0, 57.13], [60.0, 67.05], [68.0, 70.43], [71.0, 72.96], [74.0, 76.69], [78.0, 78.95], [79.0, 81.53], [82.0, 83.73], [91.0, 90.85], [98.0, 98.86], [103.0, 104.14], [106.0, 107.7], [114.0, 114.2], [118.0, 118.42], [119.0, 119.62], [122.0, 124.31], [126.0, 126.67]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [50.06, 36.25, 0.0, 0.0, 0.0, 0.0, 0.0, 33.63, 0.0, 0.0, 54.97, 98.59, 0.0, 83.52, 92.15, 0.0, 70.02, 0.0, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.13, 0.0], "audiomae_on_audioset": [null, [["speech", 29.92], ["sidetone", 22.5], ["hum", 10.62]], null, null, null, null, null, [["stomach rumble", 42.7], ["sine wave", 11.39], ["fart", 6.96]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.82, 3.9, 0.53, 1.37, 0.82, 0.94, 1.94, 2.59, 1.03, 1.31, 3.33, 2.54, 1.13, 7.05, 2.43, 1.96, 2.69, 0.95, 2.53, 1.73, -0.15, 0.86, 1.14, 1.7, 0.2, 0.42, 0.62, 2.31, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/08iCLTmybXM_filtered.json b/annotations_filtered/08iCLTmybXM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cd26fdb54fc63b8275ffcd6064374e41f994858 --- /dev/null +++ b/annotations_filtered/08iCLTmybXM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.15], [8.0, 10.0], [14.0, 14.23], [16.0, 16.48], [23.0, 26.01], [27.0, 28.16], [29.0, 29.83], [31.0, 32.68], [35.0, 35.33], [37.0, 36.93], [37.0, 37.86], [39.0, 39.01], [43.0, 43.53], [45.0, 45.33], [49.0, 48.93], [49.0, 52.62], [55.0, 55.63], [56.0, 56.69], [61.0, 61.47], [63.0, 63.42], [76.0, 76.38], [77.0, 78.16], [81.0, 81.09], [87.0, 88.48], [95.0, 95.67], [103.0, 103.3], [104.0, 104.75], [108.0, 108.36], [113.0, 113.39], [115.0, 115.96], [118.0, 118.57], [120.0, 120.6], [121.0, 121.73], [123.0, 124.14], [125.0, 126.22], [127.0, 127.7], [129.0, 129.02], [131.0, 131.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 93.6, 0.0, 0.0, 56.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 26.55], ["hum", 20.92], ["bee, wasp, etc.", 18.98]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.15, 2.0, 0.23, 0.48, 3.01, 1.16, 0.83, 1.68, 0.33, -0.07, 0.86, 0.01, 0.53, 0.33, -0.07, 3.62, 0.63, 0.69, 0.47, 0.42, 0.38, 1.16, 0.09, 1.48, 0.67, 0.3, 0.75, 0.36, 0.39, 0.96, 0.57, 0.6, 0.73, 1.14, 1.22, 0.7, 0.02, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/08rJmhhQHtY_filtered.json b/annotations_filtered/08rJmhhQHtY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5b771ec777eb43b6839937638bb50f1a612ebac --- /dev/null +++ b/annotations_filtered/08rJmhhQHtY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.83], [10.0, 12.38], [21.0, 33.42], [38.0, 45.1], [46.0, 46.36], [50.0, 50.97], [52.0, 54.33], [55.0, 56.02], [58.0, 58.77], [64.0, 64.59], [66.0, 67.42], [70.0, 70.21], [75.0, 85.21], [88.0, 89.68], [91.0, 91.25], [92.0, 92.06], [93.0, 98.66], [99.0, 100.04], [106.0, 106.76], [109.0, 114.71], [115.0, 119.3]], "keep_status": [false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 51.71, 44.69, 39.91, 0.0, 0.0, 41.62, 0.0, 0.0, 0.0, 0.0, 0.0, 93.13, 0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 81.0, 45.69], "audiomae_on_audioset": [null, null, [["male singing", 29.4], ["speech", 29.3], ["clapping", 10.78]], [["speech", 60.62], ["fart", 5.94], ["moo", 3.11]], null, null, [["speech", 21.71], ["clapping", 6.3], ["livestock, farm animals, working animals", 5.38]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.7], ["hands", 8.2], ["music", 8.1]]], "duration": [0.83, 2.38, 12.42, 7.1, 0.36, 0.97, 2.33, 1.02, 0.77, 0.59, 1.42, 0.21, 10.21, 1.68, 0.25, 0.06, 5.66, 1.04, 0.76, 5.71, 4.3]} \ No newline at end of file diff --git a/annotations_filtered/09MjH5hbF5Y_filtered.json b/annotations_filtered/09MjH5hbF5Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a788c90a2ba90b168b64c832ef8810c2aa5387ee --- /dev/null +++ b/annotations_filtered/09MjH5hbF5Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.35], [4.0, 4.24], [9.0, 8.78], [15.0, 22.03], [24.0, 24.65], [27.0, 27.06], [28.0, 30.35], [32.0, 32.46], [35.0, 34.91], [38.0, 38.31], [42.0, 47.38], [50.0, 51.85], [56.0, 57.33], [59.0, 59.7], [61.0, 61.69], [64.0, 64.35], [66.0, 66.56], [70.0, 71.0], [73.0, 74.83], [78.0, 78.78], [82.0, 89.88], [94.0, 97.14], [98.0, 100.75], [103.0, 112.01], [113.0, 115.33]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.15, 0.0, 0.0, 63.31, 0.0, 0.0, 0.0, 90.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.83, 64.29, 55.6, 85.17, 94.52], "audiomae_on_audioset": [null, null, null, [["animal", 30.69], ["livestock, farm animals, working animals", 9.56], ["cattle, bovinae", 9.03]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 35.25], ["bee, wasp, etc.", 6.93], ["insect", 5.1]], null, null, null, null], "duration": [0.35, 0.24, -0.22, 7.03, 0.65, 0.06, 2.35, 0.46, -0.09, 0.31, 5.38, 1.85, 1.33, 0.7, 0.69, 0.35, 0.56, 1.0, 1.83, 0.78, 7.88, 3.14, 2.75, 9.01, 2.33]} \ No newline at end of file diff --git a/annotations_filtered/09idDzvkxZ0_filtered.json b/annotations_filtered/09idDzvkxZ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8cde1d2a73e9c9f597554640c11a985e45701323 --- /dev/null +++ b/annotations_filtered/09idDzvkxZ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.51], [25.0, 26.3], [41.0, 41.42], [44.0, 44.12], [46.0, 46.25]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [1.51, 1.3, 0.42, 0.12, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/09m9ltjwuJU_filtered.json b/annotations_filtered/09m9ltjwuJU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f84c0e5735b18c1ef20a041a2331b7e6ba7a1340 --- /dev/null +++ b/annotations_filtered/09m9ltjwuJU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.72], [21.0, 25.69], [35.0, 35.33], [55.0, 55.16], [60.0, 60.94], [62.0, 62.67], [86.0, 86.63], [91.0, 91.57], [92.0, 96.06], [97.0, 98.85], [100.0, 100.43], [104.0, 105.21], [106.0, 106.15], [107.0, 107.72], [108.0, 108.31], [108.0, 108.87], [115.0, 115.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 74.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, 4.69, 0.33, 0.16, 0.94, 0.67, 0.63, 0.57, 4.06, 1.85, 0.43, 1.21, 0.15, 0.72, 0.31, 0.87, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/09oumdE0UFI_filtered.json b/annotations_filtered/09oumdE0UFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19e32a59728da93eefa7115f92ec677f187fdefc --- /dev/null +++ b/annotations_filtered/09oumdE0UFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.51], [12.0, 13.29], [20.0, 20.07], [22.0, 26.27], [32.0, 32.73], [33.0, 33.44], [35.0, 35.65], [36.0, 39.41], [52.0, 53.7], [60.0, 60.34], [64.0, 66.53], [72.0, 73.48], [75.0, 78.34], [83.0, 83.84], [84.0, 87.0], [90.0, 90.0], [92.0, 92.82], [97.0, 99.05], [102.0, 104.3], [104.0, 104.43], [110.0, 111.32], [117.0, 118.29], [124.0, 125.02], [136.0, 137.78], [139.0, 138.96], [139.0, 144.96], [147.0, 150.47], [155.0, 158.38], [162.0, 166.29], [166.0, 166.33], [168.0, 168.12], [170.0, 172.83], [178.0, 178.06], [182.0, 187.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 59.15, 0.0, 0.0, 0.0, 71.87, 0.0, 0.0, 50.91, 0.0, 47.27, 0.0, 48.31, 0.0, 0.0, 45.24, 57.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.94, 42.93, 37.39, 44.57, 0.0, 0.0, 46.12, 0.0, 40.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 60.26], ["didgeridoo", 7.97], ["theremin", 3.5]], null, [["music", 49.5], ["carnatic music", 7.57], ["musical instrument", 5.31]], null, null, [["music", 48.97], ["a capella", 6.56], ["choir", 6.29]], null, null, null, null, null, null, null, [["music", 65.34], ["cello", 5.5], ["lullaby", 3.37]], [["theremin", 45.11], ["music", 30.4], ["cello", 6.03]], [["music", 61.92], ["theremin", 9.88], ["humming", 9.51]], [["theremin", 65.84], ["music", 26.71], ["musical instrument", 0.95]], null, null, [["music", 57.18], ["singing", 6.65], ["chant", 5.33]], null, [["music", 38.08], ["theremin", 35.79], ["moo", 3.41]]], "duration": [0.51, 1.29, 0.07, 4.27, 0.73, 0.44, 0.65, 3.41, 1.7, 0.34, 2.53, 1.48, 3.34, 0.84, 3.0, 0.0, 0.82, 2.05, 2.3, 0.43, 1.32, 1.29, 1.02, 1.78, -0.04, 5.96, 3.47, 3.38, 4.29, 0.33, 0.12, 2.83, 0.06, 5.34]} \ No newline at end of file diff --git a/annotations_filtered/09zP4iK6QuI_filtered.json b/annotations_filtered/09zP4iK6QuI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2d97763d47fc3c0312caa01f4d81179fd66e033 --- /dev/null +++ b/annotations_filtered/09zP4iK6QuI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 13.88], [20.0, 24.65], [26.0, 28.27], [28.0, 28.39], [29.0, 31.4], [38.0, 38.26], [46.0, 46.21], [53.0, 56.52], [59.0, 79.62], [90.0, 90.41], [97.0, 96.92], [98.0, 99.25], [101.0, 102.84], [104.0, 104.82], [105.0, 111.08], [111.0, 112.36], [115.0, 117.53]], "keep_status": [false, true, true, false, true, false, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 37.82, 30.39, 0.0, 46.72, 0.0, 0.0, 35.25, 37.1, 0.0, 0.0, 0.0, 0.0, 0.0, 36.49, 0.0, 39.52], "audiomae_on_audioset": [null, [["music", 40.62], ["throbbing", 14.04], ["hum", 12.85]], [["music", 37.31], ["throbbing", 17.45], ["hum", 11.19]], null, [["speech", 24.3], ["music", 17.77], ["radio", 16.7]], null, null, [["speech", 35.46], ["thunk", 8.59], ["music", 7.29]], [["music", 46.28], ["glass", 25.95], ["theremin", 3.11]], null, null, null, null, null, [["hum", 53.41], ["mains hum", 17.14], ["throbbing", 7.7]], null, [["speech", 16.14], ["rumble", 12.84], ["music", 7.88]]], "duration": [-0.12, 4.65, 2.27, 0.39, 2.4, 0.26, 0.21, 3.52, 20.62, 0.41, -0.08, 1.25, 1.84, 0.82, 6.08, 1.36, 2.53]} \ No newline at end of file diff --git a/annotations_filtered/0A0VANPUG-g_filtered.json b/annotations_filtered/0A0VANPUG-g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd394194114cd4618330c335c22436ae39f92a73 --- /dev/null +++ b/annotations_filtered/0A0VANPUG-g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 25.68], [27.0, 28.58], [30.0, 31.78], [32.0, 34.11], [35.0, 36.58], [37.0, 44.78], [47.0, 48.34], [49.0, 50.4], [51.0, 85.73], [87.0, 93.9], [95.0, 96.53], [98.0, 97.63], [98.0, 100.43], [103.0, 104.21], [106.0, 110.32], [111.0, 118.37], [119.0, 121.17], [123.0, 124.6], [125.0, 128.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [88.46, 0.0, 0.0, 94.95, 0.0, 89.01, 0.0, 0.0, 0.0, 82.43, 0.0, 0.0, 88.28, 0.0, 99.65, 81.0, 100.0, 0.0, 94.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.68, 1.58, 1.78, 2.11, 1.58, 7.78, 1.34, 1.4, 34.73, 6.9, 1.53, -0.37, 2.43, 1.21, 4.32, 7.37, 2.17, 1.6, 3.28]} \ No newline at end of file diff --git a/annotations_filtered/0A80j2BuMaU_filtered.json b/annotations_filtered/0A80j2BuMaU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ac4fe4a6098f5961adb3162ecbd29e3850b069e --- /dev/null +++ b/annotations_filtered/0A80j2BuMaU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.55], [10.0, 11.26], [12.0, 14.28], [18.0, 18.33], [19.0, 19.65], [22.0, 22.71], [23.0, 24.09], [25.0, 34.38], [35.0, 37.99], [39.0, 39.45], [41.0, 48.88], [53.0, 64.49], [65.0, 66.33], [67.0, 69.33], [70.0, 71.96], [73.0, 76.4], [78.0, 80.62], [81.0, 85.29], [86.0, 91.0], [92.0, 91.86], [94.0, 137.19], [138.0, 141.15], [142.0, 160.52], [164.0, 163.7]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 47.16, 0.0, 0.0, 0.0, 0.0, 84.98, 59.15, 0.0, 36.12, 44.6, 0.0, 74.44, 0.0, 46.9, 50.26, 72.31, 53.47, 0.0, 0.0, 62.99, 82.07, 0.0], "audiomae_on_audioset": [null, null, [["fly, housefly", 24.59], ["hum", 6.42], ["bee, wasp, etc.", 5.97]], null, null, null, null, null, null, null, [["speech", 56.51], ["explosion", 8.57], ["eruption", 4.59]], [["hum", 44.62], ["mains hum", 18.52], ["throbbing", 9.22]], null, null, null, [["whale vocalization", 40.61], ["livestock, farm animals, working animals", 9.12], ["music", 6.94]], null, null, null, null, null, null, null, null], "duration": [0.55, 1.26, 2.28, 0.33, 0.65, 0.71, 1.09, 9.38, 2.99, 0.45, 7.88, 11.49, 1.33, 2.33, 1.96, 3.4, 2.62, 4.29, 5.0, -0.14, 43.19, 3.15, 18.52, -0.3]} \ No newline at end of file diff --git a/annotations_filtered/0A9ppII7eVA_filtered.json b/annotations_filtered/0A9ppII7eVA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61abd11c230a444d56c8a3fe116cb7d3fc95f083 --- /dev/null +++ b/annotations_filtered/0A9ppII7eVA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.69], [7.0, 8.94], [10.0, 10.77], [15.0, 16.61], [26.0, 28.26], [33.0, 33.1], [37.0, 37.4], [40.0, 40.56], [42.0, 43.17], [47.0, 48.03], [51.0, 53.99], [55.0, 56.08], [57.0, 59.19], [60.0, 60.17], [62.0, 62.48], [63.0, 63.63], [67.0, 67.26], [68.0, 68.96], [71.0, 71.37], [76.0, 77.06], [78.0, 80.57], [83.0, 82.93], [87.0, 87.59], [89.0, 90.81], [96.0, 98.24], [103.0, 102.78], [106.0, 109.53], [112.0, 113.85], [116.0, 117.32]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 36.37, 0.0, 0.0, 0.0, 0.0, 0.0, 34.28, 0.0, 43.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.25, 0.0, 0.0, 0.0, 56.48, 0.0, 31.73, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["radio", 23.08], ["music", 16.6], ["speech", 16.15]], null, null, null, null, null, [["speech", 45.08], ["sidetone", 24.91], ["radio", 2.67]], null, [["speech", 64.46], ["radio", 18.39], ["sidetone", 3.86]], null, null, null, null, null, null, null, [["whale vocalization", 59.93], ["theremin", 11.64], ["music", 4.76]], null, null, null, null, null, [["speech", 10.03], ["hum", 9.81], ["crowd", 8.39]], null, null], "duration": [0.69, 1.94, 0.77, 1.61, 2.26, 0.1, 0.4, 0.56, 1.17, 1.03, 2.99, 1.08, 2.19, 0.17, 0.48, 0.63, 0.26, 0.96, 0.37, 1.06, 2.57, -0.07, 0.59, 1.81, 2.24, -0.22, 3.53, 1.85, 1.32]} \ No newline at end of file diff --git a/annotations_filtered/0ACTvENkyD8_filtered.json b/annotations_filtered/0ACTvENkyD8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3821fcdc7547a3af05260ffb660b2d3a41895d0a --- /dev/null +++ b/annotations_filtered/0ACTvENkyD8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 20.02], [23.0, 23.99], [25.0, 27.4], [28.0, 30.38], [32.0, 34.05], [36.0, 36.86], [38.0, 39.21], [40.0, 42.4], [43.0, 53.67], [54.0, 60.0], [61.0, 76.72], [79.0, 88.48], [89.0, 118.4], [119.0, 119.42]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, true, false], "silence_prob": [29.52, 0.0, 84.98, 45.36, 79.07, 0.0, 0.0, 54.5, 38.42, 38.14, 28.74, 35.33, 28.92, 0.0], "audiomae_on_audioset": [[["speech", 41.36], ["music", 28.54], ["didgeridoo", 6.52]], null, null, [["busy signal", 52.25], ["music", 15.58], ["synthesizer", 5.23]], null, null, null, null, [["speech", 35.21], ["music", 24.17], ["animal", 4.96]], [["music", 29.32], ["dog", 15.91], ["animal", 10.52]], [["music", 74.38], ["throbbing", 4.72], ["sound effect", 2.06]], [["music", 50.89], ["speech", 16.07], ["livestock, farm animals, working animals", 4.29]], [["music", 48.79], ["groan", 6.93], ["fly, housefly", 6.43]], null], "duration": [19.02, 0.99, 2.4, 2.38, 2.05, 0.86, 1.21, 2.4, 10.67, 6.0, 15.72, 9.48, 29.4, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/0AUpWC9Whfs_filtered.json b/annotations_filtered/0AUpWC9Whfs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..323efbee0ca83a564eaf9bf4aed4b1bda2ae9fde --- /dev/null +++ b/annotations_filtered/0AUpWC9Whfs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.96], [13.0, 14.37], [16.0, 17.44], [19.0, 20.93], [22.0, 25.66], [29.0, 30.33], [31.0, 32.76], [33.0, 38.28], [40.0, 40.85], [42.0, 43.17], [45.0, 48.96], [50.0, 53.72], [57.0, 58.4], [62.0, 62.34], [67.0, 67.1], [72.0, 73.84], [74.0, 76.94], [78.0, 79.86], [81.0, 83.35], [84.0, 86.14], [88.0, 91.39], [92.0, 94.19], [95.0, 99.13], [100.0, 103.76], [107.0, 111.2], [113.0, 112.99], [115.0, 124.58], [126.0, 126.1], [126.0, 127.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 96.04, 0.0, 0.0, 94.95, 0.0, 0.0, 92.97, 76.7, 0.0, 0.0, 0.0, 0.0, 60.05, 0.0, 78.04, 99.36, 93.45, 97.33, 73.06, 78.72, 59.24, 0.0, 37.92, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 76.97], ["theremin", 4.66], ["ambient music", 3.38]], null, null], "duration": [0.96, 1.37, 1.44, 1.93, 3.66, 1.33, 1.76, 5.28, 0.85, 1.17, 3.96, 3.72, 1.4, 0.34, 0.1, 1.84, 2.94, 1.86, 2.35, 2.14, 3.39, 2.19, 4.13, 3.76, 4.2, -0.01, 9.58, 0.1, 1.38]} \ No newline at end of file diff --git a/annotations_filtered/0AslM2bC5DY_filtered.json b/annotations_filtered/0AslM2bC5DY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a1721adadb0826b41822e7d2a3d074c1adb81c9 --- /dev/null +++ b/annotations_filtered/0AslM2bC5DY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 11.67], [12.0, 26.15], [31.0, 31.67], [32.0, 32.76], [37.0, 40.1], [42.0, 42.97], [44.0, 48.57], [49.0, 51.04], [55.0, 58.48], [59.0, 62.16], [62.0, 70.5], [71.0, 72.4], [73.0, 78.36], [80.0, 95.2], [96.0, 98.51], [100.0, 105.27], [107.0, 109.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.52, 0.0, 0.0, 99.97, 0.0, 100.0, 100.0, 100.0, 99.1, 99.8, 0.0, 99.98, 99.88, 99.93, 100.0, 99.87], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.33, 14.15, 0.67, 0.76, 3.1, 0.97, 4.57, 2.04, 3.48, 3.16, 8.5, 1.4, 5.36, 15.2, 2.51, 5.27, 2.02]} \ No newline at end of file diff --git a/annotations_filtered/0AspXDFcGlw_filtered.json b/annotations_filtered/0AspXDFcGlw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d4db5dc6f1d7c234ccdeeca5d205a2ff6942652 --- /dev/null +++ b/annotations_filtered/0AspXDFcGlw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.53], [7.0, 8.07], [9.0, 8.97], [14.0, 14.3], [15.0, 15.7], [20.0, 20.21], [25.0, 25.51], [26.0, 26.69], [27.0, 27.95], [28.0, 29.88], [35.0, 35.26], [38.0, 38.99], [42.0, 42.2], [44.0, 44.27], [46.0, 46.47], [49.0, 49.2], [51.0, 50.55], [53.0, 54.31], [57.0, 57.21], [60.0, 60.96], [62.0, 61.87], [67.0, 68.13], [69.0, 68.98], [72.0, 72.55], [73.0, 73.01], [74.0, 75.17], [78.0, 100.85], [104.0, 105.16], [108.0, 109.02], [111.0, 111.82], [113.0, 113.85], [115.0, 115.7], [118.0, 118.88], [121.0, 122.05], [124.0, 128.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.76], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 1.07, -0.03, 0.3, 0.7, 0.21, 0.51, 0.69, 0.95, 1.88, 0.26, 0.99, 0.2, 0.27, 0.47, 0.2, -0.45, 1.31, 0.21, 0.96, -0.13, 1.13, -0.02, 0.55, 0.01, 1.17, 22.85, 1.16, 1.02, 0.82, 0.85, 0.7, 0.88, 1.05, 4.26]} \ No newline at end of file diff --git a/annotations_filtered/0B0YWUYWHS8_filtered.json b/annotations_filtered/0B0YWUYWHS8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/0B0YWUYWHS8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/0B1NRC3WYEs_filtered.json b/annotations_filtered/0B1NRC3WYEs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/0B1NRC3WYEs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/0BF9MkmTBjk_filtered.json b/annotations_filtered/0BF9MkmTBjk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3656b2ad9563c19f2170cdf8f3c931b92b3799d --- /dev/null +++ b/annotations_filtered/0BF9MkmTBjk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.13], [21.0, 21.59], [33.0, 33.17], [34.0, 34.7], [36.0, 35.8], [57.0, 59.68], [62.0, 62.24], [69.0, 69.26], [70.0, 70.56], [74.0, 74.55], [78.0, 80.7], [85.0, 85.7], [91.0, 91.05], [93.0, 93.72], [98.0, 99.08]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 34.33, 0.0, 0.0, 0.0, 0.0, 54.56, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 52.22], ["theremin", 4.97], ["crowd", 4.64]], null, null, null, null, null, null, null, null, null], "duration": [1.13, 0.59, 0.17, 0.7, -0.2, 2.68, 0.24, 0.26, 0.56, 0.55, 2.7, 0.7, 0.05, 0.72, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/0BM-Q3BDrkw_filtered.json b/annotations_filtered/0BM-Q3BDrkw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb956dc90f8b98665420d8bb0590d47a902fa352 --- /dev/null +++ b/annotations_filtered/0BM-Q3BDrkw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.53], [14.0, 17.47], [20.0, 22.45], [25.0, 26.59], [28.0, 31.48], [35.0, 37.47], [41.0, 43.48], [46.0, 48.3], [55.0, 57.79], [62.0, 63.37], [67.0, 68.67], [73.0, 73.4], [78.0, 78.97], [83.0, 84.57], [87.0, 87.71], [89.0, 93.24], [95.0, 98.44], [100.0, 103.35], [107.0, 108.97], [113.0, 113.91], [116.0, 117.75], [122.0, 123.9], [128.0, 128.49], [131.0, 133.17], [136.0, 136.9], [146.0, 147.21], [150.0, 151.39], [155.0, 156.93], [160.0, 163.76], [168.0, 170.28], [174.0, 181.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 98.27, 82.43, 0.0, 99.97, 87.55, 95.64, 76.86, 83.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.3, 90.08, 63.96, 0.0, 0.0, 0.0, 0.0, 0.0, 30.8, 0.0, 0.0, 0.0, 0.0, 92.97, 100.0, 92.48], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 75.61], ["carnatic music", 3.11], ["musical instrument", 2.39]], null, null, null, null, null, null, null], "duration": [4.53, 3.47, 2.45, 1.59, 3.48, 2.47, 2.48, 2.3, 2.79, 1.37, 1.67, 0.4, 0.97, 1.57, 0.71, 4.24, 3.44, 3.35, 1.97, 0.91, 1.75, 1.9, 0.49, 2.17, 0.9, 1.21, 1.39, 1.93, 3.76, 2.28, 7.9]} \ No newline at end of file diff --git a/annotations_filtered/0BQZb44R_IY_filtered.json b/annotations_filtered/0BQZb44R_IY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c59482dc08a5f82c443a48be5c852cb3f1b83fdd --- /dev/null +++ b/annotations_filtered/0BQZb44R_IY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 12.95], [14.0, 45.2], [46.0, 62.13], [67.0, 68.32], [69.0, 77.67], [79.0, 106.19], [107.0, 113.31]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.65, 0.0, 69.61, 51.99, 64.07], "audiomae_on_audioset": [null, null, [["music", 77.96], ["harp", 2.04], ["musical instrument", 1.95]], null, null, null, null], "duration": [-0.05, 31.2, 16.13, 1.32, 8.67, 27.19, 6.31]} \ No newline at end of file diff --git a/annotations_filtered/0BXa52qz-kU_filtered.json b/annotations_filtered/0BXa52qz-kU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7f9345d8cdb3691c111bf9aecb551e7d5beaa1b --- /dev/null +++ b/annotations_filtered/0BXa52qz-kU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.03], [26.0, 26.03], [39.0, 39.28], [54.0, 56.03], [58.0, 57.65], [58.0, 63.46], [69.0, 69.36], [76.0, 77.38], [79.0, 83.88], [85.0, 90.91], [93.0, 96.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 44.52, 0.0, 0.0, 100.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 41.82], ["sidetone", 36.58], ["music", 4.78]], null, null, null, null, null], "duration": [1.03, 0.03, 0.28, 2.03, -0.35, 5.46, 0.36, 1.38, 4.88, 5.91, 3.06]} \ No newline at end of file diff --git a/annotations_filtered/0Ba6y1Y8JjU_filtered.json b/annotations_filtered/0Ba6y1Y8JjU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02524e0c737216766f43b3ee9177c3d3b102ce51 --- /dev/null +++ b/annotations_filtered/0Ba6y1Y8JjU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.99], [9.0, 8.88], [10.0, 10.54], [16.0, 18.15], [21.0, 22.32], [24.0, 29.08], [30.0, 31.53], [38.0, 37.77], [38.0, 40.07], [42.0, 42.89], [46.0, 46.57], [47.0, 48.73], [54.0, 55.32], [57.0, 57.97], [59.0, 59.48], [60.0, 61.25], [63.0, 63.8], [66.0, 68.89], [70.0, 90.49], [91.0, 94.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 98.27, 0.0, 68.41, 0.0, 0.0, 60.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.28, 43.61, 45.72], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 27.07], ["mains hum", 22.77], ["music", 20.62]], [["speech", 37.82], ["music", 29.41], ["sidetone", 6.69]]], "duration": [1.99, -0.12, 0.54, 2.15, 1.32, 5.08, 1.53, -0.23, 2.07, 0.89, 0.57, 1.73, 1.32, 0.97, 0.48, 1.25, 0.8, 2.89, 20.49, 3.64]} \ No newline at end of file diff --git a/annotations_filtered/0C-qxjiDP1o_filtered.json b/annotations_filtered/0C-qxjiDP1o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dffedbcd69ffefce09f90b7f4727ce7ac611e9a1 --- /dev/null +++ b/annotations_filtered/0C-qxjiDP1o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.17], [6.0, 14.47], [28.0, 30.45], [40.0, 40.81]], "keep_status": [false, false, false, false], "silence_prob": [98.1, 30.49, 30.57, 0.0], "audiomae_on_audioset": [null, [["music", 68.45], ["synthesizer", 8.6], ["electronic music", 6.37]], [["music", 91.41], ["electronic music", 1.88], ["hip hop music", 1.61]], null], "duration": [3.17, 8.47, 2.45, 0.81]} \ No newline at end of file diff --git a/annotations_filtered/0C4yBk6syOE_filtered.json b/annotations_filtered/0C4yBk6syOE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0287ce0bcd765b2fbdc23ba1598660f2d5a6331a --- /dev/null +++ b/annotations_filtered/0C4yBk6syOE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.6], [15.0, 14.79], [15.0, 15.67], [18.0, 18.54], [19.0, 20.71], [22.0, 22.99], [25.0, 25.3], [30.0, 29.94], [36.0, 36.59], [38.0, 37.79], [43.0, 44.93], [47.0, 48.36], [51.0, 52.2], [56.0, 56.22], [58.0, 61.21], [62.0, 66.51], [79.0, 78.87], [89.0, 89.53], [104.0, 104.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.3, 34.74, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 46.57], ["sidetone", 33.3], ["telephone", 7.37]], [["speech", 79.84], ["telephone", 4.75], ["inside, small room", 2.54]], null, null, null], "duration": [0.6, -0.21, 0.67, 0.54, 1.71, 0.99, 0.3, -0.06, 0.59, -0.21, 1.93, 1.36, 1.2, 0.22, 3.21, 4.51, -0.13, 0.53, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/0C6nvNlVx1A_filtered.json b/annotations_filtered/0C6nvNlVx1A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..636bdee09d529b302448f8cf35f170e790541514 --- /dev/null +++ b/annotations_filtered/0C6nvNlVx1A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.24], [8.0, 8.85], [11.0, 12.87], [17.0, 16.83], [19.0, 19.5], [23.0, 24.31], [26.0, 26.69], [30.0, 29.83], [34.0, 35.34], [37.0, 46.4], [47.0, 47.43], [49.0, 50.08], [52.0, 54.26], [56.0, 56.73], [59.0, 60.76], [63.0, 65.85], [67.0, 74.12], [75.0, 77.8], [78.0, 78.06], [78.0, 78.16], [78.0, 78.44], [78.0, 78.48], [79.0, 80.43], [80.0, 80.6], [81.0, 80.64], [82.0, 92.33], [100.0, 107.22], [108.0, 108.58], [111.0, 111.59], [124.0, 125.39], [128.0, 128.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 35.09, 99.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48, 48.39, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 74.18], ["sidetone", 7.36], ["thunk", 5.44]], null, null, null, null, null, null, [["thunk", 42.85], ["speech", 30.72], ["breaking", 7.36]], null, null, null, null, null, null, null, null, null, [["speech", 30.12], ["arrow", 23.32], ["thunk", 13.16]], null, null, null, null], "duration": [1.24, 0.85, 1.87, -0.17, 0.5, 1.31, 0.69, -0.17, 1.34, 9.4, 0.43, 1.08, 2.26, 0.73, 1.76, 2.85, 7.12, 2.8, 0.06, 0.16, 0.44, 0.48, 1.43, 0.6, -0.36, 10.33, 7.22, 0.58, 0.59, 1.39, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/0CQi2Bb7WE8_filtered.json b/annotations_filtered/0CQi2Bb7WE8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1c82ec0cbff6e2a8f1220d6874fe8e3ff4baa6d --- /dev/null +++ b/annotations_filtered/0CQi2Bb7WE8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 49.0], [50.0, 50.84], [53.0, 53.37], [55.0, 55.31], [67.0, 67.63], [79.0, 83.59], [85.0, 86.48], [87.0, 86.91]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 45.69, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 42.62], ["speech", 33.04], ["musical instrument", 3.76]], null, null], "duration": [0.0, 0.84, 0.37, 0.31, 0.63, 4.59, 1.48, -0.09]} \ No newline at end of file diff --git a/annotations_filtered/0CYdSfhwWVY_filtered.json b/annotations_filtered/0CYdSfhwWVY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94309ccbc1c651cfd99b83dd899e5b7ccb72fc69 --- /dev/null +++ b/annotations_filtered/0CYdSfhwWVY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.77], [10.0, 10.18], [34.0, 35.33], [38.0, 40.04], [43.0, 42.89], [43.0, 45.91], [47.0, 47.28], [48.0, 51.21], [51.0, 52.03], [55.0, 55.07], [58.0, 57.92], [58.0, 58.97], [60.0, 61.64], [62.0, 62.36], [64.0, 65.16], [67.0, 67.53], [71.0, 71.81], [85.0, 84.86], [89.0, 89.6], [91.0, 91.12], [92.0, 93.24], [97.0, 96.96], [98.0, 98.91], [102.0, 102.83], [104.0, 106.32], [109.0, 109.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 75.88, 0.0, 99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.6, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.23, 0.18, 1.33, 2.04, -0.11, 2.91, 0.28, 3.21, 1.03, 0.07, -0.08, 0.97, 1.64, 0.36, 1.16, 0.53, 0.81, -0.14, 0.6, 0.12, 1.24, -0.04, 0.91, 0.83, 2.32, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/0Cufl5Gao98_filtered.json b/annotations_filtered/0Cufl5Gao98_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80b8918f2f6634898b29ed8be3baf975ce39e581 --- /dev/null +++ b/annotations_filtered/0Cufl5Gao98_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.36], [12.0, 12.02], [12.0, 13.83], [15.0, 17.41], [20.0, 22.57], [23.0, 24.21], [31.0, 34.1], [36.0, 37.08], [37.0, 38.01], [40.0, 41.37], [47.0, 48.69], [52.0, 58.18], [59.0, 59.61], [61.0, 61.84], [63.0, 63.98], [69.0, 70.85], [72.0, 72.5], [77.0, 80.33], [82.0, 83.22], [86.0, 88.92], [92.0, 91.93], [95.0, 95.37], [100.0, 101.88], [103.0, 106.03], [108.0, 111.59], [115.0, 116.41], [117.0, 118.1], [119.0, 120.31], [124.0, 124.82], [127.0, 140.58], [141.0, 140.61], [148.0, 149.4], [165.0, 164.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.14, 66.39, 0.0, 70.44, 0.0, 0.0, 0.0, 0.0, 40.82, 0.0, 0.0, 0.0, 0.0, 0.0, 91.64, 0.0, 100.0, 0.0, 0.0, 0.0, 99.95, 98.66, 0.0, 0.0, 0.0, 0.0, 41.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 74.61], ["boing", 4.4], ["music", 2.26]], null, null, null, null, null, null, null, [["applause", 72.44], ["clapping", 5.36], ["music", 4.7]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 81.34], ["applause", 4.44], ["sidetone", 2.31]], null, null, null], "duration": [0.36, 0.02, 1.83, 2.41, 2.57, 1.21, 3.1, 1.08, 1.01, 1.37, 1.69, 6.18, 0.61, 0.84, 0.98, 1.85, 0.5, 3.33, 1.22, 2.92, -0.07, 0.37, 1.88, 3.03, 3.59, 1.41, 1.1, 1.31, 0.82, 13.58, -0.39, 1.4, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/0D35LZ4UBX8_filtered.json b/annotations_filtered/0D35LZ4UBX8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0398e55a6b07868211c72e12f384b3ad4d8b8b3 --- /dev/null +++ b/annotations_filtered/0D35LZ4UBX8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.5], [21.0, 21.24], [29.0, 30.84], [39.0, 40.98], [43.0, 43.66], [45.0, 45.66], [48.0, 50.19], [58.0, 59.07], [59.0, 65.69], [72.0, 72.06], [73.0, 74.55], [78.0, 79.27], [82.0, 82.26], [84.0, 86.63], [87.0, 88.18], [90.0, 91.54], [102.0, 104.6], [123.0, 123.35], [128.0, 133.12], [136.0, 136.63], [138.0, 140.95], [142.0, 152.05], [157.0, 163.29], [166.0, 166.58], [168.0, 170.31]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [30.28, 0.0, 0.0, 0.0, 0.0, 0.0, 31.86, 0.0, 31.99, 0.0, 0.0, 0.0, 0.0, 32.92, 0.0, 0.0, 30.7, 0.0, 31.19, 0.0, 81.35, 31.15, 31.25, 0.0, 34.75], "audiomae_on_audioset": [[["speech", 56.96], ["music", 6.34], ["applause", 5.59]], null, null, null, null, null, [["music", 40.55], ["didgeridoo", 40.25], ["musical instrument", 4.2]], null, [["music", 45.88], ["speech", 16.75], ["didgeridoo", 11.92]], null, null, null, null, [["speech", 69.63], ["music", 11.3], ["tap", 4.7]], null, null, [["speech", 39.13], ["music", 28.38], ["tap", 4.33]], null, [["music", 54.08], ["didgeridoo", 8.95], ["musical instrument", 4.2]], null, null, [["music", 53.4], ["didgeridoo", 35.1], ["musical instrument", 2.81]], [["music", 49.59], ["percussion", 11.05], ["didgeridoo", 10.18]], null, [["speech", 30.73], ["sidetone", 14.5], ["whale vocalization", 6.54]]], "duration": [2.5, 0.24, 1.84, 1.98, 0.66, 0.66, 2.19, 1.07, 6.69, 0.06, 1.55, 1.27, 0.26, 2.63, 1.18, 1.54, 2.6, 0.35, 5.12, 0.63, 2.95, 10.05, 6.29, 0.58, 2.31]} \ No newline at end of file diff --git a/annotations_filtered/0D5EL4HLd3g_filtered.json b/annotations_filtered/0D5EL4HLd3g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3537dd146f2be1ad63ddde4d057c48b0e811d149 --- /dev/null +++ b/annotations_filtered/0D5EL4HLd3g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.97], [22.0, 22.96], [28.0, 29.25], [35.0, 35.48], [42.0, 43.12], [44.0, 44.9], [47.0, 65.21], [66.0, 69.47]], "keep_status": [false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.43, 32.74], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 43.84], ["effects unit", 11.95], ["synthesizer", 10.73]], [["music", 65.68], ["speech", 6.54], ["throbbing", 2.96]]], "duration": [1.97, 0.96, 1.25, 0.48, 1.12, 0.9, 18.21, 3.47]} \ No newline at end of file diff --git a/annotations_filtered/0DFBoLZC3Bw_filtered.json b/annotations_filtered/0DFBoLZC3Bw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b373a4ad43bbd2289337ec578922e49cfb218a3 --- /dev/null +++ b/annotations_filtered/0DFBoLZC3Bw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.93], [8.0, 9.27], [10.0, 11.55], [20.0, 23.65], [28.0, 28.02], [35.0, 39.5], [42.0, 46.21], [48.0, 50.03], [52.0, 51.97], [52.0, 52.1], [76.0, 76.79], [86.0, 89.53], [102.0, 102.47], [103.0, 107.62], [116.0, 116.01], [118.0, 120.72], [128.0, 127.63], [128.0, 128.83], [130.0, 130.22]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 78.21, 0.0, 43.48, 35.54, 36.62, 0.0, 0.0, 0.0, 86.45, 0.0, 92.8, 0.0, 95.64, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 16.52], ["mains hum", 14.93], ["music", 13.72]], [["music", 26.29], ["speech", 24.03], ["trombone", 3.97]], [["music", 47.7], ["trombone", 20.5], ["brass instrument", 7.69]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.93, 1.27, 1.55, 3.65, 0.02, 4.5, 4.21, 2.03, -0.03, 0.1, 0.79, 3.53, 0.47, 4.62, 0.01, 2.72, -0.37, 0.83, 0.22]} \ No newline at end of file diff --git a/annotations_filtered/0Dc0Oj08S7M_filtered.json b/annotations_filtered/0Dc0Oj08S7M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0cb6ba680474072108dc3aa291bfd8a71920090e --- /dev/null +++ b/annotations_filtered/0Dc0Oj08S7M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.02], [17.0, 17.58], [29.0, 30.11], [31.0, 32.02], [37.0, 37.37], [40.0, 40.37], [41.0, 42.43], [44.0, 45.06], [46.0, 49.47], [50.0, 52.2], [58.0, 59.44], [60.0, 61.01], [62.0, 62.55], [64.0, 64.57], [67.0, 69.97], [71.0, 72.1], [87.0, 87.44], [90.0, 94.19], [96.0, 96.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.81, 70.44, 0.0, 0.0, 0.0, 0.0, 75.72, 0.0, 0.0, 58.47, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.02, 0.58, 1.11, 1.02, 0.37, 0.37, 1.43, 1.06, 3.47, 2.2, 1.44, 1.01, 0.55, 0.57, 2.97, 1.1, 0.44, 4.19, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/0DnThxPfhJE_filtered.json b/annotations_filtered/0DnThxPfhJE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ada41c7208a01fa9260827eefcef15ff9d92376d --- /dev/null +++ b/annotations_filtered/0DnThxPfhJE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.45], [16.0, 16.58], [20.0, 21.52], [23.0, 24.66], [26.0, 26.18], [28.0, 28.36], [31.0, 31.7], [32.0, 32.34], [37.0, 39.39], [40.0, 39.82], [44.0, 46.82], [48.0, 49.65], [50.0, 53.72], [54.0, 54.08], [54.0, 54.11], [54.0, 54.35], [55.0, 55.49], [58.0, 59.44], [60.0, 60.72], [61.0, 63.31], [68.0, 67.81], [69.0, 69.16], [70.0, 70.71], [73.0, 75.74], [77.0, 78.33], [81.0, 82.07], [83.0, 89.94], [90.0, 92.42], [95.0, 96.33], [100.0, 102.71], [103.0, 103.55], [107.0, 107.32], [110.0, 110.67], [119.0, 119.8], [121.0, 121.14], [122.0, 121.83], [124.0, 124.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.17, 0.0, 100.0, 0.0, 47.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.51, 0.0, 0.0, 0.0, 44.46, 0.0, 0.0, 77.87, 97.33, 0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 76.92], ["music", 3.75], ["noise", 1.56]], null, null, null, null, null, null, null, null, null, null, [["music", 17.52], ["coin (dropping)", 11.36], ["door", 6.48]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.45, 0.58, 1.52, 1.66, 0.18, 0.36, 0.7, 0.34, 2.39, -0.18, 2.82, 1.65, 3.72, 0.08, 0.11, 0.35, 0.49, 1.44, 0.72, 2.31, -0.19, 0.16, 0.71, 2.74, 1.33, 1.07, 6.94, 2.42, 1.33, 2.71, 0.55, 0.32, 0.67, 0.8, 0.14, -0.17, 0.29]} \ No newline at end of file diff --git a/annotations_filtered/0Dp--gKKMJ8_filtered.json b/annotations_filtered/0Dp--gKKMJ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af2a595e48beb6e3c4da560897488fa944ddb501 --- /dev/null +++ b/annotations_filtered/0Dp--gKKMJ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.53], [17.0, 19.21], [20.0, 21.24], [24.0, 23.63], [25.0, 25.52], [28.0, 28.56], [33.0, 34.05], [36.0, 37.1], [40.0, 43.44], [50.0, 55.12], [59.0, 65.53], [69.0, 70.75], [72.0, 73.47], [75.0, 76.0], [86.0, 86.61], [87.0, 86.98], [94.0, 109.32], [119.0, 126.25], [127.0, 127.13], [128.0, 130.23], [131.0, 132.75]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 37.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.28, 33.76, 32.92, 0.0, 0.0, 0.0, 0.0, 0.0, 33.53, 34.75, 0.0, 32.14, 0.0], "audiomae_on_audioset": [null, [["music", 58.91], ["speech", 9.99], ["musical instrument", 6.86]], null, null, null, null, null, null, [["music", 29.92], ["speech", 14.12], ["gobble", 8.87]], [["frog", 28.86], ["croak", 20.26], ["music", 16.56]], [["music", 80.41], ["musical instrument", 3.0], ["swing music", 1.67]], null, null, null, null, null, [["music", 64.29], ["speech", 10.67], ["didgeridoo", 7.42]], [["music", 55.28], ["speech", 23.93], ["didgeridoo", 2.96]], null, [["animal", 12.72], ["livestock, farm animals, working animals", 12.07], ["speech", 11.72]], null], "duration": [1.53, 2.21, 1.24, -0.37, 0.52, 0.56, 1.05, 1.1, 3.44, 5.12, 6.53, 1.75, 1.47, 1.0, 0.61, -0.02, 15.32, 7.25, 0.13, 2.23, 1.75]} \ No newline at end of file diff --git a/annotations_filtered/0Dy2fo6E_pI_filtered.json b/annotations_filtered/0Dy2fo6E_pI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5e67a1bcf6d8d293c3ad21d507b510c0e2e0dce --- /dev/null +++ b/annotations_filtered/0Dy2fo6E_pI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.59], [12.0, 12.68], [14.0, 31.09], [33.0, 34.86], [36.0, 37.69], [38.0, 38.48], [39.0, 48.86], [51.0, 52.41], [55.0, 55.76], [57.0, 58.53], [60.0, 60.71], [63.0, 63.88], [65.0, 65.94], [67.0, 68.18], [70.0, 69.9], [73.0, 74.28], [77.0, 79.46], [82.0, 84.86], [90.0, 92.31], [93.0, 93.77], [94.0, 100.08], [103.0, 103.62], [105.0, 107.18], [108.0, 110.86], [112.0, 117.39], [124.0, 125.68], [127.0, 133.44], [135.0, 135.85], [137.0, 138.94], [141.0, 142.37], [144.0, 151.6], [158.0, 158.5], [161.0, 170.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [34.51, 0.0, 33.7, 0.0, 0.0, 0.0, 36.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82, 96.89, 51.12, 0.0, 33.6, 0.0, 83.34, 44.23, 32.45, 0.0, 41.98, 0.0, 0.0, 0.0, 35.53, 0.0, 31.05], "audiomae_on_audioset": [[["music", 71.72], ["musical instrument", 3.9], ["synthesizer", 1.92]], null, [["music", 44.78], ["brass instrument", 17.29], ["trombone", 8.91]], null, null, null, [["music", 32.19], ["speech", 29.68], ["foghorn", 8.55]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["breaking", 17.85], ["fly, housefly", 17.32], ["insect", 10.71]], null, null, [["sidetone", 66.11], ["speech", 8.14], ["music", 2.95]], [["breaking", 55.93], ["crushing", 16.13], ["glass", 4.74]], null, [["fly, housefly", 19.27], ["insect", 16.93], ["bee, wasp, etc.", 13.52]], null, null, null, [["mosquito", 53.11], ["fly, housefly", 22.62], ["insect", 7.78]], null, [["music", 27.02], ["fly, housefly", 25.18], ["fart", 9.31]]], "duration": [4.59, 0.68, 17.09, 1.86, 1.69, 0.48, 9.86, 1.41, 0.76, 1.53, 0.71, 0.88, 0.94, 1.18, -0.1, 1.28, 2.46, 2.86, 2.31, 0.77, 6.08, 0.62, 2.18, 2.86, 5.39, 1.68, 6.44, 0.85, 1.94, 1.37, 7.6, 0.5, 9.11]} \ No newline at end of file diff --git a/annotations_filtered/0EC3NTMOF4Q_filtered.json b/annotations_filtered/0EC3NTMOF4Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa41e17e1e6173f9521765cf2c93d3219b0250b6 --- /dev/null +++ b/annotations_filtered/0EC3NTMOF4Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.62], [13.0, 13.24], [16.0, 18.13], [20.0, 22.59], [25.0, 25.83], [27.0, 30.08], [32.0, 33.64], [40.0, 41.47], [46.0, 46.94], [49.0, 50.19], [68.0, 68.23], [72.0, 72.13], [87.0, 88.21], [91.0, 91.35], [94.0, 94.71], [100.0, 100.57], [103.0, 103.91], [107.0, 107.35], [108.0, 109.17], [111.0, 111.54], [114.0, 114.25], [115.0, 116.9], [120.0, 121.86], [125.0, 126.84], [130.0, 129.88], [131.0, 131.31], [134.0, 133.83], [138.0, 139.62], [143.0, 148.29], [150.0, 151.73], [153.0, 154.35], [156.0, 157.05], [160.0, 160.69], [163.0, 167.88], [169.0, 169.4], [170.0, 170.63], [173.0, 176.2]], "keep_status": [true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [41.5, 0.0, 40.12, 38.3, 0.0, 32.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.87, 0.0, 0.0, 0.0, 0.0, 35.24, 0.0, 0.0, 43.28], "audiomae_on_audioset": [[["speech", 48.48], ["music", 10.55], ["whale vocalization", 6.92]], null, [["music", 23.89], ["speech", 13.1], ["didgeridoo", 8.09]], [["noise", 36.07], ["radio", 13.26], ["hum", 11.47]], null, [["noise", 33.69], ["theremin", 22.31], ["music", 18.0]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 30.89], ["music", 20.25], ["hum", 13.06]], null, null, null, null, [["speech", 65.86], ["sidetone", 8.51], ["busy signal", 7.27]], null, null, [["hum", 36.67], ["mains hum", 17.96], ["noise", 12.29]]], "duration": [3.62, 0.24, 2.13, 2.59, 0.83, 3.08, 1.64, 1.47, 0.94, 1.19, 0.23, 0.13, 1.21, 0.35, 0.71, 0.57, 0.91, 0.35, 1.17, 0.54, 0.25, 1.9, 1.86, 1.84, -0.12, 0.31, -0.17, 1.62, 5.29, 1.73, 1.35, 1.05, 0.69, 4.88, 0.4, 0.63, 3.2]} \ No newline at end of file diff --git a/annotations_filtered/0EKDRD2sHI4_filtered.json b/annotations_filtered/0EKDRD2sHI4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf4d24fe69e51d57bca9e14fb314f89edd7fbd96 --- /dev/null +++ b/annotations_filtered/0EKDRD2sHI4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 26.91], [27.0, 29.08], [30.0, 30.99], [33.0, 33.42], [36.0, 37.57], [39.0, 44.78], [45.0, 54.3], [55.0, 72.45]], "keep_status": [false, false, false, false, false, false, false, true], "silence_prob": [33.28, 52.1, 0.0, 0.0, 0.0, 53.1, 81.17, 31.81], "audiomae_on_audioset": [[["music", 66.32], ["throbbing", 8.51], ["hum", 4.63]], null, null, null, null, null, null, [["civil defense siren", 21.16], ["siren", 15.69], ["music", 13.74]]], "duration": [23.91, 2.08, 0.99, 0.42, 1.57, 5.78, 9.3, 17.45]} \ No newline at end of file diff --git a/annotations_filtered/0EQXnRlIbXs_filtered.json b/annotations_filtered/0EQXnRlIbXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2edb2a33f4f082682b502924f779f0acdc7b3345 --- /dev/null +++ b/annotations_filtered/0EQXnRlIbXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 36.36], [38.0, 38.75], [42.0, 42.63], [46.0, 47.14], [48.0, 49.64], [54.0, 59.51], [63.0, 77.8], [79.0, 92.25], [93.0, 109.22], [111.0, 128.65], [132.0, 140.53], [143.0, 143.4], [144.0, 144.91]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [94.07, 0.0, 0.0, 0.0, 0.0, 40.82, 79.07, 67.25, 94.81, 93.6, 99.56, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 34.61], ["music", 22.12], ["boing", 4.45]], null, null, null, null, null, null, null], "duration": [6.36, 0.75, 0.63, 1.14, 1.64, 5.51, 14.8, 13.25, 16.22, 17.65, 8.53, 0.4, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/0ERIepJUdPc_filtered.json b/annotations_filtered/0ERIepJUdPc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d87ddf4417bf94c1ab432cd0c9cce8aee202c2d --- /dev/null +++ b/annotations_filtered/0ERIepJUdPc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.56], [3.0, 3.38], [4.0, 4.33], [12.0, 11.67], [12.0, 25.95], [28.0, 35.04], [38.0, 59.46], [64.0, 64.86], [65.0, 70.97], [73.0, 87.1], [89.0, 91.07], [91.0, 95.45], [96.0, 97.14], [97.0, 97.73], [101.0, 103.74], [108.0, 114.98], [115.0, 122.67], [124.0, 138.62], [141.0, 153.35], [156.0, 182.11], [185.0, 187.44], [189.0, 189.03], [189.0, 191.54]], "keep_status": [false, false, false, false, true, false, true, false, false, false, true, false, false, false, true, true, true, true, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.18, 29.19, 28.78, 0.0, 28.23, 28.27, 29.83, 29.73, 0.0, 0.0, 30.56, 28.23, 28.3, 29.07, 29.66, 28.36, 29.53, 0.0, 28.65], "audiomae_on_audioset": [null, null, null, null, [["music", 32.88], ["hum", 7.61], ["whale vocalization", 5.94]], [["hum", 41.51], ["whale vocalization", 31.45], ["mains hum", 15.34]], [["hum", 33.59], ["music", 14.5], ["mains hum", 14.27]], null, [["music", 57.77], ["hum", 11.61], ["throbbing", 9.91]], [["music", 64.73], ["throbbing", 11.66], ["electronic music", 6.16]], [["vehicle", 20.01], ["eruption", 15.63], ["fixed-wing aircraft, airplane", 8.3]], [["hum", 36.24], ["mains hum", 27.86], ["speech", 18.65]], null, null, [["speech", 14.38], ["music", 14.37], ["hum", 13.37]], [["music", 22.44], ["mains hum", 16.71], ["hum", 15.75]], [["music", 53.65], ["speech", 8.81], ["electronic music", 4.7]], [["hum", 24.67], ["throbbing", 19.28], ["music", 16.43]], [["hum", 35.95], ["throbbing", 33.64], ["mains hum", 16.4]], [["speech", 37.06], ["vehicle", 33.95], ["motorboat, speedboat", 7.56]], [["speech", 25.16], ["hum", 14.62], ["mains hum", 8.7]], null, [["hum", 25.49], ["mains hum", 20.93], ["throbbing", 16.55]]], "duration": [0.56, 0.38, 0.33, -0.33, 13.95, 7.04, 21.46, 0.86, 5.97, 14.1, 2.07, 4.45, 1.14, 0.73, 2.74, 6.98, 7.67, 14.62, 12.35, 26.11, 2.44, 0.03, 2.54]} \ No newline at end of file diff --git a/annotations_filtered/0FNk4sNdPtQ_filtered.json b/annotations_filtered/0FNk4sNdPtQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0f418358bdcecc78797c1ea5f56509a69cfdd92 --- /dev/null +++ b/annotations_filtered/0FNk4sNdPtQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 14.67], [17.0, 17.41], [19.0, 20.14], [27.0, 27.48], [29.0, 35.58], [39.0, 43.46], [45.0, 45.28], [51.0, 50.9], [52.0, 52.86], [55.0, 55.63], [57.0, 57.62], [60.0, 60.76], [62.0, 62.9], [64.0, 66.14], [70.0, 71.42], [75.0, 75.54], [78.0, 78.68], [79.0, 80.15], [82.0, 83.88], [85.0, 86.24], [88.0, 90.46], [96.0, 96.18], [98.0, 101.66], [108.0, 110.76], [116.0, 116.51], [118.0, 122.55]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, true], "silence_prob": [40.71, 0.0, 0.0, 0.0, 39.34, 49.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.71, 0.0, 37.63, 37.59, 0.0, 32.87], "audiomae_on_audioset": [[["music", 40.74], ["hum", 14.47], ["throbbing", 9.45]], null, null, null, [["music", 40.83], ["synthesizer", 17.75], ["musical instrument", 8.24]], [["music", 61.16], ["hum", 7.17], ["synthesizer", 5.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 33.76], ["speech", 25.6], ["electronic music", 3.59]], null, [["music", 43.47], ["drum machine", 15.68], ["speech", 12.22]], [["music", 23.1], ["boing", 11.14], ["synthesizer", 8.22]], null, [["boing", 47.73], ["music", 10.28], ["moo", 7.58]]], "duration": [8.67, 0.41, 1.14, 0.48, 6.58, 4.46, 0.28, -0.1, 0.86, 0.63, 0.62, 0.76, 0.9, 2.14, 1.42, 0.54, 0.68, 1.15, 1.88, 1.24, 2.46, 0.18, 3.66, 2.76, 0.51, 4.55]} \ No newline at end of file diff --git a/annotations_filtered/0FkeGnobtfo_filtered.json b/annotations_filtered/0FkeGnobtfo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b4df31f53fcd5f8e21572a754d717ef9f56f6e6 --- /dev/null +++ b/annotations_filtered/0FkeGnobtfo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.71], [16.0, 33.62], [34.0, 57.0], [61.0, 61.32], [62.0, 124.21], [126.0, 126.77]], "keep_status": [false, true, true, false, false, false], "silence_prob": [0.0, 38.76, 40.12, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 48.6], ["mains hum", 14.97], ["throbbing", 6.37]], [["music", 49.24], ["ambient music", 5.74], ["foghorn", 2.9]], null, null, null], "duration": [1.71, 17.62, 23.0, 0.32, 62.21, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/0GCwhGQEZ90_filtered.json b/annotations_filtered/0GCwhGQEZ90_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..924bfe2902068cc1d008769ed532415a88491daa --- /dev/null +++ b/annotations_filtered/0GCwhGQEZ90_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.54], [6.0, 29.76], [32.0, 34.21], [35.0, 40.88], [45.0, 46.62], [49.0, 51.16], [55.0, 54.92], [61.0, 61.74], [75.0, 75.37], [80.0, 86.71], [94.0, 95.22], [99.0, 99.52], [101.0, 101.31], [105.0, 105.29], [109.0, 108.82], [152.0, 158.58], [160.0, 161.05], [171.0, 174.29], [183.0, 185.38], [186.0, 187.47], [190.0, 190.83], [193.0, 194.26], [194.0, 197.5], [200.0, 201.77], [211.0, 213.07], [213.0, 213.24]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.86, 98.66, 31.94, 0.0, 32.78, 0.0, 0.0, 0.0, 64.41, 0.0, 0.0, 0.0, 0.0, 0.0, 29.5, 0.0, 29.98, 94.37, 0.0, 0.0, 0.0, 40.81, 0.0, 29.57, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 19.37], ["livestock, farm animals, working animals", 12.18], ["animal", 8.52]], null, [["livestock, farm animals, working animals", 57.83], ["cattle, bovinae", 26.82], ["moo", 10.14]], null, null, null, null, null, null, null, null, null, [["speech", 25.82], ["sidetone", 12.83], ["throbbing", 7.7]], null, [["music", 37.67], ["speech", 10.59], ["throbbing", 4.47]], null, null, null, null, [["throbbing", 30.67], ["hum", 22.03], ["music", 17.87]], null, [["groan", 51.09], ["music", 14.25], ["speech", 11.85]], null], "duration": [1.54, 23.76, 2.21, 5.88, 1.62, 2.16, -0.08, 0.74, 0.37, 6.71, 1.22, 0.52, 0.31, 0.29, -0.18, 6.58, 1.05, 3.29, 2.38, 1.47, 0.83, 1.26, 3.5, 1.77, 2.07, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/0GEynXlmNYA_filtered.json b/annotations_filtered/0GEynXlmNYA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ecbd767535826cb61cf350e6df454b831646b376 --- /dev/null +++ b/annotations_filtered/0GEynXlmNYA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.96], [15.0, 17.39], [20.0, 20.14], [21.0, 21.37], [25.0, 24.7], [28.0, 28.88], [36.0, 36.64], [39.0, 39.04], [46.0, 46.8], [51.0, 51.33], [53.0, 54.8], [58.0, 58.41], [63.0, 63.54], [79.0, 79.59], [84.0, 84.64], [96.0, 97.46], [104.0, 105.26], [126.0, 126.89], [128.0, 130.98]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 35.49, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.05], "audiomae_on_audioset": [null, [["cattle, bovinae", 15.81], ["moo", 13.28], ["music", 11.38]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 50.58], ["electronic music", 2.73], ["theremin", 2.42]]], "duration": [1.96, 2.39, 0.14, 0.37, -0.3, 0.88, 0.64, 0.04, 0.8, 0.33, 1.8, 0.41, 0.54, 0.59, 0.64, 1.46, 1.26, 0.89, 2.98]} \ No newline at end of file diff --git a/annotations_filtered/0GGOfY9uE1Y_filtered.json b/annotations_filtered/0GGOfY9uE1Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc01e90587164c1c0cc0ccb7a9487e82147c4a85 --- /dev/null +++ b/annotations_filtered/0GGOfY9uE1Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.18], [9.0, 10.25], [16.0, 17.0], [18.0, 19.16], [29.0, 30.37], [34.0, 33.62], [35.0, 35.19], [39.0, 38.67], [47.0, 47.36], [60.0, 61.47], [68.0, 67.88], [78.0, 77.85], [83.0, 82.86], [86.0, 87.3], [88.0, 88.45], [94.0, 95.27], [96.0, 96.75], [98.0, 98.88], [101.0, 101.28], [103.0, 105.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["croak", 23.14], ["frog", 18.5], ["fly, housefly", 11.41]]], "duration": [1.18, 1.25, 1.0, 1.16, 1.37, -0.38, 0.19, -0.33, 0.36, 1.47, -0.12, -0.15, -0.14, 1.3, 0.45, 1.27, 0.75, 0.88, 0.28, 2.49]} \ No newline at end of file diff --git a/annotations_filtered/0GYwcr3RD_k_filtered.json b/annotations_filtered/0GYwcr3RD_k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12ce1fd7629caf54691c54fff35047b4a52fb5d4 --- /dev/null +++ b/annotations_filtered/0GYwcr3RD_k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.05], [14.0, 14.49], [15.0, 17.32], [18.0, 19.43], [21.0, 21.76], [23.0, 24.75], [28.0, 28.75], [30.0, 31.11], [35.0, 35.97], [37.0, 38.18], [39.0, 41.03], [50.0, 50.53], [52.0, 52.57], [59.0, 59.46], [60.0, 61.06], [62.0, 63.39], [65.0, 65.94], [67.0, 68.32], [70.0, 72.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 61.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.05, 0.49, 2.32, 1.43, 0.76, 1.75, 0.75, 1.11, 0.97, 1.18, 2.03, 0.53, 0.57, 0.46, 1.06, 1.39, 0.94, 1.32, 2.87]} \ No newline at end of file diff --git a/annotations_filtered/0GiMAf9q3hQ_filtered.json b/annotations_filtered/0GiMAf9q3hQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d13ef05e03b023e7562bd654c0ea26c1ec658f3 --- /dev/null +++ b/annotations_filtered/0GiMAf9q3hQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.16], [10.0, 12.01], [13.0, 14.47], [15.0, 16.26], [18.0, 18.01], [23.0, 24.31], [26.0, 27.65], [37.0, 37.23], [42.0, 48.19], [56.0, 57.21], [58.0, 59.41], [65.0, 65.87], [67.0, 67.54], [74.0, 75.49], [77.0, 90.14]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 30.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.62, 0.0, 0.0, 0.0, 0.0, 0.0, 29.64], "audiomae_on_audioset": [null, [["music", 29.06], ["livestock, farm animals, working animals", 14.39], ["moo", 11.68]], null, null, null, null, null, null, [["music", 56.8], ["musical instrument", 7.3], ["guitar", 3.98]], null, null, null, null, null, [["music", 75.08], ["musical instrument", 3.33], ["didgeridoo", 1.66]]], "duration": [0.16, 2.01, 1.47, 1.26, 0.01, 1.31, 1.65, 0.23, 6.19, 1.21, 1.41, 0.87, 0.54, 1.49, 13.14]} \ No newline at end of file diff --git a/annotations_filtered/0Gq5R5ffrtE_filtered.json b/annotations_filtered/0Gq5R5ffrtE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/0Gq5R5ffrtE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/0H8EmzfVSbg_filtered.json b/annotations_filtered/0H8EmzfVSbg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01b1ae79a6cbc2f0249f57449b4fe601cc6912dd --- /dev/null +++ b/annotations_filtered/0H8EmzfVSbg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.34], [8.0, 9.49], [20.0, 20.39], [23.0, 23.28], [37.0, 37.23], [38.0, 45.96], [46.0, 51.41], [53.0, 54.43], [56.0, 57.35], [74.0, 73.84], [83.0, 88.32], [92.0, 93.68], [94.0, 103.25], [105.0, 106.78], [118.0, 117.86], [123.0, 123.9], [124.0, 125.25], [126.0, 129.83], [130.0, 130.59], [131.0, 131.53], [135.0, 135.62], [136.0, 135.65], [136.0, 137.3], [138.0, 138.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.94, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.34, 1.49, 0.39, 0.28, 0.23, 7.96, 5.41, 1.43, 1.35, -0.16, 5.32, 1.68, 9.25, 1.78, -0.14, 0.9, 1.25, 3.83, 0.59, 0.53, 0.62, -0.35, 1.3, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/0I1Vh-Ru1z0_filtered.json b/annotations_filtered/0I1Vh-Ru1z0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..411c2a8eb2570a66ae02786f2843236858656d9a --- /dev/null +++ b/annotations_filtered/0I1Vh-Ru1z0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 7.13], [10.0, 15.48], [18.0, 18.57], [25.0, 25.29], [33.0, 32.91], [36.0, 35.94], [41.0, 41.32], [42.0, 44.34], [45.0, 47.21], [48.0, 50.65], [52.0, 53.52], [55.0, 55.19], [56.0, 56.78], [58.0, 58.53], [61.0, 61.79], [63.0, 63.31], [67.0, 68.07], [74.0, 73.97], [76.0, 78.92], [79.0, 82.38], [83.0, 83.32], [85.0, 85.51], [87.0, 87.1], [89.0, 90.44], [91.0, 91.54], [95.0, 95.98], [97.0, 97.39], [98.0, 98.93], [102.0, 102.9], [104.0, 104.9], [107.0, 113.19], [115.0, 115.2], [117.0, 121.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [99.88, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.16, 99.99, 99.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.03, 0.0, 43.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 63.1], ["didgeridoo", 8.41], ["musical instrument", 5.05]], null, [["music", 17.28], ["mains hum", 15.73], ["didgeridoo", 11.53]]], "duration": [6.13, 5.48, 0.57, 0.29, -0.09, -0.06, 0.32, 2.34, 2.21, 2.65, 1.52, 0.19, 0.78, 0.53, 0.79, 0.31, 1.07, -0.03, 2.92, 3.38, 0.32, 0.51, 0.1, 1.44, 0.54, 0.98, 0.39, 0.93, 0.9, 0.9, 6.19, 0.2, 4.93]} \ No newline at end of file diff --git a/annotations_filtered/0I7GjbhDYtM_filtered.json b/annotations_filtered/0I7GjbhDYtM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3417ac2a22fea592e345f78c032b77adee8fc665 --- /dev/null +++ b/annotations_filtered/0I7GjbhDYtM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.48], [6.0, 7.4], [10.0, 12.31], [16.0, 17.85], [19.0, 24.31], [25.0, 25.41], [29.0, 30.23], [30.0, 31.35], [35.0, 35.83], [38.0, 38.45], [39.0, 39.45], [41.0, 41.5], [42.0, 46.11], [49.0, 48.84], [52.0, 54.14], [55.0, 56.91], [59.0, 66.56], [67.0, 71.12], [74.0, 75.42], [78.0, 79.03], [80.0, 80.49], [81.0, 81.14], [82.0, 82.22], [83.0, 83.15], [84.0, 84.82], [88.0, 88.72], [91.0, 91.23], [92.0, 92.87], [93.0, 95.62], [96.0, 95.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 80.64, 0.0, 90.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 100.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.36, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 1.4, 2.31, 1.85, 5.31, 0.41, 1.23, 1.35, 0.83, 0.45, 0.45, 0.5, 4.11, -0.16, 2.14, 1.91, 7.56, 4.12, 1.42, 1.03, 0.49, 0.14, 0.22, 0.15, 0.82, 0.72, 0.23, 0.87, 2.62, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/0IP7ihJrrqw_filtered.json b/annotations_filtered/0IP7ihJrrqw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c2b29650a180d997ad0ced2c8e3c97a24d82722 --- /dev/null +++ b/annotations_filtered/0IP7ihJrrqw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.85], [6.0, 9.68], [10.0, 11.08], [12.0, 12.11], [13.0, 13.68], [14.0, 14.44], [15.0, 17.12], [24.0, 26.42], [27.0, 28.68], [31.0, 31.83], [38.0, 38.72], [42.0, 50.06], [59.0, 59.05], [64.0, 64.05], [67.0, 68.52], [84.0, 84.16], [86.0, 85.77], [88.0, 88.05], [97.0, 97.46], [99.0, 99.4], [108.0, 108.92], [118.0, 118.72]], "keep_status": [true, true, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.23, 44.55, 0.0, 0.0, 0.0, 0.0, 41.44, 99.21, 0.0, 0.0, 0.0, 40.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["moo", 29.35], ["livestock, farm animals, working animals", 20.07], ["cattle, bovinae", 18.2]], [["speech", 18.77], ["whale vocalization", 11.87], ["croak", 6.73]], null, null, null, null, [["frog", 27.7], ["fowl", 20.14], ["speech", 12.67]], null, null, null, null, [["music", 30.79], ["brass instrument", 25.15], ["trombone", 11.13]], null, null, null, null, null, null, null, null, null, null], "duration": [2.85, 3.68, 1.08, 0.11, 0.68, 0.44, 2.12, 2.42, 1.68, 0.83, 0.72, 8.06, 0.05, 0.05, 1.52, 0.16, -0.23, 0.05, 0.46, 0.4, 0.92, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/0IQgjMYWVGc_filtered.json b/annotations_filtered/0IQgjMYWVGc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..455ccdd17c81d6a50568781b8d5370d05cc3573f --- /dev/null +++ b/annotations_filtered/0IQgjMYWVGc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 19.8], [24.0, 26.54], [28.0, 28.85], [31.0, 55.65], [57.0, 59.07], [60.0, 61.28], [63.0, 80.27], [97.0, 97.31], [98.0, 98.64], [100.0, 101.63], [103.0, 103.94], [105.0, 106.96], [107.0, 107.72], [109.0, 108.89], [111.0, 119.8], [124.0, 138.3], [141.0, 143.29]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [41.05, 52.68, 0.0, 35.08, 100.0, 0.0, 31.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.18, 46.54, 42.48], "audiomae_on_audioset": [[["music", 41.07], ["hum", 8.2], ["noise", 5.53]], null, null, [["music", 46.64], ["thunk", 10.38], ["hum", 10.26]], null, null, [["music", 42.31], ["hum", 17.83], ["mains hum", 11.14]], null, null, null, null, null, null, null, [["hum", 54.29], ["throbbing", 16.04], ["music", 13.94]], [["music", 37.02], ["hum", 15.31], ["throbbing", 10.28]], [["music", 40.5], ["hum", 14.54], ["throbbing", 13.53]]], "duration": [9.8, 2.54, 0.85, 24.65, 2.07, 1.28, 17.27, 0.31, 0.64, 1.63, 0.94, 1.96, 0.72, -0.11, 8.8, 14.3, 2.29]} \ No newline at end of file diff --git a/annotations_filtered/0IVFxW63RxU_filtered.json b/annotations_filtered/0IVFxW63RxU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0c797d2b956fc2ec325dc5ec3b27aa951fd3df8 --- /dev/null +++ b/annotations_filtered/0IVFxW63RxU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 22.81], [26.0, 27.09]], "keep_status": [true, false], "silence_prob": [30.35, 0.0], "audiomae_on_audioset": [[["music", 32.79], ["throbbing", 25.28], ["hum", 10.5]], null], "duration": [3.81, 1.09]} \ No newline at end of file diff --git a/annotations_filtered/0IWdfqsImMU_filtered.json b/annotations_filtered/0IWdfqsImMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36c6ea44df5ce42ec11a676bb43c27c720a1c9c8 --- /dev/null +++ b/annotations_filtered/0IWdfqsImMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 15.45], [19.0, 25.49], [29.0, 29.32], [33.0, 37.03], [40.0, 41.13]], "keep_status": [false, true, false, true, false], "silence_prob": [31.49, 40.45, 0.0, 30.97, 0.0], "audiomae_on_audioset": [[["speech", 48.13], ["music", 18.63], ["sidetone", 8.38]], [["music", 47.89], ["cattle, bovinae", 3.52], ["livestock, farm animals, working animals", 3.49]], null, [["music", 40.9], ["musical instrument", 7.29], ["noise", 3.86]], null], "duration": [14.45, 6.49, 0.32, 4.03, 1.13]} \ No newline at end of file diff --git a/annotations_filtered/0IWmniYe7aI_filtered.json b/annotations_filtered/0IWmniYe7aI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7d5eff34b7cad92b07a0975ccb688ee2e6f0f7b --- /dev/null +++ b/annotations_filtered/0IWmniYe7aI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.95], [15.0, 27.99], [30.0, 30.75], [31.0, 31.48], [32.0, 40.98], [42.0, 47.85], [50.0, 50.84], [55.0, 54.92], [58.0, 60.15], [66.0, 66.46], [68.0, 69.11], [79.0, 79.46], [81.0, 81.4], [83.0, 84.21], [86.0, 87.03], [89.0, 89.45], [90.0, 90.69], [93.0, 97.24], [98.0, 98.79], [104.0, 112.53], [114.0, 114.54], [120.0, 120.53], [124.0, 126.25]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 31.02, 0.0, 0.0, 31.01, 31.77, 0.0, 0.0, 75.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.0, 0.0, 35.39, 0.0, 0.0, 39.27], "audiomae_on_audioset": [null, [["music", 62.39], ["throbbing", 8.19], ["electronic music", 5.14]], null, null, [["fly, housefly", 36.07], ["mosquito", 31.11], ["insect", 15.92]], [["music", 59.25], ["mains hum", 4.97], ["hum", 3.78]], null, null, null, null, null, null, null, null, null, null, null, [["mosquito", 24.01], ["music", 21.82], ["fly, housefly", 16.28]], null, [["music", 67.78], ["synthesizer", 7.67], ["didgeridoo", 2.47]], null, null, [["music", 62.75], ["synthesizer", 10.52], ["musical instrument", 8.18]]], "duration": [0.95, 12.99, 0.75, 0.48, 8.98, 5.85, 0.84, -0.08, 2.15, 0.46, 1.11, 0.46, 0.4, 1.21, 1.03, 0.45, 0.69, 4.24, 0.79, 8.53, 0.54, 0.53, 2.25]} \ No newline at end of file diff --git a/annotations_filtered/0IiCOhajpS8_filtered.json b/annotations_filtered/0IiCOhajpS8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6183628173a505683e96da0afc8af6b10104a0ef --- /dev/null +++ b/annotations_filtered/0IiCOhajpS8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.93], [9.0, 10.72], [11.0, 42.09], [43.0, 45.54], [47.0, 46.85], [50.0, 57.18], [58.0, 61.26], [63.0, 73.16], [74.0, 78.38], [79.0, 118.74], [120.0, 152.51]], "keep_status": [false, false, false, true, false, true, false, false, true, false, false], "silence_prob": [94.37, 0.0, 0.0, 34.8, 0.0, 37.06, 39.66, 41.93, 44.37, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 37.06], ["theremin", 3.76], ["speech", 3.48]], null, [["music", 54.68], ["percussion", 3.63], ["musical instrument", 2.79]], [["music", 62.03], ["musical instrument", 6.19], ["didgeridoo", 5.9]], [["music", 66.94], ["musical instrument", 6.19], ["theremin", 5.56]], [["speech", 28.89], ["music", 23.87], ["singing bowl", 6.21]], null, null], "duration": [3.93, 1.72, 31.09, 2.54, -0.15, 7.18, 3.26, 10.16, 4.38, 39.74, 32.51]} \ No newline at end of file diff --git a/annotations_filtered/0IuOpt3p3WE_filtered.json b/annotations_filtered/0IuOpt3p3WE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f5cdf30fca4852225b43228cc5697aed30498a2 --- /dev/null +++ b/annotations_filtered/0IuOpt3p3WE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.51], [19.0, 19.08], [34.0, 33.89], [35.0, 35.67], [37.0, 39.12], [41.0, 42.26], [44.0, 44.46], [51.0, 53.57], [57.0, 57.3], [58.0, 58.18], [59.0, 59.61], [60.0, 60.67], [61.0, 74.41], [81.0, 82.68], [85.0, 100.82], [101.0, 101.44], [101.0, 101.58], [102.0, 101.82], [102.0, 101.85], [102.0, 143.02], [146.0, 146.75], [148.0, 148.36], [159.0, 160.1], [168.0, 168.52], [170.0, 170.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 77.2, 0.0, 0.0, 36.97, 0.0, 0.0, 0.0, 0.0, 29.53, 0.0, 29.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 57.74], ["music", 12.85], ["speech synthesizer", 2.36]], null, null, null, null, [["music", 88.1], ["electronic music", 1.44], ["male singing", 0.89]], null, [["music", 85.1], ["electronic music", 1.52], ["funny music", 1.46]], null, null, null, null, null, null, null, null, null, null], "duration": [1.51, 0.08, -0.11, 0.67, 2.12, 1.26, 0.46, 2.57, 0.3, 0.18, 0.61, 0.67, 13.41, 1.68, 15.82, 0.44, 0.58, -0.18, -0.15, 41.02, 0.75, 0.36, 1.1, 0.52, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/0IxeTLiovq8_filtered.json b/annotations_filtered/0IxeTLiovq8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..562000581d6a9e9cd4576a8e0ae03318d71cd231 --- /dev/null +++ b/annotations_filtered/0IxeTLiovq8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.74], [14.0, 15.99], [19.0, 37.13], [43.0, 76.22], [79.0, 85.13]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.02, 0.0, 30.3], "audiomae_on_audioset": [null, null, [["music", 62.06], ["livestock, farm animals, working animals", 13.1], ["cattle, bovinae", 6.39]], null, [["music", 74.48], ["middle eastern music", 3.45], ["musical instrument", 2.6]]], "duration": [0.74, 1.99, 18.13, 33.22, 6.13]} \ No newline at end of file diff --git a/annotations_filtered/0IyuK069I-w_filtered.json b/annotations_filtered/0IyuK069I-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6905d2d31e09795c4a80111243d3ec9b986052af --- /dev/null +++ b/annotations_filtered/0IyuK069I-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.67], [18.0, 18.89], [30.0, 30.54], [40.0, 40.66], [63.0, 65.75], [90.0, 90.68], [91.0, 90.86], [91.0, 92.4], [107.0, 108.85], [134.0, 134.5], [139.0, 141.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 51.34, 0.0, 0.0, 0.0, 0.0, 0.0, 34.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 31.9], ["whack, thwack", 6.26], ["hum", 5.38]]], "duration": [0.67, 0.89, 0.54, 0.66, 2.75, 0.68, -0.14, 1.4, 1.85, 0.5, 2.17]} \ No newline at end of file diff --git a/annotations_filtered/0J4K03Owgwc_filtered.json b/annotations_filtered/0J4K03Owgwc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/0J4K03Owgwc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/0JBU9hgQ_T0_filtered.json b/annotations_filtered/0JBU9hgQ_T0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a196c69a6e0af081b1e511f5eb40888a035ff9d --- /dev/null +++ b/annotations_filtered/0JBU9hgQ_T0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 20.29], [27.0, 30.1], [30.0, 30.7], [42.0, 50.89], [52.0, 67.74], [69.0, 80.49], [82.0, 83.4], [86.0, 93.29], [95.0, 105.22], [106.0, 107.37], [109.0, 109.38], [110.0, 110.47], [111.0, 121.12], [124.0, 124.95], [126.0, 127.53], [130.0, 130.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [44.09, 36.72, 0.0, 33.57, 32.53, 33.09, 0.0, 30.73, 30.81, 0.0, 0.0, 0.0, 36.58, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["mains hum", 64.85], ["hum", 27.85], ["buzz", 1.01]], [["music", 35.56], ["speech", 28.83], ["didgeridoo", 7.29]], null, [["speech", 56.0], ["music", 25.93], ["didgeridoo", 3.61]], [["speech", 35.22], ["music", 30.81], ["whack, thwack", 9.21]], [["speech", 47.87], ["music", 35.62], ["musical instrument", 1.55]], null, [["music", 51.17], ["speech", 19.38], ["synthesizer", 9.1]], [["music", 48.74], ["speech", 13.25], ["didgeridoo", 10.18]], null, null, null, [["speech", 26.83], ["hum", 24.15], ["music", 17.78]], null, null, null], "duration": [15.29, 3.1, 0.7, 8.89, 15.74, 11.49, 1.4, 7.29, 10.22, 1.37, 0.38, 0.47, 10.12, 0.95, 1.53, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/0JDyXQvCsOM_filtered.json b/annotations_filtered/0JDyXQvCsOM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42264d28c82022920fe6af3c9dc55fb53078fc03 --- /dev/null +++ b/annotations_filtered/0JDyXQvCsOM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.85], [6.0, 17.86], [20.0, 33.08], [33.0, 33.4], [33.0, 33.44], [33.0, 34.25], [34.0, 34.45], [34.0, 56.79], [68.0, 68.28], [69.0, 69.09], [76.0, 76.98], [95.0, 95.5], [110.0, 111.3], [112.0, 112.02], [112.0, 114.35], [117.0, 118.34], [119.0, 121.56], [122.0, 123.13], [124.0, 127.63], [129.0, 129.93], [131.0, 131.4], [135.0, 135.8], [136.0, 141.25]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.64, 92.64, 0.0, 0.0, 0.0, 0.0, 41.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.89, 0.0, 98.59, 0.0, 87.37, 0.0, 0.0, 0.0, 98.93], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 36.57], ["livestock, farm animals, working animals", 22.62], ["cattle, bovinae", 7.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.85, 11.86, 13.08, 0.4, 0.44, 1.25, 0.45, 22.79, 0.28, 0.09, 0.98, 0.5, 1.3, 0.02, 2.35, 1.34, 2.56, 1.13, 3.63, 0.93, 0.4, 0.8, 5.25]} \ No newline at end of file diff --git a/annotations_filtered/0JVZ0bE8hpk_filtered.json b/annotations_filtered/0JVZ0bE8hpk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bc978756a4bf74100179e1cb8e315f0ebb3fa3f --- /dev/null +++ b/annotations_filtered/0JVZ0bE8hpk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.97], [6.0, 15.04], [17.0, 33.62], [36.0, 59.05], [60.0, 75.86], [82.0, 91.25], [96.0, 101.49], [102.0, 102.71], [104.0, 105.16], [107.0, 107.89], [109.0, 109.88]], "keep_status": [false, true, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 32.24, 32.64, 32.44, 31.82, 32.06, 31.93, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 35.99], ["didgeridoo", 11.34], ["speech", 6.64]], [["music", 36.68], ["speech", 26.41], ["synthesizer", 9.67]], [["music", 28.65], ["echo", 16.57], ["effects unit", 6.85]], [["music", 57.02], ["hum", 7.49], ["didgeridoo", 6.0]], [["music", 69.93], ["musical instrument", 7.74], ["effects unit", 3.03]], [["music", 51.4], ["hum", 13.99], ["throbbing", 4.61]], null, null, null, null], "duration": [1.97, 9.04, 16.62, 23.05, 15.86, 9.25, 5.49, 0.71, 1.16, 0.89, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/0JXwzlRcYWk_filtered.json b/annotations_filtered/0JXwzlRcYWk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89da491a77f03b4acd62acc57987e7ff4d4ac443 --- /dev/null +++ b/annotations_filtered/0JXwzlRcYWk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 18.64], [21.0, 21.73], [23.0, 24.21], [29.0, 29.29], [34.0, 34.18], [35.0, 35.48], [37.0, 37.79], [39.0, 39.5], [42.0, 43.12], [44.0, 45.77], [46.0, 46.67], [48.0, 48.64], [51.0, 63.81], [65.0, 65.94], [67.0, 67.63], [71.0, 72.37], [75.0, 75.71], [78.0, 79.03], [80.0, 80.7], [81.0, 82.34], [83.0, 83.67], [84.0, 86.19], [87.0, 87.32], [91.0, 91.59], [92.0, 92.25], [95.0, 96.36], [103.0, 104.52], [111.0, 111.15], [112.0, 113.75], [115.0, 114.84], [119.0, 118.74], [119.0, 119.06], [122.0, 123.25], [125.0, 125.74], [130.0, 132.8], [135.0, 135.33], [137.0, 137.61], [138.0, 139.51], [140.0, 140.39], [142.0, 142.72], [145.0, 146.3], [147.0, 147.46], [149.0, 149.79], [151.0, 151.77], [157.0, 157.57], [158.0, 158.63]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [46.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 16.02], ["music", 11.98], ["sine wave", 10.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.64, 0.73, 1.21, 0.29, 0.18, 0.48, 0.79, 0.5, 1.12, 1.77, 0.67, 0.64, 12.81, 0.94, 0.63, 1.37, 0.71, 1.03, 0.7, 1.34, 0.67, 2.19, 0.32, 0.59, 0.25, 1.36, 1.52, 0.15, 1.75, -0.16, -0.26, 0.06, 1.25, 0.74, 2.8, 0.33, 0.61, 1.51, 0.39, 0.72, 1.3, 0.46, 0.79, 0.77, 0.57, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/0J_lTFS0ouM_filtered.json b/annotations_filtered/0J_lTFS0ouM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc5aa66087276e3052ec39ec81b9cfcd24d744fc --- /dev/null +++ b/annotations_filtered/0J_lTFS0ouM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.16], [8.0, 10.81], [12.0, 18.17], [19.0, 37.35], [44.0, 49.4], [51.0, 51.92], [53.0, 53.49], [55.0, 60.37], [62.0, 63.46], [65.0, 65.91], [68.0, 69.67], [70.0, 77.48], [78.0, 78.61], [79.0, 100.52], [102.0, 104.33], [105.0, 106.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 84.98, 99.21, 43.2, 93.76, 0.0, 0.0, 99.52, 0.0, 0.0, 0.0, 58.47, 0.0, 56.78, 65.44, 0.0], "audiomae_on_audioset": [null, null, null, [["insect", 28.93], ["fly, housefly", 27.19], ["bee, wasp, etc.", 27.18]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 2.81, 6.17, 18.35, 5.4, 0.92, 0.49, 5.37, 1.46, 0.91, 1.67, 7.48, 0.61, 21.52, 2.33, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/0JmETteiVzo_filtered.json b/annotations_filtered/0JmETteiVzo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..242f22210d6f70f9094f6f777352b2d856f6b107 --- /dev/null +++ b/annotations_filtered/0JmETteiVzo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.38], [23.0, 24.92], [50.0, 50.3], [52.0, 52.79], [55.0, 57.7], [59.0, 61.64], [62.0, 64.74], [67.0, 70.93], [84.0, 85.36], [88.0, 87.83], [89.0, 90.64], [93.0, 93.12], [99.0, 102.64], [105.0, 106.76], [112.0, 113.7], [115.0, 114.96], [117.0, 118.39], [120.0, 119.79], [122.0, 122.69], [124.0, 123.96], [126.0, 126.54], [132.0, 132.56]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [60.23, 0.0, 0.0, 0.0, 58.47, 74.29, 34.9, 46.09, 0.0, 0.0, 0.0, 0.0, 37.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 26.46], ["fly, housefly", 17.34], ["sidetone", 14.88]], [["speech", 28.33], ["fly, housefly", 23.34], ["insect", 12.54]], null, null, null, null, [["music", 15.27], ["hum", 8.77], ["fly, housefly", 7.55]], null, null, null, null, null, null, null, null, null], "duration": [3.38, 1.92, 0.3, 0.79, 2.7, 2.64, 2.74, 3.93, 1.36, -0.17, 1.64, 0.12, 3.64, 1.76, 1.7, -0.04, 1.39, -0.21, 0.69, -0.04, 0.54, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/0JoIRmQW2es_filtered.json b/annotations_filtered/0JoIRmQW2es_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9cc445def16c1b7d75aa01abdc5dcd6538fe625 --- /dev/null +++ b/annotations_filtered/0JoIRmQW2es_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.24], [8.0, 8.5], [9.0, 9.96], [16.0, 16.66], [22.0, 22.72], [25.0, 25.54], [26.0, 26.28], [27.0, 27.18], [30.0, 30.4], [33.0, 33.49], [35.0, 35.72], [38.0, 38.15], [44.0, 44.37], [44.0, 45.1], [47.0, 47.73], [58.0, 58.48], [61.0, 60.66], [61.0, 61.45], [63.0, 64.15], [65.0, 65.77], [68.0, 68.81], [71.0, 70.71], [74.0, 74.14], [82.0, 83.35], [85.0, 84.75], [86.0, 86.46], [89.0, 89.14], [90.0, 89.9], [93.0, 94.04], [101.0, 101.56], [116.0, 117.56], [120.0, 121.51], [123.0, 124.04], [125.0, 124.83], [136.0, 136.14], [136.0, 136.39], [142.0, 142.01], [151.0, 157.69], [166.0, 165.99], [166.0, 167.29], [168.0, 168.64], [171.0, 171.69], [173.0, 173.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.39, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 17.4], ["music", 15.22], ["animal", 3.03]], null, null, null, null, null], "duration": [0.24, 0.5, 0.96, 0.66, 0.72, 0.54, 0.28, 0.18, 0.4, 0.49, 0.72, 0.15, 0.37, 1.1, 0.73, 0.48, -0.34, 0.45, 1.15, 0.77, 0.81, -0.29, 0.14, 1.35, -0.25, 0.46, 0.14, -0.1, 1.04, 0.56, 1.56, 1.51, 1.04, -0.17, 0.14, 0.39, 0.01, 6.69, -0.01, 1.29, 0.64, 0.69, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/0K6bVf4ra1w_filtered.json b/annotations_filtered/0K6bVf4ra1w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7bcb445c7d9e283a5c8aee3e12cf4bfe7e48dab7 --- /dev/null +++ b/annotations_filtered/0K6bVf4ra1w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 29.81], [34.0, 34.18], [35.0, 38.57], [48.0, 94.58], [95.0, 112.77], [114.0, 114.0]], "keep_status": [true, false, false, false, false, false], "silence_prob": [29.85, 0.0, 30.03, 0.0, 30.18, 0.0], "audiomae_on_audioset": [[["music", 22.91], ["speech", 16.23], ["sidetone", 12.95]], null, [["music", 63.29], ["speech", 9.11], ["cacophony", 7.77]], null, [["speech", 40.35], ["music", 36.74], ["smash, crash", 2.36]], null], "duration": [21.81, 0.18, 3.57, 46.58, 17.77, 0.0]} \ No newline at end of file diff --git a/annotations_filtered/0KA8Qkw3nks_filtered.json b/annotations_filtered/0KA8Qkw3nks_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/0KA8Qkw3nks_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/0KjO3YwlhEE_filtered.json b/annotations_filtered/0KjO3YwlhEE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fc5b7ac29e654cf4a5e6344e7508c932964480d --- /dev/null +++ b/annotations_filtered/0KjO3YwlhEE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.15], [11.0, 12.06], [21.0, 21.68], [24.0, 25.3], [26.0, 26.84], [31.0, 31.56], [34.0, 35.18], [36.0, 37.08], [38.0, 40.32], [42.0, 43.39], [45.0, 46.92], [51.0, 50.9], [52.0, 53.99], [55.0, 57.55], [59.0, 59.27], [60.0, 60.61], [61.0, 61.26], [63.0, 63.68], [67.0, 69.11], [70.0, 74.85], [77.0, 82.39], [85.0, 90.59], [92.0, 93.63], [96.0, 97.68], [102.0, 107.84], [110.0, 111.43], [117.0, 122.61], [126.0, 142.84], [145.0, 146.15], [149.0, 151.17], [153.0, 158.14], [160.0, 165.62], [167.0, 191.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [94.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.09, 0.0, 0.0, 0.0, 0.0, 39.82, 0.0, 0.0, 0.0, 0.0, 43.85, 33.67, 33.77, 37.23, 0.0, 0.0, 47.23, 0.0, 33.22, 34.32, 0.0, 57.97, 75.72, 93.76, 35.8], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 63.32], ["musical instrument", 4.39], ["singing", 2.72]], null, null, null, null, [["music", 65.95], ["musical instrument", 6.09], ["guitar", 4.58]], [["music", 81.9], ["humming", 4.94], ["yodeling", 4.12]], [["music", 78.22], ["carnatic music", 3.66], ["singing", 2.76]], [["music", 61.93], ["guitar", 4.95], ["musical instrument", 4.4]], null, null, [["music", 41.72], ["bass guitar", 11.96], ["guitar", 11.86]], null, [["music", 64.76], ["yodeling", 6.21], ["singing", 3.53]], [["music", 80.88], ["humming", 5.7], ["carnatic music", 2.35]], null, null, null, null, [["music", 57.39], ["speech", 7.57], ["musical instrument", 5.0]]], "duration": [7.15, 1.06, 0.68, 1.3, 0.84, 0.56, 1.18, 1.08, 2.32, 1.39, 1.92, -0.1, 1.99, 2.55, 0.27, 0.61, 0.26, 0.68, 2.11, 4.85, 5.39, 5.59, 1.63, 1.68, 5.84, 1.43, 5.61, 16.84, 1.15, 2.17, 5.14, 5.62, 24.94]} \ No newline at end of file diff --git a/annotations_filtered/0L-Zqr0eyDg_filtered.json b/annotations_filtered/0L-Zqr0eyDg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81d085e842a8580e0aa9373f4533802be3dcf265 --- /dev/null +++ b/annotations_filtered/0L-Zqr0eyDg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.49]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.49]} \ No newline at end of file diff --git a/annotations_filtered/0L1sL54G45Q_filtered.json b/annotations_filtered/0L1sL54G45Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c0788b1dd66c561087e9528c976554e22ddfa3e --- /dev/null +++ b/annotations_filtered/0L1sL54G45Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.12], [39.0, 46.55], [49.0, 124.71], [125.0, 125.74], [127.0, 127.01]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 36.89, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 54.56], ["theremin", 33.15], ["singing", 1.46]], null, null, null], "duration": [0.12, 7.55, 75.71, 0.74, 0.01]} \ No newline at end of file diff --git a/annotations_filtered/0LArIo7OUJ8_filtered.json b/annotations_filtered/0LArIo7OUJ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c77499edeeea83a13b17ac5f1212623f460cd3e --- /dev/null +++ b/annotations_filtered/0LArIo7OUJ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 29.32], [32.0, 33.47], [43.0, 44.66], [46.0, 46.47], [49.0, 51.11], [58.0, 66.68], [69.0, 72.39], [74.0, 74.85], [81.0, 82.54], [83.0, 83.07], [87.0, 91.99], [93.0, 110.67], [113.0, 116.18], [116.0, 118.17], [119.0, 119.55], [120.0, 121.73], [123.0, 150.82], [151.0, 155.33], [156.0, 156.59]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false], "silence_prob": [31.04, 0.0, 0.0, 0.0, 31.69, 30.74, 38.17, 0.0, 0.0, 0.0, 42.93, 29.62, 31.4, 28.71, 0.0, 0.0, 28.95, 30.55, 0.0], "audiomae_on_audioset": [[["music", 30.3], ["didgeridoo", 24.2], ["frog", 8.06]], null, null, null, [["didgeridoo", 61.78], ["music", 14.89], ["speech", 5.52]], [["music", 56.65], ["didgeridoo", 18.02], ["musical instrument", 4.49]], [["music", 66.86], ["didgeridoo", 14.6], ["hum", 2.23]], null, null, null, [["music", 67.28], ["didgeridoo", 8.33], ["hum", 2.14]], [["music", 38.29], ["didgeridoo", 14.36], ["speech", 7.32]], [["music", 23.12], ["foghorn", 12.47], ["didgeridoo", 8.53]], [["music", 58.06], ["theremin", 6.51], ["synthesizer", 3.88]], null, null, [["music", 89.26], ["didgeridoo", 2.28], ["musical instrument", 2.15]], [["music", 54.88], ["quack", 15.89], ["animal", 6.72]], null], "duration": [3.32, 1.47, 1.66, 0.47, 2.11, 8.68, 3.39, 0.85, 1.54, 0.07, 4.99, 17.67, 3.18, 2.17, 0.55, 1.73, 27.82, 4.33, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/0LzZVYshI7s_filtered.json b/annotations_filtered/0LzZVYshI7s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da76032f7814f8163d549d681c9b92aeb21c778a --- /dev/null +++ b/annotations_filtered/0LzZVYshI7s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.71], [16.0, 18.93], [19.0, 20.73], [22.0, 22.47], [24.0, 25.12], [26.0, 26.82], [28.0, 29.05], [31.0, 34.96], [36.0, 36.22], [41.0, 41.15], [49.0, 48.76], [54.0, 53.76], [59.0, 58.82], [67.0, 87.71], [88.0, 89.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 80.29, 0.0, 0.0, 0.0, 0.0, 0.0, 56.93, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.71, 2.93, 1.73, 0.47, 1.12, 0.82, 1.05, 3.96, 0.22, 0.15, -0.24, -0.24, -0.18, 20.71, 1.5]} \ No newline at end of file diff --git a/annotations_filtered/0MHIzgCZcxc_filtered.json b/annotations_filtered/0MHIzgCZcxc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a0b5876cd21021d0516012b831c0eb599c7dd22 --- /dev/null +++ b/annotations_filtered/0MHIzgCZcxc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.23], [13.0, 13.78], [22.0, 21.98], [28.0, 30.72], [32.0, 32.71], [35.0, 41.37], [43.0, 43.24], [51.0, 51.92], [57.0, 58.21], [60.0, 69.96], [71.0, 72.27], [73.0, 73.94], [78.0, 80.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 73.97, 0.0, 94.81, 0.0, 0.0, 0.0, 67.63, 0.0, 0.0, 64.63], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.23, 0.78, -0.02, 2.72, 0.71, 6.37, 0.24, 0.92, 1.21, 9.96, 1.27, 0.94, 2.67]} \ No newline at end of file diff --git a/annotations_filtered/0MUWDGcRCOQ_filtered.json b/annotations_filtered/0MUWDGcRCOQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebf9a2794c1286f53680857ea830450cf6e42340 --- /dev/null +++ b/annotations_filtered/0MUWDGcRCOQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.85], [2.0, 2.61], [4.0, 3.81], [5.0, 6.91], [9.0, 9.17], [17.0, 27.31], [28.0, 32.56], [33.0, 35.8], [36.0, 36.88], [38.0, 41.39], [43.0, 43.07], [44.0, 44.69], [45.0, 45.66], [46.0, 51.09], [52.0, 53.01], [54.0, 55.04], [56.0, 56.2], [57.0, 58.08], [59.0, 59.26], [60.0, 60.29], [67.0, 67.71], [68.0, 70.26], [72.0, 73.52], [74.0, 74.88], [76.0, 78.92], [80.0, 96.53], [98.0, 100.45], [101.0, 103.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 100.0, 99.36, 0.0, 99.31, 0.0, 0.0, 0.0, 98.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.35, 0.0, 0.0, 91.13, 72.31, 99.96, 99.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.85, 0.61, -0.19, 1.91, 0.17, 10.31, 4.56, 2.8, 0.88, 3.39, 0.07, 0.69, 0.66, 5.09, 1.01, 1.04, 0.2, 1.08, 0.26, 0.29, 0.71, 2.26, 1.52, 0.88, 2.92, 16.53, 2.45, 2.15]} \ No newline at end of file diff --git a/annotations_filtered/0MU_p9wU5kQ_filtered.json b/annotations_filtered/0MU_p9wU5kQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c4a5ad5655aa84e632768c892d3e6791835f54d --- /dev/null +++ b/annotations_filtered/0MU_p9wU5kQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.33], [29.0, 38.26], [41.0, 45.23], [46.0, 54.77], [56.0, 56.54], [61.0, 62.48], [64.0, 66.38], [71.0, 72.12], [82.0, 84.4], [84.0, 85.65], [90.0, 91.08], [94.0, 95.74], [103.0, 103.23], [106.0, 107.55], [111.0, 111.47], [112.0, 112.46], [113.0, 114.74], [115.0, 116.83], [118.0, 118.08], [118.0, 118.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.48, 100.0, 70.86, 0.0, 0.0, 100.0, 0.0, 99.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.33, 9.26, 4.23, 8.77, 0.54, 1.48, 2.38, 1.12, 2.4, 1.65, 1.08, 1.74, 0.23, 1.55, 0.47, 0.46, 1.74, 1.83, 0.08, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/0MoJuaS5x14_filtered.json b/annotations_filtered/0MoJuaS5x14_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..93f1a628348b1ebeed071f67173e717b57543f33 --- /dev/null +++ b/annotations_filtered/0MoJuaS5x14_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.18], [17.0, 26.7], [31.0, 32.76], [35.0, 35.21], [37.0, 41.55], [47.0, 48.52], [50.0, 51.06], [53.0, 84.96], [85.0, 86.98], [88.0, 88.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [69.07, 36.15, 0.0, 0.0, 34.48, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 58.27], ["theremin", 7.47], ["hum", 6.07]], null, null, [["music", 66.33], ["drum machine", 8.14], ["synthesizer", 6.14]], null, null, null, null, null], "duration": [3.18, 9.7, 1.76, 0.21, 4.55, 1.52, 1.06, 31.96, 1.98, 0.37]} \ No newline at end of file diff --git a/annotations_filtered/0N-cvihnyqg_filtered.json b/annotations_filtered/0N-cvihnyqg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1dbe47c26a064f6915d04f9158bf2ae9f3aa6a26 --- /dev/null +++ b/annotations_filtered/0N-cvihnyqg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.92], [6.0, 5.76], [7.0, 7.4], [11.0, 12.33], [19.0, 18.79], [21.0, 21.1], [23.0, 23.67], [29.0, 30.55], [32.0, 33.78], [35.0, 37.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.69], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 65.46], ["caw", 5.8], ["sidetone", 5.04]]], "duration": [-0.08, -0.24, 0.4, 1.33, -0.21, 0.1, 0.67, 1.55, 1.78, 2.79]} \ No newline at end of file diff --git a/annotations_filtered/0N7ilB9wX3o_filtered.json b/annotations_filtered/0N7ilB9wX3o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3a6c1b374a39a6a5fe0fdc9427c3efbc9718a80 --- /dev/null +++ b/annotations_filtered/0N7ilB9wX3o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.73], [18.0, 18.1], [31.0, 31.53], [32.0, 32.68], [43.0, 42.79], [51.0, 51.71], [69.0, 69.58], [76.0, 76.03], [85.0, 87.2], [113.0, 114.07], [116.0, 116.88], [122.0, 122.22], [127.0, 128.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.27, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 78.33], ["speech", 2.9], ["musical instrument", 1.96]], null, null, null, null], "duration": [0.73, 0.1, 0.53, 0.68, -0.21, 0.71, 0.58, 0.03, 2.2, 1.07, 0.88, 0.22, 1.51]} \ No newline at end of file diff --git a/annotations_filtered/0N9Fzv7bYCM_filtered.json b/annotations_filtered/0N9Fzv7bYCM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2849b2aa824aa75f09950d052b931a284e013d4c --- /dev/null +++ b/annotations_filtered/0N9Fzv7bYCM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.54], [16.0, 17.78], [24.0, 31.38], [33.0, 33.64], [34.0, 34.5], [38.0, 38.62], [47.0, 47.46], [52.0, 54.58], [56.0, 57.45], [60.0, 60.44], [62.0, 62.9], [66.0, 77.38], [79.0, 80.37], [81.0, 81.53], [97.0, 97.93], [102.0, 103.91], [104.0, 104.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [90.08, 0.0, 88.28, 0.0, 0.0, 0.0, 0.0, 74.6, 0.0, 0.0, 0.0, 46.97, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 44.04], ["hum", 14.4], ["music", 8.42]], null, null, null, null, null], "duration": [4.54, 1.78, 7.38, 0.64, 0.5, 0.62, 0.46, 2.58, 1.45, 0.44, 0.9, 11.38, 1.37, 0.53, 0.93, 1.91, 0.9]} \ No newline at end of file diff --git a/annotations_filtered/0NHFYpXhiiY_filtered.json b/annotations_filtered/0NHFYpXhiiY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..906d8ded1a71dea6a82e74d4d35b9c8c55040551 --- /dev/null +++ b/annotations_filtered/0NHFYpXhiiY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 20.46], [24.0, 25.83], [28.0, 45.89], [51.0, 58.51], [59.0, 68.74], [69.0, 70.75], [71.0, 71.51], [72.0, 72.57], [73.0, 72.62], [73.0, 77.82], [79.0, 80.01], [80.0, 86.0], [88.0, 92.4], [93.0, 96.06], [104.0, 114.71], [116.0, 119.2], [121.0, 123.36], [125.0, 127.53], [129.0, 153.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [31.17, 0.0, 30.92, 32.23, 72.01, 0.0, 0.0, 0.0, 0.0, 59.07, 0.0, 78.21, 39.07, 84.8, 48.87, 53.1, 93.6, 97.33, 38.36], "audiomae_on_audioset": [[["hum", 30.16], ["mains hum", 29.3], ["music", 14.98]], null, [["music", 46.06], ["hum", 15.32], ["speech", 12.95]], [["speech", 51.06], ["music", 18.07], ["thump, thud", 5.04]], null, null, null, null, null, null, null, null, [["music", 35.0], ["speech", 29.06], ["whale vocalization", 9.86]], null, [["music", 82.36], ["hum", 3.77], ["scary music", 3.52]], null, null, null, [["breaking", 22.86], ["speech", 22.17], ["music", 18.34]]], "duration": [9.46, 1.83, 17.89, 7.51, 9.74, 1.75, 0.51, 0.57, -0.38, 4.82, 1.01, 6.0, 4.4, 3.06, 10.71, 3.2, 2.36, 2.53, 24.81]} \ No newline at end of file diff --git a/annotations_filtered/0NNaypyly_o_filtered.json b/annotations_filtered/0NNaypyly_o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..447c87a47c54de35d497c27d24aac1c50efa7c9b --- /dev/null +++ b/annotations_filtered/0NNaypyly_o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.2], [16.0, 20.8], [22.0, 22.6]], "keep_status": [false, false, false], "silence_prob": [0.0, 58.55, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.2, 4.8, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/0NSgeb0dBLY_filtered.json b/annotations_filtered/0NSgeb0dBLY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..095c5ad81b1f6777f0159c550131a8fe97c0fdbf --- /dev/null +++ b/annotations_filtered/0NSgeb0dBLY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.71], [18.0, 18.3], [19.0, 21.03], [27.0, 27.77], [32.0, 34.96], [36.0, 37.12], [38.0, 39.7], [42.0, 43.19], [45.0, 45.5], [47.0, 48.17], [49.0, 51.31], [55.0, 66.58], [67.0, 71.79], [72.0, 73.68], [74.0, 75.63], [77.0, 79.27], [80.0, 80.54], [81.0, 84.21], [88.0, 101.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 68.67, 0.0, 34.39, 0.0, 0.0, 0.0, 0.0, 0.0, 58.47, 34.08, 30.88, 0.0, 0.0, 82.43, 0.0, 88.1, 35.16], "audiomae_on_audioset": [null, null, null, null, [["speech", 80.68], ["radio", 4.93], ["telephone", 3.21]], null, null, null, null, null, null, [["music", 56.49], ["electronic music", 4.39], ["sheep", 3.2]], [["speech", 34.92], ["music", 17.71], ["tuning fork", 9.9]], null, null, null, null, null, [["music", 61.35], ["electronic music", 10.68], ["drum machine", 3.32]]], "duration": [0.71, 0.3, 2.03, 0.77, 2.96, 1.12, 1.7, 1.19, 0.5, 1.17, 2.31, 11.58, 4.79, 1.68, 1.63, 2.27, 0.54, 3.21, 13.44]} \ No newline at end of file diff --git a/annotations_filtered/0NUDP-gxGyM_filtered.json b/annotations_filtered/0NUDP-gxGyM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e3d4a99da7e2b5d4ee6b9c4b470b7b2171ced1f --- /dev/null +++ b/annotations_filtered/0NUDP-gxGyM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.07], [11.0, 11.8], [13.0, 13.85], [17.0, 17.59], [20.0, 20.8], [21.0, 23.08], [26.0, 27.68], [31.0, 32.51], [33.0, 35.94], [37.0, 39.77], [42.0, 43.17], [52.0, 55.93], [59.0, 59.17], [64.0, 64.76], [67.0, 68.35], [73.0, 75.29], [76.0, 78.02], [80.0, 80.2], [87.0, 91.03], [94.0, 98.31], [99.0, 102.59], [104.0, 105.0], [105.0, 106.15], [110.0, 123.82], [124.0, 129.86], [130.0, 137.51], [141.0, 147.99], [150.0, 150.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 82.25, 0.0, 0.0, 99.94, 100.0, 0.0, 51.5, 0.0, 0.0, 0.0, 54.9, 98.59, 0.0, 99.73, 99.93, 99.99, 0.0, 0.0, 84.98, 74.13, 49.97, 44.87, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.14], ["hum", 26.47], ["throbbing", 12.16]], [["fly, housefly", 21.39], ["hum", 11.31], ["fart", 10.99]], null], "duration": [1.07, 0.8, 0.85, 0.59, 0.8, 2.08, 1.68, 1.51, 2.94, 2.77, 1.17, 3.93, 0.17, 0.76, 1.35, 2.29, 2.02, 0.2, 4.03, 4.31, 3.59, 1.0, 1.15, 13.82, 5.86, 7.51, 6.99, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/0NXkZZqCGjs_filtered.json b/annotations_filtered/0NXkZZqCGjs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..548331b3efb78a3683b671dff676417cbb1bca75 --- /dev/null +++ b/annotations_filtered/0NXkZZqCGjs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 26.82], [29.0, 29.93], [39.0, 93.7], [94.0, 102.0], [105.0, 108.24], [111.0, 121.47]], "keep_status": [true, false, false, true, true, false], "silence_prob": [35.37, 0.0, 0.0, 33.23, 33.65, 33.19], "audiomae_on_audioset": [[["speech", 25.15], ["vehicle", 16.68], ["car", 8.78]], null, null, [["speech", 41.49], ["vehicle", 8.64], ["buzz", 5.27]], [["music", 30.74], ["speech", 13.7], ["whale vocalization", 9.0]], [["music", 77.4], ["buzz", 2.7], ["didgeridoo", 2.43]]], "duration": [2.82, 0.93, 54.7, 8.0, 3.24, 10.47]} \ No newline at end of file diff --git a/annotations_filtered/0Nn_t_RfYS8_filtered.json b/annotations_filtered/0Nn_t_RfYS8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..788e0e0f9c846549e167dbb3c19f39017d78bc14 --- /dev/null +++ b/annotations_filtered/0Nn_t_RfYS8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.88], [16.0, 20.8], [25.0, 31.06], [35.0, 39.72], [42.0, 54.31], [60.0, 61.08], [70.0, 71.04], [73.0, 73.85], [75.0, 75.3], [76.0, 76.38], [78.0, 78.85], [80.0, 81.7], [84.0, 84.47], [87.0, 87.99], [88.0, 90.26], [92.0, 92.67], [93.0, 102.1], [103.0, 104.03], [104.0, 105.0], [106.0, 108.92], [110.0, 111.1], [126.0, 126.22]], "keep_status": [true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.36, 37.3, 38.7, 39.19, 64.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.67, 0.0, 96.77, 0.0, 0.0, 99.87, 0.0, 0.0], "audiomae_on_audioset": [[["music", 37.09], ["trombone", 8.22], ["speech", 7.39]], [["music", 33.68], ["trombone", 20.23], ["brass instrument", 10.64]], [["music", 57.12], ["trombone", 6.99], ["brass instrument", 5.44]], [["music", 40.01], ["foghorn", 13.72], ["trombone", 10.85]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.88, 4.8, 6.06, 4.72, 12.31, 1.08, 1.04, 0.85, 0.3, 0.38, 0.85, 1.7, 0.47, 0.99, 2.26, 0.67, 9.1, 1.03, 1.0, 2.92, 1.1, 0.22]} \ No newline at end of file diff --git a/annotations_filtered/0O5CcvLk-uE_filtered.json b/annotations_filtered/0O5CcvLk-uE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/0O5CcvLk-uE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/0OKdy3Hpzp8_filtered.json b/annotations_filtered/0OKdy3Hpzp8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b07c5eb8f84bd091a152e2fc8a58c04401ac5134 --- /dev/null +++ b/annotations_filtered/0OKdy3Hpzp8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.59], [8.0, 9.04], [11.0, 11.37], [16.0, 17.14], [18.0, 19.65], [23.0, 23.92], [26.0, 27.68], [29.0, 30.03], [34.0, 34.5], [36.0, 36.95], [39.0, 39.61], [40.0, 40.56], [41.0, 43.31], [44.0, 45.32], [46.0, 46.11], [47.0, 46.92], [49.0, 49.3], [49.0, 49.6], [53.0, 55.43], [60.0, 60.59], [61.0, 63.02], [64.0, 64.07], [64.0, 64.56], [65.0, 65.37], [67.0, 67.46], [73.0, 73.97], [77.0, 78.16], [80.0, 80.55], [81.0, 83.34], [85.0, 86.61], [90.0, 91.03], [96.0, 97.71], [102.0, 101.9], [103.0, 104.01], [107.0, 108.33], [110.0, 112.56], [114.0, 113.76], [115.0, 115.65], [121.0, 122.0], [126.0, 126.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 58.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.96, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.59, 1.04, 0.37, 1.14, 1.65, 0.92, 1.68, 1.03, 0.5, 0.95, 0.61, 0.56, 2.31, 1.32, 0.11, -0.08, 0.3, 0.6, 2.43, 0.59, 2.02, 0.07, 0.56, 0.37, 0.46, 0.97, 1.16, 0.55, 2.34, 1.61, 1.03, 1.71, -0.1, 1.01, 1.33, 2.56, -0.24, 0.65, 1.0, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/0ONU_H0EjIg_filtered.json b/annotations_filtered/0ONU_H0EjIg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d696c82284b40c4a3689233ff99d4db922c48c3 --- /dev/null +++ b/annotations_filtered/0ONU_H0EjIg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 31.62], [32.0, 35.16], [36.0, 38.91], [40.0, 40.74], [41.0, 43.7], [45.0, 48.0], [49.0, 54.67], [55.0, 56.05], [56.0, 57.03], [58.0, 59.56], [60.0, 60.74], [62.0, 62.63], [70.0, 71.04], [72.0, 73.45], [76.0, 77.04], [80.0, 81.24], [83.0, 85.21], [86.0, 88.96], [90.0, 91.94], [96.0, 97.34], [99.0, 100.4], [104.0, 105.41], [106.0, 107.76], [109.0, 117.05], [118.0, 119.82], [120.0, 123.23], [125.0, 126.79], [128.0, 130.87], [134.0, 135.3], [138.0, 139.67], [141.0, 142.03], [143.0, 147.87], [149.0, 151.07], [152.0, 156.22], [157.0, 157.62], [159.0, 161.67], [163.0, 164.25], [165.0, 169.45], [170.0, 175.15], [178.0, 181.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 87.55, 99.99, 0.0, 80.46, 80.64, 98.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.1, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 91.64, 0.0, 55.31, 0.0, 98.93, 0.0, 0.0, 0.0, 99.92, 83.16, 42.04, 0.0, 98.73, 0.0, 81.0, 90.6, 92.31], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 30.12], ["music", 23.32], ["sidetone", 14.23]], null, null, null, null, null, null], "duration": [1.62, 3.16, 2.91, 0.74, 2.7, 3.0, 5.67, 1.05, 1.03, 1.56, 0.74, 0.63, 1.04, 1.45, 1.04, 1.24, 2.21, 2.96, 1.94, 1.34, 1.4, 1.41, 1.76, 8.05, 1.82, 3.23, 1.79, 2.87, 1.3, 1.67, 1.03, 4.87, 2.07, 4.22, 0.62, 2.67, 1.25, 4.45, 5.15, 3.94]} \ No newline at end of file diff --git a/annotations_filtered/0P4h2-R9Rak_filtered.json b/annotations_filtered/0P4h2-R9Rak_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09ab90e31976e969a4e22965232690dc4743d133 --- /dev/null +++ b/annotations_filtered/0P4h2-R9Rak_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 24.85], [25.0, 32.0], [38.0, 41.44], [44.0, 45.89], [46.0, 47.73], [51.0, 52.08], [55.0, 83.35], [87.0, 91.56], [96.0, 96.6], [98.0, 101.36], [105.0, 105.29], [110.0, 110.32], [111.0, 111.47], [112.0, 112.5], [118.0, 117.95], [120.0, 120.7]], "keep_status": [true, true, true, false, false, false, true, true, false, true, false, false, false, false, false, false], "silence_prob": [30.62, 29.24, 29.84, 0.0, 0.0, 0.0, 29.37, 30.56, 0.0, 33.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 39.11], ["theremin", 14.02], ["foghorn", 8.04]], [["music", 36.37], ["musical instrument", 6.5], ["foghorn", 6.4]], [["foghorn", 34.08], ["music", 19.37], ["musical instrument", 7.34]], null, null, null, [["whack, thwack", 34.7], ["music", 20.4], ["speech", 6.59]], [["music", 18.59], ["fly, housefly", 17.68], ["mosquito", 16.54]], null, [["music", 27.19], ["throbbing", 9.12], ["speech", 8.95]], null, null, null, null, null, null], "duration": [2.85, 7.0, 3.44, 1.89, 1.73, 1.08, 28.35, 4.56, 0.6, 3.36, 0.29, 0.32, 0.47, 0.5, -0.05, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/0PCcz5_8IEI_filtered.json b/annotations_filtered/0PCcz5_8IEI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f4bf13ab4d1bc94062d7aff32abeacc87fa5673 --- /dev/null +++ b/annotations_filtered/0PCcz5_8IEI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.29], [14.0, 31.41], [31.0, 31.45], [32.0, 38.96], [42.0, 70.29], [72.0, 82.43], [83.0, 91.71], [95.0, 98.17], [99.0, 101.19], [101.0, 102.25], [106.0, 115.91], [120.0, 124.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 87.92, 0.0, 96.77, 96.42, 89.19, 68.28, 58.98, 58.38, 0.0, 54.56, 67.76], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 17.41, 0.45, 6.96, 28.29, 10.43, 8.71, 3.17, 2.19, 1.25, 9.91, 4.7]} \ No newline at end of file diff --git a/annotations_filtered/0PIbNyzb5YM_filtered.json b/annotations_filtered/0PIbNyzb5YM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..790f1374f2b54a2eb7e768258ff1d4182a5ecef3 --- /dev/null +++ b/annotations_filtered/0PIbNyzb5YM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 14.13], [15.0, 16.55], [22.0, 22.5], [24.0, 25.98], [31.0, 39.65], [53.0, 53.94], [57.0, 71.0], [72.0, 72.33], [73.0, 77.25], [81.0, 81.35], [91.0, 91.71]], "keep_status": [true, false, false, false, true, false, true, false, false, false, false], "silence_prob": [48.65, 0.0, 0.0, 0.0, 37.22, 0.0, 32.38, 0.0, 73.67, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 25.3], ["mains hum", 19.06], ["speech", 18.65]], null, null, null, [["speech", 40.53], ["hum", 17.19], ["music", 9.08]], null, [["music", 27.3], ["speech", 22.22], ["hum", 9.74]], null, null, null, null], "duration": [9.13, 1.55, 0.5, 1.98, 8.65, 0.94, 14.0, 0.33, 4.25, 0.35, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/0PdeHy_87OM_filtered.json b/annotations_filtered/0PdeHy_87OM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28ca845833d6cfa6b3e2443e83c9eacbdf47423f --- /dev/null +++ b/annotations_filtered/0PdeHy_87OM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.2], [8.0, 8.85], [9.0, 13.1], [27.0, 27.55], [29.0, 29.51], [33.0, 33.45], [60.0, 60.78], [65.0, 65.52], [66.0, 67.0], [68.0, 68.57], [69.0, 69.96], [80.0, 81.26], [95.0, 95.17], [99.0, 100.53], [103.0, 104.33], [128.0, 129.93], [138.0, 139.24], [140.0, 140.39], [145.0, 145.4], [149.0, 149.0], [149.0, 151.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [53.53, 0.0, 87.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.2, 0.85, 4.1, 0.55, 0.51, 0.45, 0.78, 0.52, 1.0, 0.57, 0.96, 1.26, 0.17, 1.53, 1.33, 1.93, 1.24, 0.39, 0.4, 0.0, 2.17]} \ No newline at end of file diff --git a/annotations_filtered/0PraJ0mNgUs_filtered.json b/annotations_filtered/0PraJ0mNgUs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0ccaabcfcd90be5e95c967519edbd2f19329e07 --- /dev/null +++ b/annotations_filtered/0PraJ0mNgUs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 48.86], [52.0, 61.96], [64.0, 65.74], [69.0, 68.67], [71.0, 72.03], [77.0, 77.92], [79.0, 80.18], [81.0, 82.09], [84.0, 85.23], [86.0, 88.82], [90.0, 93.19], [98.0, 98.15], [99.0, 107.28], [109.0, 111.64], [113.0, 116.23], [118.0, 120.18], [122.0, 130.99]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 61.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.73, 75.55, 0.0, 68.28, 50.02, 52.33, 52.68, 79.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 30.44], ["speech", 29.72], ["singing bowl", 6.25]], null, null, null, null, null, null, null], "duration": [33.86, 9.96, 1.74, -0.33, 1.03, 0.92, 1.18, 1.09, 1.23, 2.82, 3.19, 0.15, 8.28, 2.64, 3.23, 2.18, 8.99]} \ No newline at end of file diff --git a/annotations_filtered/0PtKzdvq7bc_filtered.json b/annotations_filtered/0PtKzdvq7bc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec390fe5a10d3d8fa680d2d903393f0cfad43ad2 --- /dev/null +++ b/annotations_filtered/0PtKzdvq7bc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.66], [13.0, 14.03], [16.0, 26.03], [32.0, 35.19], [37.0, 38.06], [39.0, 40.85], [42.0, 42.74], [46.0, 46.99], [48.0, 49.89], [56.0, 65.16], [66.0, 67.91], [68.0, 68.89], [69.0, 70.53], [71.0, 71.31], [72.0, 73.08], [76.0, 78.46], [79.0, 80.0], [96.0, 98.63], [100.0, 101.7], [103.0, 103.76], [110.0, 110.74], [113.0, 114.18], [119.0, 120.06], [123.0, 122.93], [129.0, 130.17], [131.0, 133.79], [135.0, 136.76], [142.0, 142.92], [151.0, 155.51], [156.0, 157.76], [160.0, 162.73], [166.0, 167.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [87.92, 0.0, 44.07, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.75, 0.0, 67.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.26, 0.0, 0.0, 29.71, 0.0, 42.69, 0.0], "audiomae_on_audioset": [null, null, [["speech", 86.64], ["animal", 2.22], ["crowd", 1.88]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 58.64], ["speech", 24.41], ["musical instrument", 4.68]], null, null, [["music", 23.59], ["whack, thwack", 6.17], ["chant", 4.64]], null, [["music", 44.18], ["didgeridoo", 23.28], ["musical instrument", 6.4]], null], "duration": [2.66, 1.03, 10.03, 3.19, 1.06, 1.85, 0.74, 0.99, 1.89, 9.16, 1.91, 0.89, 1.53, 0.31, 1.08, 2.46, 1.0, 2.63, 1.7, 0.76, 0.74, 1.18, 1.06, -0.07, 1.17, 2.79, 1.76, 0.92, 4.51, 1.76, 2.73, 1.66]} \ No newline at end of file diff --git a/annotations_filtered/0QbMWpwr7FM_filtered.json b/annotations_filtered/0QbMWpwr7FM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..127f6366040d46b64dd6c42daff25cc7885380c7 --- /dev/null +++ b/annotations_filtered/0QbMWpwr7FM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 30.4], [31.0, 32.75], [34.0, 36.85], [41.0, 44.98], [48.0, 79.34], [80.0, 80.57], [81.0, 81.65], [82.0, 111.69]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.97, 99.97, 0.0, 0.0, 0.0, 94.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [1.4, 1.75, 2.85, 3.98, 31.34, 0.57, 0.65, 29.69]} \ No newline at end of file diff --git a/annotations_filtered/0QeOXuuFo4g_filtered.json b/annotations_filtered/0QeOXuuFo4g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..daaf1de310c0d99a9c4aa74ac359a5ca0cd3877d --- /dev/null +++ b/annotations_filtered/0QeOXuuFo4g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.02], [6.0, 7.01], [8.0, 8.83], [13.0, 13.02], [20.0, 20.66], [22.0, 22.15], [23.0, 24.16], [28.0, 28.04], [29.0, 28.76], [29.0, 29.37], [33.0, 33.99], [34.0, 38.35], [40.0, 40.95], [43.0, 43.83], [48.0, 48.22], [51.0, 51.36], [72.0, 72.94], [74.0, 74.85], [75.0, 76.08], [77.0, 77.52], [79.0, 79.1], [81.0, 81.72], [83.0, 83.15], [84.0, 85.26], [86.0, 86.7], [88.0, 99.96], [101.0, 104.6], [105.0, 105.41], [108.0, 108.35], [109.0, 109.26], [113.0, 113.56], [114.0, 114.47], [117.0, 116.99], [117.0, 123.09], [123.0, 125.19], [127.0, 127.52], [128.0, 128.85], [129.0, 129.46], [131.0, 130.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [68.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 71.57, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 47.13], ["sidetone", 16.56], ["inside, small room", 9.71]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.02, 1.01, 0.83, 0.02, 0.66, 0.15, 1.16, 0.04, -0.24, 0.37, 0.99, 4.35, 0.95, 0.83, 0.22, 0.36, 0.94, 0.85, 1.08, 0.52, 0.1, 0.72, 0.15, 1.26, 0.7, 11.96, 3.6, 0.41, 0.35, 0.26, 0.56, 0.47, -0.01, 6.09, 2.19, 0.52, 0.85, 0.46, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/0Qkk8a1IVxQ_filtered.json b/annotations_filtered/0Qkk8a1IVxQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ec8a4c79ff055178b20f1cef524003f58124c66 --- /dev/null +++ b/annotations_filtered/0Qkk8a1IVxQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.41], [2.0, 10.3], [11.0, 17.78], [20.0, 24.8], [29.0, 34.92], [37.0, 43.77], [46.0, 52.71], [55.0, 60.37], [62.0, 94.04], [99.0, 102.44], [103.0, 104.99], [108.0, 113.61], [117.0, 120.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 42.39, 41.74, 34.56, 34.31, 35.18, 33.32, 32.81, 0.0, 34.53, 0.0, 32.68, 32.12], "audiomae_on_audioset": [null, [["music", 69.49], ["guitar", 6.89], ["effects unit", 5.43]], [["music", 61.74], ["effects unit", 10.74], ["guitar", 7.82]], [["music", 71.76], ["synthesizer", 3.94], ["effects unit", 3.82]], [["music", 69.37], ["effects unit", 6.11], ["guitar", 3.66]], [["music", 69.23], ["bass guitar", 6.39], ["guitar", 5.68]], [["music", 67.61], ["didgeridoo", 7.38], ["musical instrument", 3.57]], [["music", 61.74], ["guitar", 11.01], ["plucked string instrument", 6.72]], null, [["music", 75.93], ["throbbing", 2.79], ["musical instrument", 2.71]], null, [["music", 62.15], ["throbbing", 15.86], ["musical instrument", 2.14]], [["music", 40.85], ["speech", 7.23], ["throbbing", 5.44]]], "duration": [0.41, 8.3, 6.78, 4.8, 5.92, 6.77, 6.71, 5.37, 32.04, 3.44, 1.99, 5.61, 3.88]} \ No newline at end of file diff --git a/annotations_filtered/0QoGNA_9zqQ_filtered.json b/annotations_filtered/0QoGNA_9zqQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9b802c2e94564879a386fda79e2bfe9990e4f7d --- /dev/null +++ b/annotations_filtered/0QoGNA_9zqQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 34.15], [36.0, 39.02], [40.0, 55.0], [56.0, 58.21], [65.0, 65.23], [66.0, 69.74], [70.0, 71.74], [72.0, 72.86], [74.0, 74.66], [81.0, 81.85], [82.0, 84.55], [89.0, 97.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.97, 100.0, 95.51, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 97.43, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.15, 3.02, 15.0, 2.21, 0.23, 3.74, 1.74, 0.86, 0.66, 0.85, 2.55, 8.17]} \ No newline at end of file diff --git a/annotations_filtered/0REROw4SOGc_filtered.json b/annotations_filtered/0REROw4SOGc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e85d29168b1df5e76f0cfdb9a55d441184f3c498 --- /dev/null +++ b/annotations_filtered/0REROw4SOGc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.78], [4.0, 4.29], [7.0, 7.89], [9.0, 9.58], [12.0, 12.04], [13.0, 15.94], [20.0, 20.12], [29.0, 29.86], [31.0, 31.82], [32.0, 33.86], [35.0, 36.21], [39.0, 39.77], [42.0, 42.42], [45.0, 46.23], [47.0, 48.0], [49.0, 49.92], [51.0, 52.3], [55.0, 56.25], [61.0, 61.62], [65.0, 65.74], [67.0, 67.17], [68.0, 67.88], [69.0, 69.65], [70.0, 70.87], [72.0, 72.76], [74.0, 74.6], [76.0, 76.76], [78.0, 78.48], [80.0, 80.33], [82.0, 82.17], [84.0, 84.75], [85.0, 86.48], [88.0, 92.38], [93.0, 94.46], [95.0, 96.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 61.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.78, 0.29, 0.89, 0.58, 0.04, 2.94, 0.12, 0.86, 0.82, 1.86, 1.21, 0.77, 0.42, 1.23, 1.0, 0.92, 1.3, 1.25, 0.62, 0.74, 0.17, -0.12, 0.65, 0.87, 0.76, 0.6, 0.76, 0.48, 0.33, 0.17, 0.75, 1.48, 4.38, 1.46, 1.2]} \ No newline at end of file diff --git a/annotations_filtered/0RM_Ehtb5C4_filtered.json b/annotations_filtered/0RM_Ehtb5C4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b4ae52f89b49b31b36e8725202f20839d712689 --- /dev/null +++ b/annotations_filtered/0RM_Ehtb5C4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 17.14], [20.0, 23.82], [24.0, 27.09], [33.0, 33.05], [34.0, 35.92], [39.0, 42.25], [43.0, 55.51], [56.0, 56.54], [57.0, 71.19], [72.0, 72.67], [74.0, 79.1], [79.0, 80.25], [81.0, 81.3]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [41.2, 87.55, 52.1, 0.0, 0.0, 73.67, 51.18, 0.0, 51.28, 0.0, 57.48, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 34.73], ["cat", 8.14], ["animal", 7.64]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [10.14, 3.82, 3.09, 0.05, 1.92, 3.25, 12.51, 0.54, 14.19, 0.67, 5.1, 1.25, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/0ROplAtLJvo_filtered.json b/annotations_filtered/0ROplAtLJvo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4851fdceb566526e940368f83f6659de715e075c --- /dev/null +++ b/annotations_filtered/0ROplAtLJvo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.66], [10.0, 10.77], [14.0, 14.99], [19.0, 19.09], [22.0, 22.3], [26.0, 28.93], [30.0, 32.59], [35.0, 36.39], [47.0, 49.74], [53.0, 53.77], [60.0, 64.72], [67.0, 68.81], [72.0, 73.25], [75.0, 75.02], [76.0, 79.17], [81.0, 81.4], [92.0, 92.97], [96.0, 96.58], [99.0, 100.62], [102.0, 103.6], [109.0, 110.39], [113.0, 117.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [56.1, 0.0, 0.0, 0.0, 0.0, 56.7, 54.9, 0.0, 55.31, 0.0, 51.88, 0.0, 0.0, 0.0, 49.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 20.13], ["rumble", 12.35], ["sine wave", 11.02]], null, null, null, null, null, null, null], "duration": [2.66, 0.77, 0.99, 0.09, 0.3, 2.93, 2.59, 1.39, 2.74, 0.77, 4.72, 1.81, 1.25, 0.02, 3.17, 0.4, 0.97, 0.58, 1.62, 1.6, 1.39, 4.64]} \ No newline at end of file diff --git a/annotations_filtered/0RWk0XTaEX4_filtered.json b/annotations_filtered/0RWk0XTaEX4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56d9f0c5000bed1eec9b346a377cef93e0161824 --- /dev/null +++ b/annotations_filtered/0RWk0XTaEX4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.19], [5.0, 4.73], [12.0, 13.26], [15.0, 17.04], [19.0, 19.63], [21.0, 21.27], [24.0, 24.06], [31.0, 31.23], [32.0, 37.81], [39.0, 41.08], [42.0, 42.77], [44.0, 45.59], [50.0, 51.44], [56.0, 58.51], [60.0, 62.06], [63.0, 63.12], [71.0, 71.54], [74.0, 77.28], [86.0, 116.6], [117.0, 118.22], [120.0, 120.97], [124.0, 124.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 90.78, 73.06, 0.0, 0.0, 0.0, 32.49, 32.3, 0.0, 0.0, 35.43, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 17.82], ["hum", 13.14], ["music", 12.88]], [["music", 35.69], ["didgeridoo", 8.92], ["musical instrument", 7.47]], null, null, [["creak", 20.75], ["speech", 9.78], ["fly, housefly", 9.72]], null, null, null, null], "duration": [0.19, -0.27, 1.26, 2.04, 0.63, 0.27, 0.06, 0.23, 5.81, 2.08, 0.77, 1.59, 1.44, 2.51, 2.06, 0.12, 0.54, 3.28, 30.6, 1.22, 0.97, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/0Rl9Cxc7uZA_filtered.json b/annotations_filtered/0Rl9Cxc7uZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4ade3cc013b62f0eb0dfbaf8d0e7fc5ad94b249 --- /dev/null +++ b/annotations_filtered/0Rl9Cxc7uZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.79], [16.0, 18.22], [20.0, 20.63], [23.0, 25.93], [30.0, 32.09], [42.0, 43.78], [45.0, 46.6], [48.0, 51.11], [52.0, 57.47], [60.0, 61.84], [63.0, 63.63], [68.0, 68.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 75.23, 0.0, 91.81, 89.9, 0.0, 0.0, 65.2, 71.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.79, 2.22, 0.63, 2.93, 2.09, 1.78, 1.6, 3.11, 5.47, 1.84, 0.63, 0.96]} \ No newline at end of file diff --git a/annotations_filtered/0RlJNtKi_Pc_filtered.json b/annotations_filtered/0RlJNtKi_Pc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa793e3d1b1b556bc682cac3199f67e91e334027 --- /dev/null +++ b/annotations_filtered/0RlJNtKi_Pc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.8], [31.0, 32.49], [33.0, 33.47]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.8, 1.49, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/0S7olzuojGY_filtered.json b/annotations_filtered/0S7olzuojGY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d3a3a7365c423c9f775dcc50739861fd64e8fb1 --- /dev/null +++ b/annotations_filtered/0S7olzuojGY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.27], [4.0, 5.37], [14.0, 15.89], [17.0, 17.24], [20.0, 21.49], [28.0, 28.38], [32.0, 34.64], [36.0, 36.85], [40.0, 41.67], [58.0, 57.87], [59.0, 61.26], [64.0, 64.76], [66.0, 66.87], [69.0, 70.09], [71.0, 73.01], [74.0, 77.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [85.17, 0.0, 0.0, 0.0, 0.0, 0.0, 65.91, 0.0, 0.0, 0.0, 62.37, 0.0, 0.0, 0.0, 76.04, 82.43], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.27, 1.37, 1.89, 0.24, 1.49, 0.38, 2.64, 0.85, 1.67, -0.13, 2.26, 0.76, 0.87, 1.09, 2.01, 3.19]} \ No newline at end of file diff --git a/annotations_filtered/0SDvqDdbhSc_filtered.json b/annotations_filtered/0SDvqDdbhSc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90c0e8f91178346e146fec12e2e160482cacdbc6 --- /dev/null +++ b/annotations_filtered/0SDvqDdbhSc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 16.12], [17.0, 22.94], [23.0, 27.94], [29.0, 31.45], [32.0, 44.58], [47.0, 48.57], [50.0, 58.06], [59.0, 69.01], [70.0, 73.36], [75.0, 77.21], [78.0, 90.46], [93.0, 107.23], [108.0, 114.22], [114.0, 127.5], [129.0, 131.38], [132.0, 133.88], [135.0, 151.33], [152.0, 154.18], [155.0, 155.22], [157.0, 157.99], [159.0, 160.66]], "keep_status": [true, true, false, true, false, false, false, false, true, true, true, true, false, true, false, false, false, false, false, false, false], "silence_prob": [40.41, 45.85, 55.25, 30.63, 29.69, 0.0, 45.18, 29.46, 39.11, 43.61, 32.21, 39.67, 41.46, 32.17, 46.75, 0.0, 33.15, 52.27, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 12.31], ["whale vocalization", 9.22], ["sheep", 8.69]], [["buzz", 17.3], ["livestock, farm animals, working animals", 15.74], ["moo", 12.34]], null, [["hum", 22.63], ["mains hum", 22.53], ["music", 20.9]], [["music", 71.5], ["boing", 4.45], ["didgeridoo", 2.42]], null, [["hum", 41.5], ["mains hum", 20.68], ["music", 15.19]], [["hum", 41.94], ["mains hum", 31.9], ["music", 16.77]], [["music", 27.79], ["throbbing", 23.45], ["hum", 13.76]], [["music", 42.99], ["hum", 7.35], ["ambient music", 6.56]], [["music", 25.6], ["hum", 15.73], ["gong", 9.75]], [["hum", 24.52], ["music", 23.91], ["mains hum", 12.37]], [["music", 56.68], ["hum", 7.35], ["throbbing", 5.99]], [["hum", 37.41], ["mains hum", 21.29], ["music", 10.69]], [["music", 41.91], ["hum", 22.85], ["mains hum", 6.67]], null, [["music", 60.77], ["hum", 14.58], ["throbbing", 5.82]], null, null, null, null], "duration": [4.12, 5.94, 4.94, 2.45, 12.58, 1.57, 8.06, 10.01, 3.36, 2.21, 12.46, 14.23, 6.22, 13.5, 2.38, 1.88, 16.33, 2.18, 0.22, 0.99, 1.66]} \ No newline at end of file diff --git a/annotations_filtered/0SHMCN-6-IM_filtered.json b/annotations_filtered/0SHMCN-6-IM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/0SHMCN-6-IM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/0SSgv8t0QbM_filtered.json b/annotations_filtered/0SSgv8t0QbM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ecf19554498a961b7209b1bbf8f52b092ab37e3 --- /dev/null +++ b/annotations_filtered/0SSgv8t0QbM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.88], [4.0, 5.31], [6.0, 7.47], [8.0, 10.61], [12.0, 20.11], [21.0, 21.47], [22.0, 28.22], [29.0, 31.11], [36.0, 55.07], [57.0, 60.78], [64.0, 72.5], [73.0, 72.94], [75.0, 83.94], [86.0, 86.36], [87.0, 88.35], [90.0, 91.86], [93.0, 95.05], [100.0, 100.72], [104.0, 105.38], [111.0, 111.86], [114.0, 115.38], [118.0, 119.84], [127.0, 130.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 99.68, 0.0, 55.67, 72.9, 74.13, 51.34, 32.82, 0.0, 37.41, 0.0, 0.0, 0.0, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 61.67], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 27.65], ["speech", 20.72], ["didgeridoo", 14.66]], null, [["music", 58.47], ["synthesizer", 8.47], ["ambient music", 3.34]], null, null, null, null, null, null, null, null, null, null], "duration": [1.88, 1.31, 1.47, 2.61, 8.11, 0.47, 6.22, 2.11, 19.07, 3.78, 8.5, -0.06, 8.94, 0.36, 1.35, 1.86, 2.05, 0.72, 1.38, 0.86, 1.38, 1.84, 3.84]} \ No newline at end of file diff --git a/annotations_filtered/0SbVnjlPhjY_filtered.json b/annotations_filtered/0SbVnjlPhjY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c35b159e6e5f6d141041220d0076c3ae94f36ebf --- /dev/null +++ b/annotations_filtered/0SbVnjlPhjY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.32], [16.0, 17.04], [29.0, 30.79], [32.0, 33.83], [34.0, 34.91], [36.0, 36.53], [38.0, 38.97], [41.0, 41.01], [44.0, 44.66], [48.0, 48.47], [52.0, 53.22], [58.0, 58.46], [60.0, 61.08], [62.0, 61.94], [63.0, 63.22], [64.0, 65.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.32, 1.04, 1.79, 1.83, 0.91, 0.53, 0.97, 0.01, 0.66, 0.47, 1.22, 0.46, 1.08, -0.06, 0.22, 1.21]} \ No newline at end of file diff --git a/annotations_filtered/0ShWGyC408I_filtered.json b/annotations_filtered/0ShWGyC408I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7964f67870bb4ae6f59abb923c0556655634fbc --- /dev/null +++ b/annotations_filtered/0ShWGyC408I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 17.71], [18.0, 19.92], [27.0, 27.28], [28.0, 30.08], [36.0, 38.7], [47.0, 47.46], [50.0, 52.24], [58.0, 59.16], [60.0, 61.23], [63.0, 62.97], [65.0, 65.13], [67.0, 74.85], [76.0, 77.48], [81.0, 107.08], [108.0, 107.91], [111.0, 112.19], [113.0, 113.83], [114.0, 116.94], [118.0, 118.52], [119.0, 122.1], [123.0, 125.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.98, 0.0, 0.0, 99.44, 71.29, 0.0, 30.56, 0.0, 0.0, 0.0, 0.0, 30.71, 0.0, 32.93, 0.0, 0.0, 0.0, 66.63, 0.0, 99.95, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 63.93], ["music", 6.77], ["boing", 5.62]], null, null, null, null, [["speech", 79.84], ["music", 5.6], ["livestock, farm animals, working animals", 2.33]], null, [["speech", 37.44], ["groan", 33.85], ["screaming", 7.88]], null, null, null, null, null, null, null], "duration": [2.71, 1.92, 0.28, 2.08, 2.7, 0.46, 2.24, 1.16, 1.23, -0.03, 0.13, 7.85, 1.48, 26.08, -0.09, 1.19, 0.83, 2.94, 0.52, 3.1, 2.41]} \ No newline at end of file diff --git a/annotations_filtered/0SwgAb1effg_filtered.json b/annotations_filtered/0SwgAb1effg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bbe26b6008e2b181ccfb1e6607a8a7b5b62cc39e --- /dev/null +++ b/annotations_filtered/0SwgAb1effg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 26.76], [29.0, 32.7], [35.0, 36.73], [41.0, 42.67], [45.0, 46.89], [52.0, 69.96], [75.0, 92.97]], "keep_status": [true, false, false, false, false, false, false], "silence_prob": [48.87, 36.18, 0.0, 0.0, 0.0, 40.9, 32.01], "audiomae_on_audioset": [[["hum", 26.21], ["throbbing", 22.78], ["rumble", 5.57]], [["hum", 52.28], ["speech", 15.42], ["mains hum", 11.29]], null, null, null, [["music", 56.89], ["hum", 11.85], ["throbbing", 8.3]], [["music", 74.34], ["synthesizer", 3.06], ["ambient music", 2.57]]], "duration": [8.76, 3.7, 1.73, 1.67, 1.89, 17.96, 17.97]} \ No newline at end of file diff --git a/annotations_filtered/0T0QWPRBau4_filtered.json b/annotations_filtered/0T0QWPRBau4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f4f98467b6ca71ab4c53f62696c7c12f5a60124 --- /dev/null +++ b/annotations_filtered/0T0QWPRBau4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.24], [25.0, 25.41], [27.0, 60.93], [62.0, 69.01], [70.0, 71.83], [72.0, 73.36], [74.0, 75.15], [76.0, 91.66]], "keep_status": [false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.56, 0.0, 0.0, 0.0, 31.72], "audiomae_on_audioset": [null, null, null, [["music", 46.93], ["throbbing", 9.29], ["hum", 8.46]], null, null, null, [["music", 55.64], ["throbbing", 10.27], ["hum", 9.55]]], "duration": [1.24, 0.41, 33.93, 7.01, 1.83, 1.36, 1.15, 15.66]} \ No newline at end of file diff --git a/annotations_filtered/0T3hXtyuX0g_filtered.json b/annotations_filtered/0T3hXtyuX0g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfc82828b1a1544e295e8947315fa8f2eaba9c12 --- /dev/null +++ b/annotations_filtered/0T3hXtyuX0g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.79], [29.0, 29.27], [57.0, 61.25], [65.0, 65.48], [70.0, 77.26], [81.0, 81.7], [85.0, 86.97], [90.0, 93.26], [95.0, 96.01], [98.0, 98.37], [100.0, 104.55], [105.0, 104.62], [105.0, 104.7], [105.0, 104.9], [108.0, 108.09], [111.0, 111.35], [113.0, 113.71], [116.0, 118.27], [123.0, 123.01], [125.0, 125.47], [127.0, 127.99], [130.0, 130.81], [132.0, 132.46], [134.0, 134.52], [138.0, 138.3], [139.0, 139.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 50.51, 0.0, 77.03, 0.0, 0.0, 76.53, 0.0, 0.0, 37.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["hum", 26.3], ["throbbing", 13.81], ["mains hum", 11.66]], null, null, null, null, null, null, [["speech", 60.22], ["animal", 2.96], ["outside, rural or natural", 2.04]], null, null, null, null, null, null, null, null], "duration": [0.79, 0.27, 4.25, 0.48, 7.26, 0.7, 1.97, 3.26, 1.01, 0.37, 4.55, -0.38, -0.3, -0.1, 0.09, 0.35, 0.71, 2.27, 0.01, 0.47, 0.99, 0.81, 0.46, 0.52, 0.3, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/0TmugJo-c9Y_filtered.json b/annotations_filtered/0TmugJo-c9Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39532d6b33ce41586f18fa7099e73ec9a78d201e --- /dev/null +++ b/annotations_filtered/0TmugJo-c9Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.62], [18.0, 18.47], [24.0, 26.08], [30.0, 30.52], [32.0, 33.32], [37.0, 37.89], [38.0, 38.38], [39.0, 39.82], [51.0, 52.24], [62.0, 62.33], [64.0, 64.66], [67.0, 67.34], [69.0, 71.91], [76.0, 76.15], [77.0, 77.13], [82.0, 84.03], [87.0, 94.44], [95.0, 97.44], [98.0, 99.03], [112.0, 112.48], [135.0, 134.89], [138.0, 138.92], [140.0, 140.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 78.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.88, 0.0, 0.0, 44.57, 99.76, 99.8, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 64.25], ["sidetone", 8.45], ["busy signal", 8.13]], null, null, null, null, null, null, null], "duration": [1.62, 0.47, 2.08, 0.52, 1.32, 0.89, 0.38, 0.82, 1.24, 0.33, 0.66, 0.34, 2.91, 0.15, 0.13, 2.03, 7.44, 2.44, 1.03, 0.48, -0.11, 0.92, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/0Tv6PQbWvJA_filtered.json b/annotations_filtered/0Tv6PQbWvJA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8bc96bf1e213b31dd3545cf30cb557809420405 --- /dev/null +++ b/annotations_filtered/0Tv6PQbWvJA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.14], [11.0, 14.32], [24.0, 24.56], [29.0, 29.74], [31.0, 31.63], [34.0, 40.15], [40.0, 40.27], [41.0, 46.03], [48.0, 59.36], [63.0, 63.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.64, 0.0, 0.0, 0.0, 88.64, 0.0, 97.83, 78.89, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [1.14, 3.32, 0.56, 0.74, 0.63, 6.15, 0.27, 5.03, 11.36, 0.09]} \ No newline at end of file diff --git a/annotations_filtered/0TvKsVxgbF4_filtered.json b/annotations_filtered/0TvKsVxgbF4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0aa1af8e23ea62a5f9d56c61c1b6fd36dbfdab41 --- /dev/null +++ b/annotations_filtered/0TvKsVxgbF4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.36], [11.0, 12.31], [13.0, 14.23], [15.0, 20.58], [21.0, 25.39], [29.0, 35.13], [38.0, 51.39], [52.0, 60.98], [62.0, 108.63], [113.0, 114.12], [120.0, 120.88], [125.0, 126.45], [127.0, 133.25], [135.0, 136.44], [140.0, 141.94], [143.0, 144.44], [146.0, 146.8], [147.0, 149.96], [151.0, 152.83], [158.0, 158.82], [159.0, 168.22]], "keep_status": [false, false, false, true, true, true, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [32.23, 0.0, 0.0, 45.92, 28.47, 42.11, 30.86, 38.67, 0.0, 0.0, 0.0, 0.0, 32.39, 0.0, 0.0, 0.0, 0.0, 42.37, 0.0, 0.0, 38.5], "audiomae_on_audioset": [[["speech", 42.97], ["music", 33.81], ["didgeridoo", 3.75]], null, null, [["music", 57.48], ["foghorn", 4.31], ["hum", 3.57]], [["music", 42.37], ["livestock, farm animals, working animals", 7.83], ["cattle, bovinae", 6.22]], [["music", 60.32], ["didgeridoo", 4.97], ["speech", 4.56]], [["music", 59.86], ["gong", 8.89], ["electronic music", 4.22]], [["music", 41.08], ["mains hum", 17.31], ["hum", 16.98]], null, null, null, null, [["hum", 31.87], ["breaking", 14.0], ["music", 10.52]], null, null, null, null, [["music", 20.11], ["groan", 4.94], ["whale vocalization", 4.86]], null, null, [["music", 52.89], ["scary music", 34.76], ["speech", 7.86]]], "duration": [2.36, 1.31, 1.23, 5.58, 4.39, 6.13, 13.39, 8.98, 46.63, 1.12, 0.88, 1.45, 6.25, 1.44, 1.94, 1.44, 0.8, 2.96, 1.83, 0.82, 9.22]} \ No newline at end of file diff --git a/annotations_filtered/0U-kaLEaThU_filtered.json b/annotations_filtered/0U-kaLEaThU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78cc4c4443f7c73be85ec2ea9f3835e0f4f28c24 --- /dev/null +++ b/annotations_filtered/0U-kaLEaThU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 15.67], [17.0, 35.78], [37.0, 38.37], [41.0, 43.65], [48.0, 50.5], [52.0, 51.87], [53.0, 55.22], [57.0, 58.95], [60.0, 62.36], [63.0, 65.55], [69.0, 70.95], [72.0, 73.55], [75.0, 77.08], [78.0, 80.72], [82.0, 84.06], [85.0, 86.73], [87.0, 93.51], [97.0, 101.07], [104.0, 106.24], [108.0, 113.21], [115.0, 120.5], [121.0, 127.03], [129.0, 153.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.8, 100.0, 0.0, 100.0, 100.0, 0.0, 100.0, 0.0, 100.0, 99.96, 0.0, 0.0, 100.0, 100.0, 100.0, 0.0, 100.0, 100.0, 99.05, 100.0, 100.0, 100.0, 95.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [10.67, 18.78, 1.37, 2.65, 2.5, -0.13, 2.22, 1.95, 2.36, 2.55, 1.95, 1.55, 2.08, 2.72, 2.06, 1.73, 6.51, 4.07, 2.24, 5.21, 5.5, 6.03, 24.0]} \ No newline at end of file diff --git a/annotations_filtered/0UlzQ-bao3Q_filtered.json b/annotations_filtered/0UlzQ-bao3Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e81d5997b594c4c999ab8a03094ef7525f14c33f --- /dev/null +++ b/annotations_filtered/0UlzQ-bao3Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.73], [6.0, 6.89], [7.0, 8.88], [9.0, 12.11], [13.0, 14.08], [16.0, 17.14], [18.0, 18.87], [29.0, 30.35], [32.0, 33.27], [35.0, 36.05], [46.0, 45.79], [48.0, 49.44], [50.0, 50.67], [53.0, 53.77], [58.0, 61.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.52, 0.0, 0.0, 91.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.73, 0.89, 1.88, 3.11, 1.08, 1.14, 0.87, 1.35, 1.27, 1.05, -0.21, 1.44, 0.67, 0.77, 3.53]} \ No newline at end of file diff --git a/annotations_filtered/0UrClwjpNA8_filtered.json b/annotations_filtered/0UrClwjpNA8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aea36312c8e0976e553a14bfc96c4f4b98b0ca6a --- /dev/null +++ b/annotations_filtered/0UrClwjpNA8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 40.44], [41.0, 47.04], [49.0, 52.79], [58.0, 59.63], [65.0, 67.0], [69.0, 68.96], [71.0, 71.49], [74.0, 74.26], [75.0, 76.33], [81.0, 82.12], [83.0, 84.03], [88.0, 89.95], [91.0, 91.39], [93.0, 94.24], [95.0, 95.2], [97.0, 143.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 65.67, 53.91, 0.0, 59.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.44, 6.04, 3.79, 1.63, 2.0, -0.04, 0.49, 0.26, 1.33, 1.12, 1.03, 1.95, 0.39, 1.24, 0.2, 46.09]} \ No newline at end of file diff --git a/annotations_filtered/0VYvdsrV6Lw_filtered.json b/annotations_filtered/0VYvdsrV6Lw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a97d0dce54395ff040ed2a72915d3faa7f71ed3e --- /dev/null +++ b/annotations_filtered/0VYvdsrV6Lw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.51], [10.0, 10.44], [11.0, 13.0], [27.0, 27.28], [37.0, 37.61], [44.0, 50.08], [51.0, 57.23], [61.0, 61.37], [66.0, 66.95], [70.0, 71.27], [80.0, 82.17], [90.0, 117.88]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 43.25, 0.0, 0.0, 42.72, 36.43, 0.0, 0.0, 0.0, 32.52, 31.18], "audiomae_on_audioset": [null, null, [["music", 44.44], ["hum", 15.43], ["throbbing", 9.07]], null, null, [["throbbing", 42.08], ["hum", 35.3], ["mains hum", 5.26]], [["music", 36.68], ["hum", 18.7], ["throbbing", 11.64]], null, null, null, [["fly, housefly", 62.09], ["insect", 19.66], ["mosquito", 13.25]], [["grunt", 22.33], ["frog", 21.95], ["livestock, farm animals, working animals", 7.18]]], "duration": [0.51, 0.44, 2.0, 0.28, 0.61, 6.08, 6.23, 0.37, 0.95, 1.27, 2.17, 27.88]} \ No newline at end of file diff --git a/annotations_filtered/0WKopiIhAdI_filtered.json b/annotations_filtered/0WKopiIhAdI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3264ca6b89e1bdc5aff37e4db9e966a6b14d50f --- /dev/null +++ b/annotations_filtered/0WKopiIhAdI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.76], [6.0, 6.0], [6.0, 11.84], [13.0, 13.91], [25.0, 26.64], [38.0, 42.18], [45.0, 45.4], [46.0, 45.64], [46.0, 52.95], [53.0, 54.16], [55.0, 65.25], [67.0, 70.56], [74.0, 74.71], [75.0, 78.85], [79.0, 80.2], [87.0, 94.17], [110.0, 111.05], [112.0, 112.16], [114.0, 113.98], [114.0, 114.54], [118.0, 126.15], [127.0, 129.46], [132.0, 131.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 38.71, 0.0, 0.0, 32.93, 0.0, 0.0, 30.01, 0.0, 30.4, 32.28, 0.0, 30.56, 0.0, 33.7, 0.0, 0.0, 0.0, 0.0, 47.86, 30.55, 0.0], "audiomae_on_audioset": [null, null, [["speech", 36.51], ["hum", 27.89], ["mains hum", 13.02]], null, null, [["music", 74.8], ["electronic music", 9.66], ["throbbing", 2.91]], null, null, [["music", 79.95], ["sound effect", 2.95], ["boing", 1.86]], null, [["throbbing", 31.05], ["music", 27.65], ["hum", 13.26]], [["music", 58.81], ["speech", 10.24], ["electronic music", 6.58]], null, [["music", 51.76], ["throbbing", 16.55], ["hum", 7.73]], null, [["speech", 41.48], ["music", 32.14], ["echo", 5.16]], null, null, null, null, [["music", 61.83], ["whale vocalization", 6.5], ["squish", 6.37]], [["livestock, farm animals, working animals", 17.89], ["cattle, bovinae", 15.07], ["cowbell", 12.26]], null], "duration": [0.76, 0.0, 5.84, 0.91, 1.64, 4.18, 0.4, -0.36, 6.95, 1.16, 10.25, 3.56, 0.71, 3.85, 1.2, 7.17, 1.05, 0.16, -0.02, 0.54, 8.15, 2.46, -0.28]} \ No newline at end of file diff --git a/annotations_filtered/0WOnDEx4QLc_filtered.json b/annotations_filtered/0WOnDEx4QLc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7a29c586c26a1fb2f81b6941f3bb492f2eb5d4c --- /dev/null +++ b/annotations_filtered/0WOnDEx4QLc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.22], [5.0, 6.27], [7.0, 10.66], [16.0, 16.14], [21.0, 21.56], [28.0, 28.48], [32.0, 32.64], [33.0, 35.73], [38.0, 43.16], [45.0, 45.44], [50.0, 54.26], [57.0, 57.23], [61.0, 66.31], [66.0, 68.18], [74.0, 74.49], [76.0, 76.35], [84.0, 84.64], [85.0, 86.16], [88.0, 88.21], [88.0, 100.45], [101.0, 111.47], [113.0, 116.21], [119.0, 122.12], [125.0, 125.36], [127.0, 127.45], [128.0, 128.01]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, true, true, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 42.76, 0.0, 0.0, 0.0, 0.0, 42.39, 40.4, 0.0, 36.88, 0.0, 32.49, 32.71, 0.0, 0.0, 0.0, 0.0, 0.0, 33.81, 32.91, 32.55, 97.33, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 59.43], ["musical instrument", 7.6], ["guitar", 3.26]], null, null, null, null, [["speech", 25.44], ["music", 18.71], ["foghorn", 9.96]], [["music", 56.15], ["didgeridoo", 11.3], ["bouncing", 5.07]], null, [["music", 42.59], ["coin (dropping)", 9.58], ["thunk", 9.16]], null, [["didgeridoo", 36.62], ["music", 25.31], ["typewriter", 5.57]], [["music", 49.88], ["didgeridoo", 7.19], ["musical instrument", 5.38]], null, null, null, null, null, [["speech", 34.72], ["music", 31.53], ["brass instrument", 5.42]], [["music", 25.01], ["speech", 20.76], ["didgeridoo", 16.81]], [["clang", 20.53], ["music", 14.94], ["ding", 14.93]], null, null, null, null], "duration": [0.22, 1.27, 3.66, 0.14, 0.56, 0.48, 0.64, 2.73, 5.16, 0.44, 4.26, 0.23, 5.31, 2.18, 0.49, 0.35, 0.64, 1.16, 0.21, 12.45, 10.47, 3.21, 3.12, 0.36, 0.45, 0.01]} \ No newline at end of file diff --git a/annotations_filtered/0WRtWiz_Xvg_filtered.json b/annotations_filtered/0WRtWiz_Xvg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cbdb43983e14c0d24fc9997be89e3d68a75261c --- /dev/null +++ b/annotations_filtered/0WRtWiz_Xvg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 13.58], [27.0, 27.87], [33.0, 48.93], [50.0, 54.33], [55.0, 56.42], [61.0, 61.28], [65.0, 65.82], [68.0, 70.56], [71.0, 72.42], [79.0, 80.45], [90.0, 90.96], [92.0, 93.14], [94.0, 94.26], [97.0, 103.2], [104.0, 104.08], [107.0, 110.66], [113.0, 117.78], [122.0, 123.89], [124.0, 125.22], [126.0, 136.22], [138.0, 140.12], [142.0, 153.6], [155.0, 166.65], [171.0, 194.53], [196.0, 196.5]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false, false, false], "silence_prob": [39.43, 0.0, 51.99, 49.97, 0.0, 0.0, 0.0, 82.79, 0.0, 0.0, 0.0, 0.0, 0.0, 68.54, 0.0, 37.93, 44.6, 0.0, 0.0, 61.77, 76.86, 44.01, 54.3, 41.93, 0.0], "audiomae_on_audioset": [[["speech", 60.84], ["hum", 18.37], ["mains hum", 2.62]], null, null, [["speech", 38.97], ["music", 25.37], ["fart", 5.07]], null, null, null, null, null, null, null, null, null, null, null, [["music", 61.39], ["musical instrument", 4.02], ["breaking", 3.37]], [["music", 35.83], ["theremin", 13.87], ["speech", 7.33]], null, null, null, null, [["music", 55.01], ["speech", 4.75], ["didgeridoo", 3.7]], null, [["music", 68.26], ["didgeridoo", 8.83], ["theremin", 3.88]], null], "duration": [8.58, 0.87, 15.93, 4.33, 1.42, 0.28, 0.82, 2.56, 1.42, 1.45, 0.96, 1.14, 0.26, 6.2, 0.08, 3.66, 4.78, 1.89, 1.22, 10.22, 2.12, 11.6, 11.65, 23.53, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/0WoyXBXCqdg_filtered.json b/annotations_filtered/0WoyXBXCqdg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df2a2ba035bfaab707cfbd6f022567e902f19075 --- /dev/null +++ b/annotations_filtered/0WoyXBXCqdg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.41], [3.0, 3.55], [7.0, 9.9], [10.0, 10.17], [13.0, 18.82], [21.0, 20.98], [22.0, 22.79], [26.0, 27.23], [33.0, 34.13], [37.0, 37.67], [43.0, 42.94], [49.0, 49.01], [51.0, 51.21], [57.0, 57.52], [62.0, 62.51], [64.0, 63.86], [66.0, 67.12], [80.0, 80.64], [94.0, 94.53], [95.0, 96.42], [99.0, 99.12], [100.0, 102.3], [104.0, 104.5], [126.0, 128.93], [130.0, 131.06], [132.0, 136.11], [139.0, 138.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.98, 0.0, 97.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.76, 0.0, 35.5, 0.0, 65.2, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["breaking", 51.08], ["glass", 30.33], ["music", 13.52]], null, null, null], "duration": [0.41, 0.55, 2.9, 0.17, 5.82, -0.02, 0.79, 1.23, 1.13, 0.67, -0.06, 0.01, 0.21, 0.52, 0.51, -0.14, 1.12, 0.64, 0.53, 1.42, 0.12, 2.3, 0.5, 2.93, 1.06, 4.11, -0.31]} \ No newline at end of file diff --git a/annotations_filtered/0Wt72bHrHFo_filtered.json b/annotations_filtered/0Wt72bHrHFo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..deb43529a226e93c2c7e49311774f705c72cba1a --- /dev/null +++ b/annotations_filtered/0Wt72bHrHFo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 37.72], [47.0, 60.44], [63.0, 63.63], [66.0, 70.48], [79.0, 79.52], [81.0, 91.77], [95.0, 116.48], [119.0, 120.01], [124.0, 127.92], [130.0, 142.25], [145.0, 155.33]], "keep_status": [false, true, false, true, false, false, true, false, false, true, true], "silence_prob": [0.0, 30.22, 0.0, 29.91, 0.0, 30.26, 29.91, 0.0, 31.03, 30.45, 30.43], "audiomae_on_audioset": [null, [["buzz", 30.47], ["speech", 7.07], ["whack, thwack", 6.63]], null, [["speech", 34.28], ["vehicle", 12.03], ["whale vocalization", 7.23]], null, [["music", 42.24], ["speech", 21.44], ["vehicle", 6.96]], [["speech", 33.23], ["music", 20.86], ["vehicle", 9.14]], null, [["mains hum", 49.68], ["hum", 23.25], ["throbbing", 4.37]], [["music", 40.49], ["speech", 18.55], ["hum", 7.74]], [["speech", 26.16], ["music", 22.64], ["whack, thwack", 8.78]]], "duration": [31.72, 13.44, 0.63, 4.48, 0.52, 10.77, 21.48, 1.01, 3.92, 12.25, 10.33]} \ No newline at end of file diff --git a/annotations_filtered/0WtDmbr9xyY_filtered.json b/annotations_filtered/0WtDmbr9xyY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc8f9f6a32fc7a89a52da3a5a64f83bd415b68ce --- /dev/null +++ b/annotations_filtered/0WtDmbr9xyY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[64.0, 64.96], [70.0, 72.64], [76.0, 76.35], [77.0, 83.39], [87.0, 87.66], [88.0, 89.19], [90.0, 90.75], [92.0, 92.21], [93.0, 93.78], [94.0, 95.23], [96.0, 96.69], [97.0, 98.09], [99.0, 99.52], [100.0, 101.07], [102.0, 102.68], [103.0, 104.21], [105.0, 104.67], [105.0, 104.7]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.86, 0.0, 31.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 40.1], ["quack", 7.13], ["music", 3.13]], null, [["fly, housefly", 51.71], ["insect", 24.01], ["bee, wasp, etc.", 7.74]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.96, 2.64, 0.35, 6.39, 0.66, 1.19, 0.75, 0.21, 0.78, 1.23, 0.69, 1.09, 0.52, 1.07, 0.68, 1.21, -0.33, -0.3]} \ No newline at end of file diff --git a/annotations_filtered/0WuMU0zi02w_filtered.json b/annotations_filtered/0WuMU0zi02w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bdb9cbc7c60ddbb8d55423464b999d26a3df57d3 --- /dev/null +++ b/annotations_filtered/0WuMU0zi02w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 49.86], [53.0, 71.95], [73.0, 82.59], [84.0, 95.96], [99.0, 102.05], [105.0, 107.16]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 64.52, 96.29, 34.83, 86.27, 57.25], "audiomae_on_audioset": [null, null, null, [["speech", 38.85], ["whack, thwack", 10.98], ["thunk", 10.68]], null, null], "duration": [35.86, 18.95, 9.59, 11.96, 3.05, 2.16]} \ No newline at end of file diff --git a/annotations_filtered/0XCqc9fIGJ0_filtered.json b/annotations_filtered/0XCqc9fIGJ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9359d3055897aa30bd7211523fdeaf2582263db5 --- /dev/null +++ b/annotations_filtered/0XCqc9fIGJ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.93], [18.0, 18.2], [18.0, 18.27], [18.0, 18.72], [20.0, 36.91], [38.0, 38.77], [85.0, 85.78], [87.0, 88.79], [94.0, 94.83], [95.0, 96.53], [98.0, 98.69], [100.0, 100.82], [102.0, 102.73], [104.0, 103.99], [104.0, 104.14], [105.0, 105.97], [107.0, 108.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 51.51], ["music", 24.57], ["speech", 12.68]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.93, 0.2, 0.27, 0.72, 16.91, 0.77, 0.78, 1.79, 0.83, 1.53, 0.69, 0.82, 0.73, -0.01, 0.14, 0.97, 1.8]} \ No newline at end of file diff --git a/annotations_filtered/0XLEGFSKVhs_filtered.json b/annotations_filtered/0XLEGFSKVhs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04b12fc737f14afbe25e5b0dc9ba16e0d7e746ee --- /dev/null +++ b/annotations_filtered/0XLEGFSKVhs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 12.29], [13.0, 15.63], [16.0, 19.62], [26.0, 50.82], [53.0, 81.19], [81.0, 85.04]], "keep_status": [false, true, false, true, false, true], "silence_prob": [38.11, 36.31, 70.44, 28.94, 29.19, 37.78], "audiomae_on_audioset": [[["mains hum", 27.06], ["hum", 23.23], ["throbbing", 22.2]], [["music", 44.61], ["synthesizer", 11.21], ["musical instrument", 7.24]], null, [["music", 52.28], ["synthesizer", 8.78], ["electronic music", 6.38]], [["music", 91.29], ["drip", 2.47], ["liquid", 1.0]], [["speech", 30.52], ["frog", 12.5], ["croak", 8.13]]], "duration": [6.29, 2.63, 3.62, 24.82, 28.19, 4.04]} \ No newline at end of file diff --git a/annotations_filtered/0XesK2hB_Wk_filtered.json b/annotations_filtered/0XesK2hB_Wk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d503ffbc9a0666aa443d76dd6c366a46f8e3ba4 --- /dev/null +++ b/annotations_filtered/0XesK2hB_Wk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.96], [38.0, 37.71], [40.0, 39.78], [47.0, 47.56], [51.0, 51.88], [56.0, 57.42], [59.0, 66.09], [69.0, 79.59], [82.0, 82.49], [85.0, 86.24], [88.0, 88.89], [90.0, 91.47], [96.0, 96.5], [98.0, 98.37], [99.0, 100.77], [102.0, 102.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 93.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.04, -0.29, -0.22, 0.56, 0.88, 1.42, 7.09, 10.59, 0.49, 1.24, 0.89, 1.47, 0.5, 0.37, 1.77, 0.22]} \ No newline at end of file diff --git a/annotations_filtered/0XjLzDVi03c_filtered.json b/annotations_filtered/0XjLzDVi03c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a85efcd7b7fba8ee6dede3cb31d71aed2df0b1d --- /dev/null +++ b/annotations_filtered/0XjLzDVi03c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 18.45], [19.0, 18.52], [19.0, 21.07], [22.0, 35.88], [38.0, 50.94], [52.0, 53.97], [55.0, 56.57], [59.0, 60.1], [63.0, 65.15], [67.0, 69.63], [73.0, 75.1], [78.0, 98.47], [100.0, 107.3], [109.0, 114.49], [116.0, 118.89], [119.0, 121.76], [123.0, 125.19]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [58.64, 0.0, 49.09, 35.83, 35.48, 0.0, 0.0, 0.0, 78.04, 64.52, 68.54, 49.87, 50.21, 94.95, 94.22, 98.99, 99.87], "audiomae_on_audioset": [null, null, [["music", 75.24], ["didgeridoo", 3.66], ["musical instrument", 2.7]], [["music", 52.14], ["musical instrument", 3.84], ["hum", 3.49]], [["music", 67.42], ["theremin", 5.37], ["hum", 5.0]], null, null, null, null, null, null, [["music", 63.89], ["theremin", 21.12], ["ambient music", 4.06]], null, null, null, null, null], "duration": [16.45, -0.48, 2.07, 13.88, 12.94, 1.97, 1.57, 1.1, 2.15, 2.63, 2.1, 20.47, 7.3, 5.49, 2.89, 2.76, 2.19]} \ No newline at end of file diff --git a/annotations_filtered/0XzQX-i3y_I_filtered.json b/annotations_filtered/0XzQX-i3y_I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba79ca7c65aaf0a670eecb6bbfca5ce9838058ce --- /dev/null +++ b/annotations_filtered/0XzQX-i3y_I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.48], [6.0, 7.84], [8.0, 10.2], [11.0, 11.53], [13.0, 14.07], [15.0, 17.59], [18.0, 18.62], [20.0, 37.34], [38.0, 40.53], [41.0, 43.85], [44.0, 49.99], [51.0, 52.05], [53.0, 53.59], [55.0, 55.85], [56.0, 58.08], [59.0, 59.9], [61.0, 61.42], [62.0, 68.05], [70.0, 70.21], [74.0, 74.71], [75.0, 76.0], [78.0, 78.73], [80.0, 80.43], [84.0, 83.96], [86.0, 86.24], [87.0, 89.9], [100.0, 100.03], [101.0, 101.92], [103.0, 103.96], [105.0, 105.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.96, 0.0, 0.0, 100.0, 0.0, 36.31, 68.02, 99.73, 61.37, 0.0, 0.0, 0.0, 57.25, 0.0, 0.0, 99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.36, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 65.14], ["trombone", 10.16], ["brass instrument", 10.07]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 1.84, 2.2, 0.53, 1.07, 2.59, 0.62, 17.34, 2.53, 2.85, 5.99, 1.05, 0.59, 0.85, 2.08, 0.9, 0.42, 6.05, 0.21, 0.71, 1.0, 0.73, 0.43, -0.04, 0.24, 2.9, 0.03, 0.92, 0.96, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/0YDejqKggWA_filtered.json b/annotations_filtered/0YDejqKggWA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12acef15741e1880e70f67dec89aea0f7b4ca91f --- /dev/null +++ b/annotations_filtered/0YDejqKggWA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.14], [5.0, 5.85], [7.0, 7.91], [8.0, 10.25], [11.0, 15.5], [17.0, 17.22], [19.0, 21.14], [22.0, 23.23], [27.0, 27.53], [29.0, 30.54], [31.0, 32.58], [34.0, 37.62], [44.0, 45.93], [47.0, 48.32], [52.0, 52.59], [54.0, 59.53], [61.0, 65.47], [66.0, 67.71], [71.0, 72.35], [74.0, 76.33], [77.0, 79.24], [83.0, 91.64], [92.0, 94.78], [98.0, 99.82], [102.0, 103.76], [104.0, 105.61], [109.0, 110.25], [111.0, 111.99], [112.0, 136.93], [138.0, 141.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 83.52, 90.95, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 99.99, 100.0, 0.0, 0.0, 100.0, 94.37, 99.93, 89.72, 0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.14, 0.85, 0.91, 2.25, 4.5, 0.22, 2.14, 1.23, 0.53, 1.54, 1.58, 3.62, 1.93, 1.32, 0.59, 5.53, 4.47, 1.71, 1.35, 2.33, 2.24, 8.64, 2.78, 1.82, 1.76, 1.61, 1.25, 0.99, 24.93, 3.91]} \ No newline at end of file diff --git a/annotations_filtered/0YOmyGX2kmQ_filtered.json b/annotations_filtered/0YOmyGX2kmQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67d6485afca5d140db0bbed9ab6c785af53d3d29 --- /dev/null +++ b/annotations_filtered/0YOmyGX2kmQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.33], [9.0, 13.19], [14.0, 17.66], [18.0, 18.22], [19.0, 24.0], [25.0, 33.24], [34.0, 34.87], [35.0, 36.19], [38.0, 50.04], [54.0, 55.97], [57.0, 64.0], [66.0, 66.02]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 50.16, 40.28, 0.0, 86.82, 89.01, 0.0, 0.0, 36.42, 0.0, 35.82, 0.0], "audiomae_on_audioset": [null, null, [["speech", 21.15], ["goose", 13.67], ["fowl", 12.77]], null, null, null, null, null, [["music", 51.04], ["speech", 18.95], ["animal", 4.44]], null, [["music", 28.39], ["speech", 19.02], ["foghorn", 6.53]], null], "duration": [1.33, 4.19, 3.66, 0.22, 5.0, 8.24, 0.87, 1.19, 12.04, 1.97, 7.0, 0.02]} \ No newline at end of file diff --git a/annotations_filtered/0YzsWVUO-_o_filtered.json b/annotations_filtered/0YzsWVUO-_o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f47fd68c646473c35649d51ac46edf0a1a2d2c39 --- /dev/null +++ b/annotations_filtered/0YzsWVUO-_o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[99.0, 101.75]], "keep_status": [true], "silence_prob": [45.11], "audiomae_on_audioset": [[["music", 33.66], ["speech", 14.64], ["brass instrument", 8.51]]], "duration": [2.75]} \ No newline at end of file diff --git a/annotations_filtered/0Z286w5pRSo_filtered.json b/annotations_filtered/0Z286w5pRSo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f7084c1640da17e11c0b51f916299a1b28e0722 --- /dev/null +++ b/annotations_filtered/0Z286w5pRSo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.05], [5.0, 7.15], [9.0, 10.17], [13.0, 14.91], [16.0, 17.44], [22.0, 25.89], [32.0, 32.34], [34.0, 35.06], [38.0, 39.04], [42.0, 42.85], [46.0, 46.65], [47.0, 48.22], [50.0, 50.13], [52.0, 53.18], [55.0, 57.35], [59.0, 61.28]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.44, 96.04, 0.0, 0.0, 0.0, 49.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.9, 99.97], "audiomae_on_audioset": [[["sidetone", 50.5], ["guitar", 5.66], ["effects unit", 5.52]], null, null, null, null, [["sine wave", 32.51], ["speech", 19.6], ["dial tone", 18.38]], null, null, null, null, null, null, null, null, null, null], "duration": [2.05, 2.15, 1.17, 1.91, 1.44, 3.89, 0.34, 1.06, 1.04, 0.85, 0.65, 1.22, 0.13, 1.18, 2.35, 2.28]} \ No newline at end of file diff --git a/annotations_filtered/0ZQln6DsWgE_filtered.json b/annotations_filtered/0ZQln6DsWgE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f42d7cea83b1486f109a16f61623b7bbda7165a --- /dev/null +++ b/annotations_filtered/0ZQln6DsWgE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.37], [11.0, 19.6], [20.0, 20.28], [21.0, 21.14], [27.0, 28.29], [28.0, 37.81], [38.0, 37.88], [38.0, 43.58], [45.0, 46.6], [48.0, 48.46], [51.0, 52.32], [54.0, 58.33], [68.0, 68.89], [71.0, 72.13], [74.0, 75.24], [77.0, 77.63], [80.0, 81.28], [82.0, 83.02], [89.0, 90.0], [90.0, 90.51], [93.0, 93.02], [99.0, 99.69], [102.0, 102.36], [105.0, 109.31], [110.0, 111.11], [114.0, 115.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [90.08, 100.0, 0.0, 0.0, 0.0, 99.36, 0.0, 99.93, 0.0, 0.0, 0.0, 99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.2, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.37, 8.6, 0.28, 0.14, 1.29, 9.81, -0.12, 5.58, 1.6, 0.46, 1.32, 4.33, 0.89, 1.13, 1.24, 0.63, 1.28, 1.02, 1.0, 0.51, 0.02, 0.69, 0.36, 4.31, 1.11, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/0ZzNlA9uZ0g_filtered.json b/annotations_filtered/0ZzNlA9uZ0g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42741dd17a0ad522c6ebd74bdeb973cd3308252e --- /dev/null +++ b/annotations_filtered/0ZzNlA9uZ0g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 10.57], [11.0, 19.21], [21.0, 24.02], [24.0, 25.54], [27.0, 27.58], [28.0, 28.31], [28.0, 29.96], [31.0, 38.77], [41.0, 45.59], [46.0, 48.02], [49.0, 53.0], [54.0, 57.3], [58.0, 58.77], [59.0, 59.71], [62.0, 63.32], [64.0, 82.24], [83.0, 84.13], [85.0, 87.71], [95.0, 96.82], [97.0, 98.91], [102.0, 102.25], [104.0, 105.22], [106.0, 112.4], [113.0, 115.86], [118.0, 125.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [98.51, 89.54, 99.98, 0.0, 0.0, 0.0, 0.0, 99.73, 94.22, 77.53, 49.22, 94.52, 0.0, 0.0, 0.0, 95.23, 0.0, 28.87, 0.0, 0.0, 0.0, 0.0, 33.76, 35.88, 38.16], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 38.41], ["sine wave", 38.03], ["dial tone", 7.13]], null, null, null, null, null, null, [["siren", 37.7], ["emergency vehicle", 21.03], ["police car (siren)", 11.51]], null, null, null, null, [["siren", 36.1], ["civil defense siren", 13.56], ["speech", 11.35]], [["frog", 36.13], ["siren", 15.41], ["civil defense siren", 7.93]], [["siren", 28.99], ["civil defense siren", 11.03], ["police car (siren)", 7.29]]], "duration": [9.57, 8.21, 3.02, 1.54, 0.58, 0.31, 1.96, 7.77, 4.59, 2.02, 4.0, 3.3, 0.77, 0.71, 1.32, 18.24, 1.13, 2.71, 1.82, 1.91, 0.25, 1.22, 6.4, 2.86, 7.73]} \ No newline at end of file diff --git a/annotations_filtered/0_-45EGFtA4_filtered.json b/annotations_filtered/0_-45EGFtA4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f94911116513406f4155d2c86ed837bcf96c8c90 --- /dev/null +++ b/annotations_filtered/0_-45EGFtA4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.69]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [1.69]} \ No newline at end of file diff --git a/annotations_filtered/0_0U4bhe6ag_filtered.json b/annotations_filtered/0_0U4bhe6ag_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0e6660e727674d230b0cdfdecc1e9848fc6fd62 --- /dev/null +++ b/annotations_filtered/0_0U4bhe6ag_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.89], [10.0, 10.05], [18.0, 22.33], [28.0, 28.65], [39.0, 39.93], [50.0, 50.63], [57.0, 58.48], [61.0, 61.67], [65.0, 66.28], [67.0, 67.47], [68.0, 68.67], [82.0, 84.2], [84.0, 87.64], [91.0, 93.28], [96.0, 105.29], [109.0, 110.84], [112.0, 112.31], [115.0, 115.5], [116.0, 116.95]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 43.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.13, 35.5, 35.82, 32.52, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 54.91], ["effects unit", 4.16], ["musical instrument", 4.15]], null, null, null, null, null, null, null, null, [["whale vocalization", 32.63], ["speech", 13.33], ["music", 8.35]], [["music", 41.71], ["speech", 13.18], ["hum", 5.93]], [["music", 62.4], ["whale vocalization", 13.46], ["hum", 4.67]], [["speech", 23.5], ["music", 18.17], ["hum", 2.6]], null, null, null, null], "duration": [-0.11, 0.05, 4.33, 0.65, 0.93, 0.63, 1.48, 0.67, 1.28, 0.47, 0.67, 2.2, 3.64, 2.28, 9.29, 1.84, 0.31, 0.5, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/0_1NU60qHWs_filtered.json b/annotations_filtered/0_1NU60qHWs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09414d554151477b07e0766d142aa78c142caf4c --- /dev/null +++ b/annotations_filtered/0_1NU60qHWs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.07], [13.0, 13.24], [14.0, 14.01], [18.0, 17.61], [18.0, 23.06], [29.0, 28.88], [30.0, 30.21], [46.0, 47.76], [51.0, 51.68], [54.0, 54.62], [56.0, 60.51], [65.0, 65.31], [65.0, 66.14], [66.0, 66.28], [66.0, 66.43], [71.0, 72.06], [78.0, 78.66], [81.0, 80.81], [84.0, 84.25], [85.0, 85.45], [88.0, 87.76], [91.0, 93.07], [95.0, 98.44], [107.0, 111.54], [125.0, 126.55], [127.0, 129.3], [132.0, 132.09], [142.0, 143.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 51.44, 0.0, 0.0, 0.0, 0.0, 0.0, 62.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.13, 53.28, 45.24, 0.0, 71.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 67.28], ["marimba, xylophone", 6.22], ["glockenspiel", 3.12]], null, [["speech", 33.35], ["music", 27.8], ["boing", 6.41]], null, null, null, null], "duration": [1.07, 0.24, 0.01, -0.39, 5.06, -0.12, 0.21, 1.76, 0.68, 0.62, 4.51, 0.31, 1.14, 0.28, 0.43, 1.06, 0.66, -0.19, 0.25, 0.45, -0.24, 2.07, 3.44, 4.54, 1.55, 2.3, 0.09, 1.09]} \ No newline at end of file diff --git a/annotations_filtered/0_7vIOvdKqY_filtered.json b/annotations_filtered/0_7vIOvdKqY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..726a259a3cd7d61fa98d3587186673eb550c720c --- /dev/null +++ b/annotations_filtered/0_7vIOvdKqY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.42], [4.0, 13.85], [14.0, 19.48], [34.0, 35.01], [35.0, 36.86], [39.0, 39.58], [42.0, 43.34], [44.0, 45.35], [46.0, 49.4], [50.0, 58.51], [60.0, 60.2], [63.0, 64.25], [66.0, 67.36], [71.0, 72.55], [76.0, 76.45], [79.0, 81.85], [84.0, 85.09], [86.0, 86.78], [91.0, 95.17], [97.0, 98.05], [100.0, 100.09], [101.0, 104.18], [105.0, 107.33], [109.0, 110.49], [113.0, 115.11], [116.0, 117.12], [122.0, 123.4], [124.0, 123.9], [124.0, 124.34], [127.0, 129.37], [130.0, 129.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.26, 38.21, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 99.56, 0.0, 0.0, 99.65, 99.48, 0.0, 99.8, 0.0, 0.0, 0.0, 0.0, 98.36, 0.0], "audiomae_on_audioset": [null, [["speech", 92.2], ["sidetone", 2.74], ["whale vocalization", 1.23]], [["speech", 80.91], ["fart", 6.56], ["beatboxing", 5.44]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.42, 9.85, 5.48, 1.01, 1.86, 0.58, 1.34, 1.35, 3.4, 8.51, 0.2, 1.25, 1.36, 1.55, 0.45, 2.85, 1.09, 0.78, 4.17, 1.05, 0.09, 3.18, 2.33, 1.49, 2.11, 1.12, 1.4, -0.1, 0.34, 2.37, -0.12]} \ No newline at end of file diff --git a/annotations_filtered/0_ArO8UCfyk_filtered.json b/annotations_filtered/0_ArO8UCfyk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c812a6e7f096a9f1f51f608a91d998cc7615dc73 --- /dev/null +++ b/annotations_filtered/0_ArO8UCfyk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [4.0, 4.68], [8.0, 8.78], [11.0, 13.73], [17.0, 17.2], [21.0, 21.36], [23.0, 24.26], [26.0, 25.66], [26.0, 27.19], [32.0, 35.67], [39.0, 40.09], [41.0, 42.85], [53.0, 53.76], [59.0, 60.59], [62.0, 62.92], [68.0, 68.99], [70.0, 71.32], [72.0, 75.95], [77.0, 77.5], [79.0, 80.05], [81.0, 96.48], [97.0, 98.37], [101.0, 101.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 76.04, 0.0, 0.0, 0.0, 0.0, 0.0, 69.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 51.07, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 0.68, 0.78, 2.73, 0.2, 0.36, 1.26, -0.34, 1.19, 3.67, 1.09, 1.85, 0.76, 1.59, 0.92, 0.99, 1.32, 3.95, 0.5, 1.05, 15.48, 1.37, 0.21]} \ No newline at end of file diff --git a/annotations_filtered/0_UCPY-mSZU_filtered.json b/annotations_filtered/0_UCPY-mSZU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebf63341e69d780fbddf205105988a4297c2fb85 --- /dev/null +++ b/annotations_filtered/0_UCPY-mSZU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.21], [25.0, 26.84], [28.0, 29.32], [32.0, 32.63], [39.0, 39.78], [44.0, 48.98], [49.0, 52.22], [58.0, 58.75], [65.0, 65.53], [66.0, 66.06], [68.0, 69.36], [70.0, 71.83], [75.0, 76.23], [82.0, 93.93], [95.0, 100.74], [103.0, 106.86], [108.0, 109.0], [111.0, 114.59], [116.0, 116.73], [118.0, 119.45], [124.0, 125.71], [127.0, 127.82], [132.0, 135.77], [137.0, 139.99], [142.0, 150.36], [153.0, 154.95], [155.0, 156.59], [158.0, 159.85], [160.0, 162.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 73.06, 68.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 99.99, 95.64, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 63.42, 51.94, 55.04, 0.0, 0.0, 0.0, 99.87], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.21, 1.84, 1.32, 0.63, 0.78, 4.98, 3.22, 0.75, 0.53, 0.06, 1.36, 1.83, 1.23, 11.93, 5.74, 3.86, 1.0, 3.59, 0.73, 1.45, 1.71, 0.82, 3.77, 2.99, 8.36, 1.95, 1.59, 1.85, 2.3]} \ No newline at end of file diff --git a/annotations_filtered/0_hajel24IE_filtered.json b/annotations_filtered/0_hajel24IE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f02bb05593c7ce7096f3e75d3b0f3b84a24183eb --- /dev/null +++ b/annotations_filtered/0_hajel24IE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.32], [16.0, 17.85], [19.0, 18.93], [19.0, 33.84], [34.0, 34.7], [35.0, 35.33], [35.0, 43.07], [44.0, 44.07], [44.0, 115.16], [118.0, 120.53], [122.0, 122.25], [124.0, 123.74]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 80.11, 0.0, 0.0, 86.82, 0.0, 0.0, 30.8, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 17.47], ["vehicle", 13.93], ["moo", 10.82]], null, null], "duration": [1.32, 1.85, -0.07, 14.84, 0.7, 0.33, 8.07, 0.07, 71.16, 2.53, 0.25, -0.26]} \ No newline at end of file diff --git a/annotations_filtered/0_m8AmAm-XE_filtered.json b/annotations_filtered/0_m8AmAm-XE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b62a86eb9b136ac448a7d98848f178639a040fdb --- /dev/null +++ b/annotations_filtered/0_m8AmAm-XE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 37.13], [40.0, 67.27], [67.0, 67.31], [67.0, 67.34], [68.0, 67.58], [68.0, 76.35], [79.0, 94.96], [98.0, 110.08], [110.0, 110.3], [119.0, 119.52]], "keep_status": [false, true, false, false, false, true, false, true, false, false], "silence_prob": [40.97, 41.36, 0.0, 0.0, 0.0, 36.47, 36.39, 37.08, 0.0, 0.0], "audiomae_on_audioset": [[["theremin", 56.79], ["music", 24.56], ["didgeridoo", 2.63]], [["music", 38.63], ["brass instrument", 8.1], ["trombone", 7.97]], null, null, null, [["music", 30.97], ["whale vocalization", 16.34], ["percussion", 10.35]], [["music", 59.25], ["drum", 5.6], ["brass instrument", 5.41]], [["music", 40.52], ["tabla", 7.66], ["musical instrument", 7.14]], null, null], "duration": [4.13, 27.27, 0.31, 0.34, -0.42, 8.35, 15.96, 12.08, 0.3, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/0_pN-X7Gew8_filtered.json b/annotations_filtered/0_pN-X7Gew8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f18ba561d76aa1891049cb084f2e4d57bcbe5dd --- /dev/null +++ b/annotations_filtered/0_pN-X7Gew8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.81], [5.0, 5.78], [7.0, 9.76], [11.0, 29.67], [32.0, 84.6], [85.0, 85.67], [86.0, 89.72], [93.0, 107.33], [111.0, 111.13], [112.0, 125.88]], "keep_status": [false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 70.16, 36.01, 0.0, 0.0, 45.27, 40.86, 0.0, 37.49], "audiomae_on_audioset": [null, null, null, [["music", 62.35], ["neigh, whinny", 9.23], ["horse", 5.52]], null, null, [["music", 39.1], ["theremin", 26.24], ["foghorn", 4.28]], [["music", 59.38], ["theremin", 15.64], ["ambient music", 4.67]], null, [["music", 63.14], ["theremin", 8.29], ["brass instrument", 4.07]]], "duration": [0.81, 0.78, 2.76, 18.67, 52.6, 0.67, 3.72, 14.33, 0.13, 13.88]} \ No newline at end of file diff --git a/annotations_filtered/0aKB_Qm-z6g_filtered.json b/annotations_filtered/0aKB_Qm-z6g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..706634bfa859e153adffe1c29ecad8080dbdacee --- /dev/null +++ b/annotations_filtered/0aKB_Qm-z6g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.88], [8.0, 8.28], [9.0, 10.79], [11.0, 13.71], [14.0, 15.21], [17.0, 22.38], [29.0, 29.66], [36.0, 36.56], [39.0, 39.46], [44.0, 44.95], [49.0, 50.09], [52.0, 54.45], [56.0, 58.36], [63.0, 64.1], [72.0, 74.12], [75.0, 76.06], [81.0, 83.27], [84.0, 91.2], [92.0, 92.5], [106.0, 106.54], [111.0, 117.39], [117.0, 118.89]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 40.59, 0.0, 34.56, 0.0, 0.0, 0.0, 0.0, 0.0, 65.67, 51.02, 0.0, 99.98, 0.0, 79.59, 33.28, 0.0, 0.0, 34.03, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 54.9], ["sidetone", 24.84], ["hum", 2.83]], null, [["speech", 16.15], ["mosquito", 12.84], ["fly, housefly", 9.52]], null, null, null, null, null, null, null, null, null, null, null, [["whistling", 95.31], ["beatboxing", 1.41], ["speech", 0.59]], null, null, [["music", 49.71], ["guitar", 9.14], ["musical instrument", 4.78]], null], "duration": [0.88, 0.28, 1.79, 2.71, 1.21, 5.38, 0.66, 0.56, 0.46, 0.95, 1.09, 2.45, 2.36, 1.1, 2.12, 1.06, 2.27, 7.2, 0.5, 0.54, 6.39, 1.89]} \ No newline at end of file diff --git a/annotations_filtered/0aX79Yt3Bno_filtered.json b/annotations_filtered/0aX79Yt3Bno_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5395bb81dd57e34f28c5d75a7d17e7048f6f1fd9 --- /dev/null +++ b/annotations_filtered/0aX79Yt3Bno_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 8.18], [10.0, 16.29], [16.0, 17.19], [22.0, 22.06], [25.0, 26.72], [29.0, 31.24], [49.0, 53.03], [53.0, 60.39], [70.0, 72.57], [85.0, 85.5], [92.0, 94.49], [111.0, 113.27], [115.0, 124.06]], "keep_status": [true, true, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [33.95, 42.58, 0.0, 0.0, 0.0, 56.7, 80.29, 56.48, 59.77, 0.0, 30.64, 32.72, 30.65], "audiomae_on_audioset": [[["speech", 37.56], ["music", 9.27], ["explosion", 6.16]], [["speech", 47.93], ["frog", 11.28], ["animal", 7.89]], null, null, null, null, null, null, null, null, [["speech", 23.88], ["gunshot, gunfire", 13.29], ["whack, thwack", 12.82]], [["frog", 22.78], ["animal", 13.49], ["boing", 7.22]], [["cattle, bovinae", 20.96], ["speech", 19.67], ["animal", 10.16]]], "duration": [6.18, 6.29, 1.19, 0.06, 1.72, 2.24, 4.03, 7.39, 2.57, 0.5, 2.49, 2.27, 9.06]} \ No newline at end of file diff --git a/annotations_filtered/0adv8zQsa9I_filtered.json b/annotations_filtered/0adv8zQsa9I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc5eb3b7e0e7f8dde40877685760bcbdee1d57f8 --- /dev/null +++ b/annotations_filtered/0adv8zQsa9I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.86], [3.0, 6.71], [8.0, 9.95], [11.0, 14.77], [15.0, 17.96], [19.0, 32.22], [33.0, 35.23], [36.0, 38.01], [39.0, 39.92], [42.0, 43.11], [46.0, 46.89], [48.0, 50.3], [52.0, 54.92], [55.0, 58.36], [59.0, 63.31], [64.0, 66.95], [69.0, 74.14], [76.0, 76.27], [77.0, 79.14], [80.0, 80.08], [81.0, 81.85], [83.0, 83.17], [86.0, 87.22], [90.0, 90.41], [92.0, 93.31], [95.0, 99.62], [103.0, 104.77], [107.0, 132.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 87.0, 0.0, 100.0, 100.0, 98.01, 81.89, 100.0, 0.0, 0.0, 0.0, 100.0, 66.51, 100.0, 100.0, 100.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.86, 3.71, 1.95, 3.77, 2.96, 13.22, 2.23, 2.01, 0.92, 1.11, 0.89, 2.3, 2.92, 3.36, 4.31, 2.95, 5.14, 0.27, 2.14, 0.08, 0.85, 0.17, 1.22, 0.41, 1.31, 4.62, 1.77, 25.63]} \ No newline at end of file diff --git a/annotations_filtered/0atATbXbQ9g_filtered.json b/annotations_filtered/0atATbXbQ9g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70e8240381adb403af7a3626f9164321ab602a39 --- /dev/null +++ b/annotations_filtered/0atATbXbQ9g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.46], [4.0, 5.73], [7.0, 8.83], [10.0, 12.48], [15.0, 17.1], [20.0, 22.06], [27.0, 28.14], [29.0, 29.88], [34.0, 35.36]], "keep_status": [false, false, false, true, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 40.64, 43.98, 42.06, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 31.7], ["didgeridoo", 21.51], ["insect", 7.26]], [["music", 41.55], ["theremin", 12.21], ["musical instrument", 5.53]], [["music", 19.09], ["speech", 8.22], ["didgeridoo", 8.0]], null, null, null], "duration": [0.46, 1.73, 1.83, 2.48, 2.1, 2.06, 1.14, 0.88, 1.36]} \ No newline at end of file diff --git a/annotations_filtered/0bR6pUOhZo4_filtered.json b/annotations_filtered/0bR6pUOhZo4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20c49615a738485c8d8099b4c35743bcca264a2e --- /dev/null +++ b/annotations_filtered/0bR6pUOhZo4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.63], [17.0, 20.78], [24.0, 24.68], [30.0, 30.64], [44.0, 44.58], [48.0, 49.37], [53.0, 54.09], [55.0, 65.03], [67.0, 67.29], [70.0, 70.58], [72.0, 75.3], [77.0, 77.9], [80.0, 81.03], [83.0, 84.03], [86.0, 86.31], [89.0, 89.09], [91.0, 92.2], [97.0, 97.93], [101.0, 102.49], [105.0, 106.46], [109.0, 110.32], [116.0, 116.29], [122.0, 123.79], [126.0, 142.87], [144.0, 146.72], [151.0, 151.21], [151.0, 151.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.29, 97.43, 0.0, 0.0, 0.0, 0.0, 0.0, 95.23, 0.0, 0.0, 98.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.07, 68.28, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.63, 3.78, 0.68, 0.64, 0.58, 1.37, 1.09, 10.03, 0.29, 0.58, 3.3, 0.9, 1.03, 1.03, 0.31, 0.09, 1.2, 0.93, 1.49, 1.46, 1.32, 0.29, 1.79, 16.87, 2.72, 0.21, 0.41]} \ No newline at end of file diff --git a/annotations_filtered/0bRr_MER6Vg_filtered.json b/annotations_filtered/0bRr_MER6Vg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e6f2407d1adee4f41eb777d50ebdffda6ca5a42 --- /dev/null +++ b/annotations_filtered/0bRr_MER6Vg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.27], [9.0, 9.46], [14.0, 14.77], [19.0, 18.72], [34.0, 34.43], [36.0, 37.02], [40.0, 40.91], [44.0, 44.56], [61.0, 61.37], [74.0, 74.66], [80.0, 80.54], [85.0, 86.02], [98.0, 97.93], [100.0, 101.48], [115.0, 116.07], [117.0, 117.26], [118.0, 118.59], [133.0, 133.83], [147.0, 149.37], [154.0, 155.01], [156.0, 156.44], [157.0, 157.67], [161.0, 161.92], [172.0, 173.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.37, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.27, 0.46, 0.77, -0.28, 0.43, 1.02, 0.91, 0.56, 0.37, 0.66, 0.54, 1.02, -0.07, 1.48, 1.07, 0.26, 0.59, 0.83, 2.37, 1.01, 0.44, 0.67, 0.92, 1.13]} \ No newline at end of file diff --git a/annotations_filtered/0bbWQy30oc8_filtered.json b/annotations_filtered/0bbWQy30oc8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..083919fd7bc7739fb6caf921680002c3463fe362 --- /dev/null +++ b/annotations_filtered/0bbWQy30oc8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.08], [7.0, 23.65], [29.0, 51.41], [54.0, 54.94], [56.0, 58.23], [59.0, 59.86], [61.0, 80.81], [81.0, 81.73], [84.0, 92.3], [95.0, 97.26], [100.0, 100.26]], "keep_status": [true, true, true, false, true, false, true, false, false, true, false], "silence_prob": [40.28, 32.11, 30.99, 0.0, 31.85, 0.0, 30.5, 0.0, 31.52, 35.1, 0.0], "audiomae_on_audioset": [[["music", 24.92], ["speech", 14.81], ["bee, wasp, etc.", 9.26]], [["speech", 30.72], ["fly, housefly", 19.83], ["music", 11.69]], [["speech", 38.27], ["buzz", 9.16], ["hum", 9.01]], null, [["music", 21.69], ["vehicle", 9.63], ["speech", 5.19]], null, [["music", 26.47], ["hum", 11.71], ["buzz", 7.79]], null, [["music", 69.75], ["boing", 19.04], ["speech", 1.4]], [["music", 30.79], ["guitar", 10.86], ["musical instrument", 9.43]], null], "duration": [2.08, 16.65, 22.41, 0.94, 2.23, 0.86, 19.81, 0.73, 8.3, 2.26, 0.26]} \ No newline at end of file diff --git a/annotations_filtered/0bkaFNVY2UQ_filtered.json b/annotations_filtered/0bkaFNVY2UQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41e6f817fc7e3509fe1fd6a2cccc9c68ac2b2ae2 --- /dev/null +++ b/annotations_filtered/0bkaFNVY2UQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.86], [4.0, 5.19], [7.0, 9.41], [11.0, 12.06], [14.0, 14.54], [19.0, 20.06], [25.0, 25.51], [27.0, 27.63], [28.0, 29.08], [30.0, 30.69], [32.0, 33.88], [43.0, 44.54], [51.0, 52.15], [53.0, 56.25], [59.0, 60.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.86, 1.19, 2.41, 1.06, 0.54, 1.06, 0.51, 0.63, 1.08, 0.69, 1.88, 1.54, 1.15, 3.25, 1.72]} \ No newline at end of file diff --git a/annotations_filtered/0bw8UM1eLFo_filtered.json b/annotations_filtered/0bw8UM1eLFo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21061c9aabeef186692011699d2dcb5d8282ace9 --- /dev/null +++ b/annotations_filtered/0bw8UM1eLFo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.7], [6.0, 13.73], [16.0, 19.5], [21.0, 28.07], [29.0, 36.31], [39.0, 44.02], [45.0, 47.68], [49.0, 51.17], [55.0, 55.68], [57.0, 57.45], [59.0, 60.1], [64.0, 65.57], [67.0, 68.22], [69.0, 70.9], [72.0, 88.97], [90.0, 95.74], [98.0, 104.19], [107.0, 110.49], [112.0, 118.67], [120.0, 127.16], [127.0, 146.33], [148.0, 156.02], [165.0, 167.16], [169.0, 170.36], [172.0, 172.13], [179.0, 180.37], [181.0, 199.93], [200.0, 202.05], [203.0, 205.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 99.99, 100.0, 100.0, 100.0, 98.86, 99.98, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.52, 99.84, 96.42, 100.0, 100.0, 100.0, 97.73, 32.59, 37.34, 0.0, 0.0, 0.0, 56.48, 61.08, 69.74], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 56.83], ["sidetone", 17.23], ["noise", 2.15]], [["fly, housefly", 27.21], ["insect", 16.22], ["mosquito", 13.36]], null, null, null, null, null, null], "duration": [1.7, 7.73, 3.5, 7.07, 7.31, 5.02, 2.68, 2.17, 0.68, 0.45, 1.1, 1.57, 1.22, 1.9, 16.97, 5.74, 6.19, 3.49, 6.67, 7.16, 19.33, 8.02, 2.16, 1.36, 0.13, 1.37, 18.93, 2.05, 2.75]} \ No newline at end of file diff --git a/annotations_filtered/0c-UIkfsk1U_filtered.json b/annotations_filtered/0c-UIkfsk1U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5aebc7752e58bf5f9761d8addcf3c402dab1cc01 --- /dev/null +++ b/annotations_filtered/0c-UIkfsk1U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.41], [24.0, 23.79], [26.0, 26.28], [32.0, 33.05], [42.0, 42.45], [43.0, 43.53], [44.0, 44.44], [48.0, 48.37], [49.0, 50.21], [57.0, 57.08], [59.0, 59.26], [63.0, 64.07], [66.0, 74.82], [79.0, 79.84], [81.0, 92.04], [95.0, 98.83], [101.0, 101.22], [104.0, 107.35], [109.0, 110.4], [112.0, 120.48], [123.0, 129.59], [131.0, 131.06], [132.0, 133.08], [139.0, 139.29], [144.0, 144.95], [146.0, 147.5], [158.0, 159.38], [160.0, 160.41], [161.0, 161.37], [162.0, 162.57], [163.0, 163.8], [166.0, 166.11], [167.0, 170.14], [171.0, 172.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.41, 0.0, 31.22, 99.36, 0.0, 99.99, 0.0, 99.4, 69.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 25.12], ["whack, thwack", 17.23], ["speech", 9.5]], null, [["whack, thwack", 45.17], ["speech", 5.89], ["sound effect", 4.21]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.41, -0.21, 0.28, 1.05, 0.45, 0.53, 0.44, 0.37, 1.21, 0.08, 0.26, 1.07, 8.82, 0.84, 11.04, 3.83, 0.22, 3.35, 1.4, 8.48, 6.59, 0.06, 1.08, 0.29, 0.95, 1.5, 1.38, 0.41, 0.37, 0.57, 0.8, 0.11, 3.14, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/0cHePp1_EMg_filtered.json b/annotations_filtered/0cHePp1_EMg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a5ac106aad848ed80a8e99fc99dcc3ad1055c10 --- /dev/null +++ b/annotations_filtered/0cHePp1_EMg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.05], [8.0, 8.04], [11.0, 11.62], [12.0, 24.93], [26.0, 27.41], [28.0, 28.78], [30.0, 30.11], [31.0, 30.97], [32.0, 32.34], [38.0, 39.73], [40.0, 42.06], [46.0, 45.74], [46.0, 49.42], [50.0, 51.06], [52.0, 51.93], [53.0, 54.23], [55.0, 55.32], [59.0, 60.18], [61.0, 62.7], [64.0, 65.89], [81.0, 81.46], [82.0, 83.47], [86.0, 108.43], [114.0, 130.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.62, 0.0, 98.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.87, 65.09], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.05, 0.04, 0.62, 12.93, 1.41, 0.78, 0.11, -0.03, 0.34, 1.73, 2.06, -0.26, 3.42, 1.06, -0.07, 1.23, 0.32, 1.18, 1.7, 1.89, 0.46, 1.47, 22.43, 16.94]} \ No newline at end of file diff --git a/annotations_filtered/0cPT4zspVc0_filtered.json b/annotations_filtered/0cPT4zspVc0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..308a6c133cd2ca29e51e6174a1700fc9378b857e --- /dev/null +++ b/annotations_filtered/0cPT4zspVc0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.21], [7.0, 11.28], [15.0, 15.9], [20.0, 20.65], [23.0, 23.65], [24.0, 34.18], [36.0, 36.71], [40.0, 39.77], [41.0, 41.45], [48.0, 53.5], [64.0, 67.78], [70.0, 74.6], [78.0, 95.77], [96.0, 97.26], [98.0, 98.58], [99.0, 101.39], [104.0, 109.07], [111.0, 119.85], [123.0, 123.38], [142.0, 147.45]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, true, true, false, false, false, true, false, false, true], "silence_prob": [0.0, 30.33, 0.0, 0.0, 0.0, 31.12, 0.0, 0.0, 0.0, 29.32, 29.36, 29.74, 31.75, 0.0, 0.0, 49.78, 47.54, 32.07, 0.0, 29.18], "audiomae_on_audioset": [null, [["music", 40.53], ["throbbing", 29.76], ["hum", 14.35]], null, null, null, [["speech", 82.41], ["hum", 2.46], ["throbbing", 1.84]], null, null, null, [["groan", 23.97], ["speech", 22.72], ["music", 16.71]], [["vehicle", 14.7], ["groan", 11.14], ["animal", 7.34]], [["music", 32.75], ["speech", 7.39], ["groan", 6.83]], [["music", 47.86], ["speech", 14.16], ["noise", 4.35]], null, null, [["speech", 82.97], ["music", 10.57], ["fart", 1.44]], [["speech", 37.91], ["sidetone", 14.43], ["hum", 9.11]], [["electric shaver, electric razor", 29.74], ["mains hum", 28.5], ["hum", 24.71]], null, [["mains hum", 30.03], ["speech", 17.1], ["electric shaver, electric razor", 17.01]]], "duration": [1.21, 4.28, 0.9, 0.65, 0.65, 10.18, 0.71, -0.23, 0.45, 5.5, 3.78, 4.6, 17.77, 1.26, 0.58, 2.39, 5.07, 8.85, 0.38, 5.45]} \ No newline at end of file diff --git a/annotations_filtered/0dlFAtbte0c_filtered.json b/annotations_filtered/0dlFAtbte0c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7648c0e699ad18f077312010ac1ee5fecb80fc26 --- /dev/null +++ b/annotations_filtered/0dlFAtbte0c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.59], [2.0, 2.51]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [-0.41, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/0eC9f13FIJ0_filtered.json b/annotations_filtered/0eC9f13FIJ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7f80e3d3453e84bae7f3f3b5d1f62fdcd1b2248 --- /dev/null +++ b/annotations_filtered/0eC9f13FIJ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.12], [25.0, 26.3], [28.0, 28.73], [33.0, 36.73], [39.0, 39.12], [40.0, 41.17], [42.0, 42.62], [47.0, 47.28], [51.0, 51.04], [55.0, 58.19], [67.0, 67.64], [69.0, 69.35], [70.0, 69.92], [80.0, 80.72], [85.0, 87.03], [88.0, 106.34], [109.0, 110.62], [111.0, 112.43], [114.0, 114.44], [117.0, 118.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 55.6, 0.0, 0.0, 0.0, 0.0, 0.0, 75.23, 0.0, 0.0, 0.0, 0.0, 65.44, 47.66, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 66.88], ["musical instrument", 6.29], ["synthesizer", 4.45]], null, null, null, null], "duration": [1.12, 1.3, 0.73, 3.73, 0.12, 1.17, 0.62, 0.28, 0.04, 3.19, 0.64, 0.35, -0.08, 0.72, 2.03, 18.34, 1.62, 1.43, 0.44, 1.35]} \ No newline at end of file diff --git a/annotations_filtered/0eJpmeoLXLg_filtered.json b/annotations_filtered/0eJpmeoLXLg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9354eb95d3eb349157913163eb61dd342b494492 --- /dev/null +++ b/annotations_filtered/0eJpmeoLXLg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.64], [6.0, 5.68], [6.0, 5.75], [6.0, 12.72], [24.0, 25.25], [37.0, 37.94], [38.0, 39.8], [71.0, 71.79]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 52.74, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.64, -0.32, -0.25, 6.72, 1.25, 0.94, 1.8, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/0ePC0mh4rCY_filtered.json b/annotations_filtered/0ePC0mh4rCY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3fd920c5073072f9c6118e9a2ecde0ebd0c334c7 --- /dev/null +++ b/annotations_filtered/0ePC0mh4rCY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.22], [2.0, 2.2], [3.0, 3.37], [4.0, 4.5], [5.0, 10.03], [13.0, 18.64], [19.0, 18.67], [19.0, 18.71], [19.0, 18.74], [19.0, 21.98], [23.0, 23.21], [24.0, 24.22], [27.0, 27.7], [29.0, 49.11], [49.0, 50.21], [55.0, 55.07], [57.0, 57.18], [58.0, 58.01], [59.0, 59.14], [60.0, 60.61], [61.0, 63.86], [64.0, 64.52], [74.0, 91.17], [95.0, 96.25], [100.0, 99.71], [102.0, 102.12], [103.0, 104.13], [107.0, 110.59], [112.0, 112.94], [113.0, 112.97]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.73, 30.05, 0.0, 0.0, 0.0, 31.24, 0.0, 0.0, 0.0, 32.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.3, 0.0, 37.17, 0.0, 0.0, 0.0, 0.0, 37.42, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 40.91], ["livestock, farm animals, working animals", 13.28], ["cattle, bovinae", 10.73]], [["music", 67.85], ["speech", 6.4], ["mosquito", 5.99]], null, null, null, [["electric shaver, electric razor", 34.81], ["cattle, bovinae", 20.04], ["speech", 12.07]], null, null, null, [["livestock, farm animals, working animals", 53.53], ["buzz", 10.25], ["cattle, bovinae", 6.93]], null, null, null, null, null, null, [["speech", 57.68], ["fly, housefly", 4.58], ["insect", 3.5]], null, [["beatboxing", 14.03], ["mosquito", 13.18], ["noise", 12.99]], null, null, null, null, [["livestock, farm animals, working animals", 25.27], ["fly, housefly", 19.78], ["insect", 9.92]], null, null], "duration": [1.22, 0.2, 0.37, 0.5, 5.03, 5.64, -0.33, -0.29, -0.26, 2.98, 0.21, 0.22, 0.7, 20.11, 1.21, 0.07, 0.18, 0.01, 0.14, 0.61, 2.86, 0.52, 17.17, 1.25, -0.29, 0.12, 1.13, 3.59, 0.94, -0.03]} \ No newline at end of file diff --git a/annotations_filtered/0eQBa4JQzDI_filtered.json b/annotations_filtered/0eQBa4JQzDI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1921248717362331032472a4d6eedca4edbb5662 --- /dev/null +++ b/annotations_filtered/0eQBa4JQzDI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.24], [3.0, 3.08], [3.0, 7.87], [8.0, 10.32], [13.0, 21.91], [26.0, 27.84], [29.0, 32.32], [33.0, 34.75], [35.0, 38.91], [41.0, 41.37], [42.0, 42.42], [44.0, 43.93], [45.0, 46.25], [48.0, 49.55], [52.0, 52.73], [53.0, 54.3], [56.0, 56.66], [57.0, 57.72], [58.0, 60.52], [62.0, 63.58], [64.0, 66.51], [67.0, 68.88], [72.0, 76.45], [78.0, 78.8], [79.0, 79.54], [80.0, 81.53], [82.0, 82.59], [85.0, 89.77], [92.0, 92.25], [94.0, 94.44], [95.0, 95.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 100.0, 100.0, 0.0, 99.99, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 98.99, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 98.27, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.24, 0.08, 4.87, 2.32, 8.91, 1.84, 3.32, 1.75, 3.91, 0.37, 0.42, -0.07, 1.25, 1.55, 0.73, 1.3, 0.66, 0.72, 2.52, 1.58, 2.51, 1.88, 4.45, 0.8, 0.54, 1.53, 0.59, 4.77, 0.25, 0.44, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/0ekAvNp_F9c_filtered.json b/annotations_filtered/0ekAvNp_F9c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ba935e339bc6c30eb598b490fb975d6c92dc35f --- /dev/null +++ b/annotations_filtered/0ekAvNp_F9c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.0], [8.0, 9.07], [10.0, 10.34], [13.0, 14.03], [16.0, 17.02], [18.0, 20.65], [22.0, 22.4], [24.0, 23.79], [29.0, 29.73], [31.0, 32.66], [39.0, 39.6], [41.0, 41.5], [49.0, 52.68], [57.0, 58.48], [64.0, 66.12], [79.0, 80.13], [86.0, 88.33], [96.0, 100.7], [102.0, 112.11], [113.0, 113.31], [114.0, 152.49], [153.0, 152.86], [154.0, 162.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 69.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.9, 0.0, 72.75, 0.0, 73.21, 36.07, 32.96, 0.0, 0.0, 0.0, 29.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 29.78], ["singing bowl", 22.86], ["speech", 22.05]], null, null, null, null, [["music", 55.35], ["electronic music", 5.92], ["sonar", 4.85]], [["hum", 31.75], ["music", 28.14], ["gong", 9.61]], null, null, null, [["music", 41.49], ["speech", 11.54], ["scary music", 7.45]]], "duration": [1.0, 1.07, 0.34, 1.03, 1.02, 2.65, 0.4, -0.21, 0.73, 1.66, 0.6, 0.5, 3.68, 1.48, 2.12, 1.13, 2.33, 4.7, 10.11, 0.31, 38.49, -0.14, 8.36]} \ No newline at end of file diff --git a/annotations_filtered/0en0UJ180yc_filtered.json b/annotations_filtered/0en0UJ180yc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f29574be5e5c83b043554de5ced3baf146968ac1 --- /dev/null +++ b/annotations_filtered/0en0UJ180yc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.38], [6.0, 7.55], [13.0, 13.76], [17.0, 21.59], [25.0, 36.71], [41.0, 46.5], [50.0, 86.95], [87.0, 87.44], [87.0, 90.91], [93.0, 104.94]], "keep_status": [false, false, false, true, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 37.81, 31.89, 31.67, 0.0, 0.0, 31.83, 31.69], "audiomae_on_audioset": [null, null, null, [["radio", 21.07], ["hum", 16.61], ["throbbing", 13.87]], [["speech", 51.86], ["artillery fire", 12.55], ["explosion", 4.58]], [["speech", 71.44], ["explosion", 6.08], ["artillery fire", 5.36]], null, null, [["speech", 59.49], ["radio", 14.35], ["sidetone", 8.74]], [["music", 12.34], ["hum", 10.07], ["cacophony", 8.5]]], "duration": [1.38, 1.55, 0.76, 4.59, 11.71, 5.5, 36.95, 0.44, 3.91, 11.94]} \ No newline at end of file diff --git a/annotations_filtered/0ezPVizHpY0_filtered.json b/annotations_filtered/0ezPVizHpY0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7641e1bb1bb46053e22775883592bdce1260b3d --- /dev/null +++ b/annotations_filtered/0ezPVizHpY0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 26.69], [29.0, 29.84], [31.0, 31.83], [33.0, 55.41], [57.0, 104.84], [118.0, 119.04], [120.0, 120.16], [121.0, 153.0], [155.0, 184.99]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.14, 0.0, 0.0, 0.0, 0.0, 32.26], "audiomae_on_audioset": [null, null, null, [["hum", 49.78], ["music", 11.11], ["throbbing", 10.5]], null, null, null, null, [["music", 40.94], ["speech", 18.86], ["fart", 18.42]]], "duration": [1.69, 0.84, 0.83, 22.41, 47.84, 1.04, 0.16, 32.0, 29.99]} \ No newline at end of file diff --git a/annotations_filtered/0f2bU9SzCzs_filtered.json b/annotations_filtered/0f2bU9SzCzs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..927959aae227f473812207f7edd405c338d0708a --- /dev/null +++ b/annotations_filtered/0f2bU9SzCzs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 12.34], [19.0, 19.65], [26.0, 26.59], [33.0, 33.15], [35.0, 35.7], [41.0, 41.98], [43.0, 44.66], [46.0, 47.24], [48.0, 49.13], [50.0, 51.38], [54.0, 72.99], [77.0, 111.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [59.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.32, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["sidetone", 59.08], ["music", 16.0], ["speech", 13.05]], null], "duration": [8.34, 0.65, 0.59, 0.15, 0.7, 0.98, 1.66, 1.24, 1.13, 1.38, 18.99, 34.25]} \ No newline at end of file diff --git a/annotations_filtered/0fBA7VUZEgY_filtered.json b/annotations_filtered/0fBA7VUZEgY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..264a39c53228190d370608dede19c727bfe47148 --- /dev/null +++ b/annotations_filtered/0fBA7VUZEgY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.08], [4.0, 4.99], [9.0, 10.93], [15.0, 16.31], [20.0, 23.92], [28.0, 29.67], [31.0, 31.8], [32.0, 33.22], [36.0, 38.31], [39.0, 40.51], [51.0, 52.14], [56.0, 58.23], [60.0, 61.05], [62.0, 62.55], [64.0, 65.03], [67.0, 70.23], [71.0, 73.79], [75.0, 76.22], [77.0, 119.5], [120.0, 121.8], [122.0, 123.15], [125.0, 126.67], [127.0, 129.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.59, 0.0, 0.0, 0.0, 81.35, 0.0, 0.0, 83.7, 0.0, 0.0, 0.0, 81.17, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 31.9], "audiomae_on_audioset": [null, null, null, null, [["speech", 66.8], ["fart", 21.35], ["electric shaver, electric razor", 2.88]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.82], ["fireworks", 3.53], ["music", 2.45]]], "duration": [0.08, 0.99, 1.93, 1.31, 3.92, 1.67, 0.8, 1.22, 2.31, 1.51, 1.14, 2.23, 1.05, 0.55, 1.03, 3.23, 2.79, 1.22, 42.5, 1.8, 1.15, 1.67, 2.22]} \ No newline at end of file diff --git a/annotations_filtered/0fTXzdHoip8_filtered.json b/annotations_filtered/0fTXzdHoip8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97751925e82a7b3b91d30435082ba729b92aaa59 --- /dev/null +++ b/annotations_filtered/0fTXzdHoip8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 39.87], [41.0, 42.84], [45.0, 48.98], [49.0, 50.95], [52.0, 52.74], [54.0, 55.92], [58.0, 59.31], [62.0, 71.83], [72.0, 73.53], [75.0, 110.24], [112.0, 148.68], [151.0, 156.84], [157.0, 157.94], [159.0, 160.27], [161.0, 161.97]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 33.65, 0.0, 0.0, 0.0, 0.0, 34.75, 0.0, 0.0, 0.0, 31.31, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 83.13], ["telephone", 4.94], ["dial tone", 4.02]], null, null, null, null, [["speech", 30.04], ["animal", 10.81], ["hum", 6.12]], null, null, null, [["speech", 24.94], ["sine wave", 13.81], ["whimper", 10.1]], null, null, null], "duration": [1.87, 1.84, 3.98, 1.95, 0.74, 1.92, 1.31, 9.83, 1.53, 35.24, 36.68, 5.84, 0.94, 1.27, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/0fbR1RvOCQA_filtered.json b/annotations_filtered/0fbR1RvOCQA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61745f8b77a539f6b7e78bc94f809f3bd5c325fc --- /dev/null +++ b/annotations_filtered/0fbR1RvOCQA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.21], [6.0, 6.42], [7.0, 7.84], [9.0, 12.09], [13.0, 14.25], [15.0, 16.9], [19.0, 18.96], [20.0, 20.98], [27.0, 28.04], [33.0, 33.0], [37.0, 37.89], [39.0, 39.78], [41.0, 42.65], [54.0, 55.98], [58.0, 59.54], [60.0, 61.18], [62.0, 62.88], [64.0, 64.84], [67.0, 71.04], [73.0, 82.12], [84.0, 86.68], [88.0, 88.5]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [46.22, 0.0, 0.0, 87.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.18, 37.38, 40.47, 0.0], "audiomae_on_audioset": [[["chirp tone", 16.63], ["sine wave", 16.02], ["whale vocalization", 11.97]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 51.12], ["speech", 37.15], ["inside, small room", 0.91]], [["hum", 44.72], ["throbbing", 30.91], ["music", 7.01]], null], "duration": [2.21, 0.42, 0.84, 3.09, 1.25, 1.9, -0.04, 0.98, 1.04, 0.0, 0.89, 0.78, 1.65, 1.98, 1.54, 1.18, 0.88, 0.84, 4.04, 9.12, 2.68, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/0foXV1hWrx4_filtered.json b/annotations_filtered/0foXV1hWrx4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48cbb23a3ce65256a21e83270e37d78ee79b1614 --- /dev/null +++ b/annotations_filtered/0foXV1hWrx4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.19], [6.0, 27.45], [28.0, 28.93], [32.0, 37.83], [39.0, 41.22], [46.0, 54.99], [57.0, 60.78], [61.0, 62.58], [64.0, 85.46], [88.0, 97.33], [99.0, 102.56], [107.0, 109.7], [111.0, 113.68], [116.0, 116.73], [118.0, 119.55], [121.0, 122.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 100.0, 100.0, 100.0, 100.0, 0.0, 99.99, 97.22, 100.0, 50.66, 98.73, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.19, 21.45, 0.93, 5.83, 2.22, 8.99, 3.78, 1.58, 21.46, 9.33, 3.56, 2.7, 2.68, 0.73, 1.55, 1.49]} \ No newline at end of file diff --git a/annotations_filtered/0fwudBWsw9Q_filtered.json b/annotations_filtered/0fwudBWsw9Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c131c2977a4cb4cdec4368201532a80897d04433 --- /dev/null +++ b/annotations_filtered/0fwudBWsw9Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 20.38], [22.0, 26.79], [32.0, 36.26], [37.0, 37.96], [40.0, 40.9], [42.0, 43.14], [44.0, 44.86], [52.0, 52.51], [53.0, 54.03], [55.0, 55.34], [56.0, 56.37], [59.0, 60.96], [62.0, 62.7], [66.0, 66.77], [70.0, 70.41], [70.0, 70.9], [73.0, 72.84], [73.0, 74.71], [79.0, 79.61], [80.0, 80.76], [81.0, 82.46], [84.0, 85.04], [87.0, 87.66], [89.0, 90.29], [91.0, 91.03], [93.0, 93.7], [95.0, 95.0], [99.0, 99.89], [107.0, 107.06], [108.0, 108.65], [111.0, 111.92], [117.0, 117.81], [118.0, 119.64], [125.0, 124.75]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.09, 38.19, 70.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 67.5], ["musical instrument", 7.55], ["speech", 6.92]], [["animal", 27.73], ["dog", 18.96], ["domestic animals, pets", 14.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [18.38, 4.79, 4.26, 0.96, 0.9, 1.14, 0.86, 0.51, 1.03, 0.34, 0.37, 1.96, 0.7, 0.77, 0.41, 0.9, -0.16, 1.71, 0.61, 0.76, 1.46, 1.04, 0.66, 1.29, 0.03, 0.7, 0.0, 0.89, 0.06, 0.65, 0.92, 0.81, 1.64, -0.25]} \ No newline at end of file diff --git a/annotations_filtered/0g2o-CfakW0_filtered.json b/annotations_filtered/0g2o-CfakW0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b920f7a7e1c8ff05a8f2c44d2bf17a056c89608d --- /dev/null +++ b/annotations_filtered/0g2o-CfakW0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.87], [5.0, 5.58], [6.0, 6.91], [7.0, 8.04], [10.0, 18.05], [19.0, 20.6], [22.0, 21.91], [23.0, 24.95], [28.0, 30.38], [33.0, 33.71], [34.0, 34.97], [36.0, 36.26], [37.0, 38.62], [40.0, 42.62], [44.0, 44.54], [46.0, 45.86], [47.0, 47.04], [48.0, 65.2], [67.0, 67.04], [68.0, 68.54], [69.0, 70.23], [73.0, 73.8], [76.0, 77.77], [79.0, 81.57], [82.0, 83.61], [85.0, 85.56], [86.0, 86.78], [87.0, 87.34], [88.0, 88.7], [89.0, 90.21], [91.0, 92.21], [95.0, 95.64], [96.0, 96.85], [97.0, 97.93], [98.0, 100.21], [101.0, 102.25], [103.0, 110.02], [111.0, 115.86], [117.0, 120.73], [125.0, 124.85], [126.0, 126.15], [127.0, 130.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 50.71, 0.0, 0.0, 0.0, 66.15, 0.0, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 0.0, 51.39, 0.0, 0.0, 0.0, 0.0, 0.0, 87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.28, 0.0, 53.34, 39.17, 36.32, 0.0, 0.0, 38.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 63.96], ["creak", 5.63], ["whale vocalization", 2.44]], null, null, [["speech", 58.25], ["music", 14.96], ["mains hum", 1.83]], [["music", 20.36], ["hum", 12.12], ["speech", 10.9]], null, null, [["mains hum", 16.88], ["hum", 16.38], ["music", 14.62]]], "duration": [0.87, 0.58, 0.91, 1.04, 8.05, 1.6, -0.09, 1.95, 2.38, 0.71, 0.97, 0.26, 1.62, 2.62, 0.54, -0.14, 0.04, 17.2, 0.04, 0.54, 1.23, 0.8, 1.77, 2.57, 1.61, 0.56, 0.78, 0.34, 0.7, 1.21, 1.21, 0.64, 0.85, 0.93, 2.21, 1.25, 7.02, 4.86, 3.73, -0.15, 0.15, 3.77]} \ No newline at end of file diff --git a/annotations_filtered/0gAMfKzCJsc_filtered.json b/annotations_filtered/0gAMfKzCJsc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0efc97f210055be1280405499de3851cb8b2d51 --- /dev/null +++ b/annotations_filtered/0gAMfKzCJsc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 17.74], [19.0, 20.56], [21.0, 26.57], [29.0, 30.77], [35.0, 35.61], [38.0, 39.16], [42.0, 47.06], [54.0, 55.0], [59.0, 60.02], [60.0, 60.4], [67.0, 76.96], [100.0, 102.44], [105.0, 111.11], [113.0, 113.53], [115.0, 115.57], [116.0, 118.32], [123.0, 125.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [100.0, 0.0, 77.53, 0.0, 0.0, 0.0, 43.66, 0.0, 0.0, 0.0, 38.58, 45.08, 30.17, 0.0, 0.0, 93.76, 92.15], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 45.88], ["speech", 37.11], ["inside, large room or hall", 1.41]], null, null, null, [["speech", 49.01], ["music", 13.47], ["fireworks", 4.1]], [["music", 55.27], ["synthesizer", 9.72], ["foghorn", 4.24]], [["music", 67.73], ["breaking", 6.76], ["thump, thud", 5.34]], null, null, null, null], "duration": [2.74, 1.56, 5.57, 1.77, 0.61, 1.16, 5.06, 1.0, 1.02, 0.4, 9.96, 2.44, 6.11, 0.53, 0.57, 2.32, 2.39]} \ No newline at end of file diff --git a/annotations_filtered/0gBKE5MUiQc_filtered.json b/annotations_filtered/0gBKE5MUiQc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b49465c4868621e221b78fcdb758600d3e62a1f9 --- /dev/null +++ b/annotations_filtered/0gBKE5MUiQc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.98], [22.0, 26.59], [29.0, 35.92], [38.0, 38.89], [39.0, 40.26], [47.0, 47.16], [54.0, 56.22], [57.0, 58.24], [58.0, 58.28], [61.0, 61.38], [65.0, 69.9], [75.0, 75.79], [78.0, 78.68], [97.0, 97.78], [100.0, 105.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.97, 51.02, 0.0, 0.0, 0.0, 93.76, 0.0, 0.0, 0.0, 96.89, 0.0, 0.0, 0.0, 31.39], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 31.76], ["cattle, bovinae", 24.54], ["moo", 21.07]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.65], ["thunk", 24.95], ["sound effect", 6.43]]], "duration": [0.98, 4.59, 6.92, 0.89, 1.26, 0.16, 2.22, 1.24, 0.28, 0.38, 4.9, 0.79, 0.68, 0.78, 5.8]} \ No newline at end of file diff --git a/annotations_filtered/0h0FeEzxCaM_filtered.json b/annotations_filtered/0h0FeEzxCaM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c43ed34220ceaa5113b8326389d87bacfa304a94 --- /dev/null +++ b/annotations_filtered/0h0FeEzxCaM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 57.99], [60.0, 63.49], [65.0, 86.58], [88.0, 88.42], [89.0, 94.29], [95.0, 95.81], [97.0, 97.88], [99.0, 99.45], [100.0, 114.84], [115.0, 124.09], [124.0, 128.12], [128.0, 196.53]], "keep_status": [false, false, false, false, true, false, false, false, true, true, false, false], "silence_prob": [0.0, 47.31, 31.52, 0.0, 40.88, 0.0, 0.0, 0.0, 32.29, 35.03, 51.07, 0.0], "audiomae_on_audioset": [null, [["music", 69.99], ["hum", 5.14], ["electronic music", 3.66]], [["mains hum", 33.39], ["music", 30.24], ["hum", 18.71]], null, [["sine wave", 19.41], ["speech", 17.53], ["tuning fork", 3.99]], null, null, null, [["fly, housefly", 15.51], ["speech", 8.33], ["insect", 7.51]], [["fly, housefly", 24.94], ["insect", 16.43], ["hum", 12.29]], null, null], "duration": [56.99, 3.49, 21.58, 0.42, 5.29, 0.81, 0.88, 0.45, 14.84, 9.09, 4.12, 68.53]} \ No newline at end of file diff --git a/annotations_filtered/0h0S6EmQWrI_filtered.json b/annotations_filtered/0h0S6EmQWrI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a04f853a749d0db4cbaca01b4bf05f75ffb5d152 --- /dev/null +++ b/annotations_filtered/0h0S6EmQWrI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.88], [15.0, 36.17], [38.0, 91.42], [96.0, 100.99], [102.0, 102.42], [103.0, 103.2], [108.0, 118.57], [121.0, 121.78], [122.0, 121.83], [122.0, 123.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.71, 0.0, 31.02, 0.0, 0.0, 30.75, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["throbbing", 41.03], ["music", 29.53], ["hum", 21.25]], null, [["whale vocalization", 68.18], ["music", 13.5], ["noise", 3.38]], null, null, [["music", 66.94], ["throbbing", 7.62], ["electronic music", 6.26]], null, null, null], "duration": [0.88, 21.17, 53.42, 4.99, 0.42, 0.2, 10.57, 0.78, -0.17, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/0hL-fpCsGR8_filtered.json b/annotations_filtered/0hL-fpCsGR8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7e9df6cc83c9afa257006e8e07c030087790a8c --- /dev/null +++ b/annotations_filtered/0hL-fpCsGR8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 17.27], [20.0, 25.2], [27.0, 33.29], [34.0, 36.05], [37.0, 43.33], [46.0, 56.32], [57.0, 64.52], [65.0, 67.49], [69.0, 92.8], [94.0, 101.76], [103.0, 110.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.16, 99.21, 99.4, 98.8, 96.29, 90.08, 95.09, 87.37, 91.64, 85.35, 52.45], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [5.27, 5.2, 6.29, 2.05, 6.33, 10.32, 7.52, 2.49, 23.8, 7.76, 7.34]} \ No newline at end of file diff --git a/annotations_filtered/0hNbRd78jOE_filtered.json b/annotations_filtered/0hNbRd78jOE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb63a5fa9d2d8a852360f56a2342353e7050669c --- /dev/null +++ b/annotations_filtered/0hNbRd78jOE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.44], [8.0, 9.05], [12.0, 11.84], [20.0, 20.39], [28.0, 31.65], [33.0, 33.34], [37.0, 37.37], [41.0, 41.81], [46.0, 46.89], [49.0, 49.71], [52.0, 53.38], [56.0, 57.16], [59.0, 59.56], [65.0, 70.07], [72.0, 72.84], [74.0, 76.0], [78.0, 78.75], [81.0, 85.58], [92.0, 93.38], [93.0, 94.53], [99.0, 99.76], [101.0, 103.08], [105.0, 105.6], [108.0, 109.46], [110.0, 111.87], [114.0, 114.15], [121.0, 122.08], [122.0, 123.36], [125.0, 125.29], [126.0, 126.45], [129.0, 131.73], [136.0, 137.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 46.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.47, 0.0, 35.85, 0.0, 37.99, 0.0, 0.0, 0.0, 49.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.41, 0.0], "audiomae_on_audioset": [null, null, null, null, [["moo", 36.0], ["cattle, bovinae", 32.17], ["livestock, farm animals, working animals", 28.38]], null, null, null, null, null, null, null, null, null, null, [["speech", 34.76], ["crowd", 8.95], ["fireworks", 4.79]], null, [["speech", 33.16], ["music", 15.6], ["boing", 9.01]], null, null, null, [["moo", 23.19], ["speech", 22.48], ["cattle, bovinae", 15.64]], null, null, null, null, null, null, null, null, null, null], "duration": [0.44, 1.05, -0.16, 0.39, 3.65, 0.34, 0.37, 0.81, 0.89, 0.71, 1.38, 1.16, 0.56, 5.07, 0.84, 2.0, 0.75, 4.58, 1.38, 1.53, 0.76, 2.08, 0.6, 1.46, 1.87, 0.15, 1.08, 1.36, 0.29, 0.45, 2.73, 1.29]} \ No newline at end of file diff --git a/annotations_filtered/0hau_p3N-MI_filtered.json b/annotations_filtered/0hau_p3N-MI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d64af465acb5460e880f012ce4c46cde6cb8ff46 --- /dev/null +++ b/annotations_filtered/0hau_p3N-MI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.6], [12.0, 12.58], [17.0, 17.83], [42.0, 42.43], [43.0, 43.93], [45.0, 45.47], [46.0, 46.57], [52.0, 52.07], [54.0, 57.87], [61.0, 61.57], [64.0, 68.07], [69.0, 76.17], [78.0, 81.73], [87.0, 87.99], [94.0, 123.11]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [68.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.84, 0.0, 91.81, 97.92, 96.66, 0.0, 33.58], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 42.33], ["music", 17.04], ["foghorn", 5.43]], null, null, null, null, null, [["music", 42.94], ["didgeridoo", 9.58], ["theremin", 8.92]]], "duration": [3.6, 0.58, 0.83, 0.43, 0.93, 0.47, 0.57, 0.07, 3.87, 0.57, 4.07, 7.17, 3.73, 0.99, 29.11]} \ No newline at end of file diff --git a/annotations_filtered/0iUKZskQEso_filtered.json b/annotations_filtered/0iUKZskQEso_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80b742f63450fb0df3482ac16dcc80d308bd23de --- /dev/null +++ b/annotations_filtered/0iUKZskQEso_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 22.96], [52.0, 52.2], [64.0, 65.01], [83.0, 97.55], [103.0, 103.18], [121.0, 121.9], [139.0, 165.86], [173.0, 174.04], [179.0, 179.85]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.99, 0.0, 0.0, 47.62, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 83.9], ["quack", 4.29], ["bleat", 1.55]], null, null, [["cattle, bovinae", 35.97], ["moo", 34.15], ["livestock, farm animals, working animals", 21.9]], null, null], "duration": [-0.04, 0.2, 1.01, 14.55, 0.18, 0.9, 26.86, 1.04, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/0igqAlu8Oqc_filtered.json b/annotations_filtered/0igqAlu8Oqc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e0b55a7b54dafa480c5f2366bab572e7e930981 --- /dev/null +++ b/annotations_filtered/0igqAlu8Oqc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.25], [22.0, 23.43], [29.0, 29.81], [46.0, 46.53], [49.0, 50.67], [62.0, 62.94], [68.0, 68.0], [70.0, 75.25], [76.0, 77.03], [83.0, 84.06], [91.0, 91.08], [92.0, 92.33], [96.0, 105.29], [114.0, 124.44], [134.0, 136.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 0.0, 0.0, 0.0, 34.32, 36.7, 52.74], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 24.92], ["explosion", 24.06], ["music", 20.63]], [["speech", 68.48], ["music", 15.67], ["sidetone", 2.96]], null], "duration": [1.25, 1.43, 0.81, 0.53, 1.67, 0.94, 0.0, 5.25, 1.03, 1.06, 0.08, 0.33, 9.29, 10.44, 2.14]} \ No newline at end of file diff --git a/annotations_filtered/0isiQvOb874_filtered.json b/annotations_filtered/0isiQvOb874_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e538d70bc4ad214816b7e77c7941934528b12589 --- /dev/null +++ b/annotations_filtered/0isiQvOb874_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.21], [14.0, 15.89], [18.0, 19.43], [20.0, 20.73], [23.0, 23.53], [24.0, 24.9], [26.0, 27.36], [33.0, 35.7], [50.0, 50.57], [53.0, 53.64], [62.0, 62.38], [65.0, 65.11], [65.0, 65.75], [66.0, 68.35]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.37, 0.0, 0.0, 0.0, 0.0, 0.0, 35.52], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 21.88], ["mains hum", 15.43], ["music", 13.6]], null, null, null, null, null, [["music", 28.93], ["speech", 11.16], ["vehicle", 4.99]]], "duration": [1.21, 1.89, 1.43, 0.73, 0.53, 0.9, 1.36, 2.7, 0.57, 0.64, 0.38, 0.11, 0.75, 2.35]} \ No newline at end of file diff --git a/annotations_filtered/0j9yDnytwPU_filtered.json b/annotations_filtered/0j9yDnytwPU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f7537daaaeded571430a3e1bc62652c7034911f --- /dev/null +++ b/annotations_filtered/0j9yDnytwPU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 14.05], [17.0, 18.32], [19.0, 19.94], [22.0, 22.05], [24.0, 27.03], [28.0, 28.83], [31.0, 33.99], [35.0, 35.77], [39.0, 39.97], [41.0, 41.49], [43.0, 45.4], [46.0, 49.94], [51.0, 51.58], [53.0, 58.14], [59.0, 62.07], [63.0, 66.93], [68.0, 89.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.97, 0.0, 0.0, 0.0, 100.0, 99.98, 0.0, 100.0, 99.91, 100.0, 99.85], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.05, 1.32, 0.94, 0.05, 3.03, 0.83, 2.99, 0.77, 0.97, 0.49, 2.4, 3.94, 0.58, 5.14, 3.07, 3.93, 21.46]} \ No newline at end of file diff --git a/annotations_filtered/0jSVwZ8w3C4_filtered.json b/annotations_filtered/0jSVwZ8w3C4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d87bc434a648010535c28d1f766df56063c72e92 --- /dev/null +++ b/annotations_filtered/0jSVwZ8w3C4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.24], [5.0, 6.51], [8.0, 14.98], [20.0, 19.95], [21.0, 20.88], [22.0, 33.0], [34.0, 35.41], [37.0, 38.15], [41.0, 49.0], [54.0, 54.95], [58.0, 59.09], [61.0, 61.47], [62.0, 72.0], [72.0, 73.5], [75.0, 79.37], [81.0, 82.73], [92.0, 93.56], [95.0, 95.82], [97.0, 98.56], [99.0, 100.16], [102.0, 102.1], [103.0, 103.69], [109.0, 109.78], [123.0, 125.04], [125.0, 125.07], [125.0, 125.1], [125.0, 125.24], [125.0, 125.36], [125.0, 125.49], [126.0, 126.54], [133.0, 133.86], [137.0, 139.4], [141.0, 141.45], [143.0, 144.46], [147.0, 147.85], [150.0, 150.67], [152.0, 153.81], [155.0, 155.49], [161.0, 161.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 52.68, 0.0, 0.0, 98.27, 0.0, 0.0, 75.88, 0.0, 0.0, 0.0, 56.48, 0.0, 53.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, 1.51, 6.98, -0.05, -0.12, 11.0, 1.41, 1.15, 8.0, 0.95, 1.09, 0.47, 10.0, 1.5, 4.37, 1.73, 1.56, 0.82, 1.56, 1.16, 0.1, 0.69, 0.78, 2.04, 0.07, 0.1, 0.24, 0.36, 0.49, 0.54, 0.86, 2.4, 0.45, 1.46, 0.85, 0.67, 1.81, 0.49, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/0jTSJ6NK6-4_filtered.json b/annotations_filtered/0jTSJ6NK6-4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35879829a9b931844e9ad065e5233193cde3dd39 --- /dev/null +++ b/annotations_filtered/0jTSJ6NK6-4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.64], [11.0, 11.4], [20.0, 19.92], [22.0, 22.01], [23.0, 23.95], [26.0, 26.42], [33.0, 33.45], [34.0, 35.16], [36.0, 36.8], [40.0, 40.24], [44.0, 43.7], [44.0, 44.96], [47.0, 49.62], [54.0, 54.68], [56.0, 56.52], [58.0, 57.96], [58.0, 68.0], [72.0, 73.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52, 0.0, 0.0, 0.0, 58.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.64, 0.4, -0.08, 0.01, 0.95, 0.42, 0.45, 1.16, 0.8, 0.24, -0.3, 0.96, 2.62, 0.68, 0.52, -0.04, 10.0, 1.99]} \ No newline at end of file diff --git a/annotations_filtered/0jxVnlRdelU_filtered.json b/annotations_filtered/0jxVnlRdelU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f0b62b8211363dc4c8b0506b07543d9261ae602 --- /dev/null +++ b/annotations_filtered/0jxVnlRdelU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.92], [3.0, 3.86], [5.0, 5.8], [7.0, 7.45], [15.0, 21.37], [22.0, 22.2], [23.0, 26.67], [27.0, 28.75], [31.0, 30.99], [32.0, 35.48], [36.0, 46.65], [48.0, 50.73], [52.0, 52.56], [54.0, 55.29], [56.0, 57.28], [58.0, 60.05], [62.0, 67.74], [69.0, 69.04], [76.0, 78.39], [84.0, 85.48], [89.0, 89.19], [92.0, 92.74], [95.0, 96.69], [98.0, 100.06], [103.0, 103.44], [106.0, 106.81], [111.0, 114.32], [116.0, 116.23], [117.0, 117.56], [120.0, 120.68], [129.0, 129.2], [130.0, 131.11], [133.0, 133.24], [137.0, 139.13], [141.0, 141.59], [142.0, 143.11], [146.0, 147.46], [148.0, 148.64], [149.0, 151.7], [153.0, 161.45], [162.0, 165.33], [166.0, 172.42], [176.0, 176.69], [181.0, 184.57], [188.0, 189.77], [190.0, 200.18], [201.0, 205.87], [207.0, 211.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 94.95, 0.0, 76.86, 0.0, 0.0, 82.79, 86.45, 81.35, 0.0, 0.0, 0.0, 68.41, 89.54, 0.0, 85.9, 0.0, 0.0, 0.0, 0.0, 82.97, 0.0, 0.0, 95.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.35, 0.0, 0.0, 0.0, 0.0, 59.24, 70.72, 94.95, 76.04, 0.0, 87.19, 0.0, 66.76, 86.27, 79.94], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 18.97], ["fly, housefly", 15.97], ["insect", 11.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.92, 0.86, 0.8, 0.45, 6.37, 0.2, 3.67, 1.75, -0.01, 3.48, 10.65, 2.73, 0.56, 1.29, 1.28, 2.05, 5.74, 0.04, 2.39, 1.48, 0.19, 0.74, 1.69, 2.06, 0.44, 0.81, 3.32, 0.23, 0.56, 0.68, 0.2, 1.11, 0.24, 2.13, 0.59, 1.11, 1.46, 0.64, 2.7, 8.45, 3.33, 6.42, 0.69, 3.57, 1.77, 10.18, 4.87, 4.05]} \ No newline at end of file diff --git a/annotations_filtered/0jzYpSrpVqU_filtered.json b/annotations_filtered/0jzYpSrpVqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3f746833d5e4964bb046a15870f19ae778b08aa --- /dev/null +++ b/annotations_filtered/0jzYpSrpVqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.99], [8.0, 11.15], [11.0, 12.88], [15.0, 18.69], [21.0, 23.92], [24.0, 27.01], [27.0, 28.83], [30.0, 31.46], [33.0, 36.07], [37.0, 37.44], [39.0, 44.12], [47.0, 62.19], [63.0, 63.66], [65.0, 65.8], [67.0, 75.0], [82.0, 82.36], [84.0, 95.62], [96.0, 95.82], [96.0, 96.89], [106.0, 108.03], [115.0, 117.19], [119.0, 120.78], [122.0, 122.62], [123.0, 124.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 64.52, 0.0, 70.72, 65.55, 66.39, 0.0, 0.0, 63.53, 0.0, 47.74, 39.05, 0.0, 0.0, 34.74, 0.0, 34.65, 0.0, 0.0, 42.26, 34.32, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 55.87], ["effects unit", 10.23], ["musical instrument", 5.13]], [["music", 57.97], ["guitar", 5.3], ["musical instrument", 4.81]], null, null, [["music", 50.22], ["speech", 9.43], ["throbbing", 3.15]], null, [["music", 52.86], ["speech", 17.01], ["boing", 6.87]], null, null, [["music", 21.16], ["throbbing", 9.2], ["frog", 8.58]], [["moo", 25.02], ["cattle, bovinae", 19.32], ["music", 11.62]], null, null, null], "duration": [-0.01, 3.15, 1.88, 3.69, 2.92, 3.01, 1.83, 1.46, 3.07, 0.44, 5.12, 15.19, 0.66, 0.8, 8.0, 0.36, 11.62, -0.18, 0.89, 2.03, 2.19, 1.78, 0.62, 1.78]} \ No newline at end of file diff --git a/annotations_filtered/0k8XW2V2dCg_filtered.json b/annotations_filtered/0k8XW2V2dCg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0054340bd54193da7e7da7191b2389fefda528a5 --- /dev/null +++ b/annotations_filtered/0k8XW2V2dCg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.49], [5.0, 10.52], [14.0, 14.52], [19.0, 21.47], [23.0, 22.84], [24.0, 23.97], [26.0, 26.96], [28.0, 29.98], [32.0, 36.24], [38.0, 39.46], [41.0, 42.13], [43.0, 44.63], [48.0, 49.17], [50.0, 52.3], [53.0, 58.11], [60.0, 60.88], [65.0, 65.75], [69.0, 70.09], [74.0, 74.19], [75.0, 77.13], [82.0, 81.97], [83.0, 84.64], [87.0, 88.5], [95.0, 95.49], [97.0, 101.14], [102.0, 103.74], [115.0, 115.52]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.23, 0.0, 44.04, 0.0, 0.0, 0.0, 0.0, 56.93, 0.0, 0.0, 0.0, 0.0, 60.14, 72.16, 0.0, 0.0, 0.0, 0.0, 81.53, 0.0, 0.0, 0.0, 0.0, 99.65, 0.0, 0.0], "audiomae_on_audioset": [null, [["fly, housefly", 27.13], ["insect", 16.21], ["buzz", 13.33]], null, [["frog", 12.48], ["sidetone", 11.01], ["hum", 7.74]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.49, 5.52, 0.52, 2.47, -0.16, -0.03, 0.96, 1.98, 4.24, 1.46, 1.13, 1.63, 1.17, 2.3, 5.11, 0.88, 0.75, 1.09, 0.19, 2.13, -0.03, 1.64, 1.5, 0.49, 4.14, 1.74, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/0k_yjEiPLoc_filtered.json b/annotations_filtered/0k_yjEiPLoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d655308b574172dcf24d92d8a5f3244bd434dc61 --- /dev/null +++ b/annotations_filtered/0k_yjEiPLoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.46], [17.0, 23.16], [24.0, 24.83], [25.0, 26.28], [27.0, 32.04], [32.0, 33.94], [34.0, 35.67], [36.0, 38.57], [42.0, 43.46], [44.0, 45.37], [46.0, 48.22], [53.0, 54.41], [55.0, 55.76], [56.0, 56.47], [64.0, 64.88], [66.0, 65.87], [68.0, 68.08], [72.0, 73.18], [76.0, 96.94], [97.0, 113.29], [114.0, 131.55]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [0.0, 41.07, 0.0, 0.0, 39.3, 0.0, 0.0, 44.32, 0.0, 0.0, 62.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.76, 32.97, 32.1], "audiomae_on_audioset": [null, [["domestic animals, pets", 18.21], ["dog", 17.27], ["animal", 13.9]], null, null, [["speech", 72.58], ["inside, small room", 2.6], ["heart sounds, heartbeat", 2.26]], null, null, [["hum", 51.22], ["mains hum", 36.66], ["speech", 5.17]], null, null, null, null, null, null, null, null, null, null, [["speech", 13.07], ["burst, pop", 10.52], ["music", 10.27]], [["sidetone", 28.42], ["busy signal", 23.37], ["music", 5.35]], [["fly, housefly", 20.84], ["insect", 14.55], ["mosquito", 12.42]]], "duration": [1.46, 6.16, 0.83, 1.28, 5.04, 1.94, 1.67, 2.57, 1.46, 1.37, 2.22, 1.41, 0.76, 0.47, 0.88, -0.13, 0.08, 1.18, 20.94, 16.29, 17.55]} \ No newline at end of file diff --git a/annotations_filtered/0kgLLa9gnsU_filtered.json b/annotations_filtered/0kgLLa9gnsU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7df0219bb81331d9cddd147194500d3bf234ed3f --- /dev/null +++ b/annotations_filtered/0kgLLa9gnsU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 23.16], [24.0, 25.57], [27.0, 27.21], [30.0, 30.43], [32.0, 32.61], [37.0, 37.89], [40.0, 40.1], [56.0, 57.1], [66.0, 68.27], [69.0, 70.38], [81.0, 81.55], [83.0, 84.42], [85.0, 85.4], [90.0, 90.24], [92.0, 92.62], [94.0, 94.78], [104.0, 104.67], [114.0, 121.12], [125.0, 124.68], [131.0, 131.38], [135.0, 135.09], [138.0, 138.69]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [41.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.54, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 52.39], ["speech", 9.34], ["throbbing", 6.14]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 20.48], ["explosion", 15.27], ["livestock, farm animals, working animals", 7.4]], null, null, null, null], "duration": [11.16, 1.57, 0.21, 0.43, 0.61, 0.89, 0.1, 1.1, 2.27, 1.38, 0.55, 1.42, 0.4, 0.24, 0.62, 0.78, 0.67, 7.12, -0.32, 0.38, 0.09, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/0klA5lTNwyY_filtered.json b/annotations_filtered/0klA5lTNwyY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9ed0e7ea6f51e880d5fa9dd8098361cce5e978a --- /dev/null +++ b/annotations_filtered/0klA5lTNwyY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.96], [16.0, 20.6], [22.0, 28.39], [29.0, 33.69], [35.0, 52.15], [55.0, 60.05], [61.0, 67.51], [68.0, 68.81], [71.0, 106.96], [107.0, 109.49], [111.0, 116.82], [118.0, 121.56], [123.0, 130.5], [131.0, 132.34], [133.0, 138.82], [140.0, 144.95], [146.0, 151.07], [152.0, 153.54], [154.0, 154.58], [156.0, 157.22], [159.0, 162.28], [165.0, 165.62], [167.0, 167.76], [169.0, 170.94], [173.0, 174.8], [176.0, 177.67], [179.0, 180.1], [181.0, 183.74], [185.0, 196.79], [198.0, 202.66]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [93.29, 94.07, 86.09, 91.81, 82.07, 29.97, 30.53, 0.0, 0.0, 99.99, 100.0, 100.0, 99.65, 0.0, 99.44, 99.56, 96.66, 0.0, 0.0, 0.0, 87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.6, 89.54, 100.0], "audiomae_on_audioset": [null, null, null, null, null, [["noise", 18.06], ["fart", 15.51], ["whack, thwack", 7.57]], [["speech", 46.4], ["music", 15.67], ["hum", 11.0]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.96, 4.6, 6.39, 4.69, 17.15, 5.05, 6.51, 0.81, 35.96, 2.49, 5.82, 3.56, 7.5, 1.34, 5.82, 4.95, 5.07, 1.54, 0.58, 1.22, 3.28, 0.62, 0.76, 1.94, 1.8, 1.67, 1.1, 2.74, 11.79, 4.66]} \ No newline at end of file diff --git a/annotations_filtered/0kqn9qQZdOs_filtered.json b/annotations_filtered/0kqn9qQZdOs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..064041eb50c40603b6cb5c48458d4cd6bc8a9df6 --- /dev/null +++ b/annotations_filtered/0kqn9qQZdOs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.39], [7.0, 8.11], [9.0, 15.97], [20.0, 20.56]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 49.22, 0.0], "audiomae_on_audioset": [null, null, [["music", 43.03], ["theremin", 36.43], ["musical instrument", 3.86]], null], "duration": [1.39, 1.11, 6.97, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/0l5h8k9N9pI_filtered.json b/annotations_filtered/0l5h8k9N9pI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9e05d1749496930a22082742522b0746efc1b68 --- /dev/null +++ b/annotations_filtered/0l5h8k9N9pI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.64], [4.0, 4.01], [5.0, 5.61], [8.0, 8.14], [9.0, 9.12], [10.0, 11.43], [14.0, 14.25], [15.0, 15.53], [18.0, 17.96], [19.0, 19.11], [21.0, 22.1], [31.0, 32.16], [33.0, 33.81], [37.0, 37.64], [39.0, 40.69], [43.0, 44.15], [45.0, 45.52], [55.0, 55.38], [58.0, 60.44], [62.0, 62.41], [64.0, 64.96], [66.0, 66.21], [68.0, 68.99], [73.0, 73.95], [76.0, 76.52], [78.0, 82.36], [84.0, 84.06], [86.0, 86.22], [93.0, 93.78], [94.0, 95.47], [97.0, 97.31], [99.0, 100.01], [101.0, 102.3], [104.0, 104.8], [106.0, 106.17], [108.0, 108.82], [111.0, 111.05], [113.0, 114.13], [117.0, 117.66], [121.0, 121.64], [123.0, 123.36], [125.0, 125.47], [131.0, 131.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.64, 0.01, 0.61, 0.14, 0.12, 1.43, 0.25, 0.53, -0.04, 0.11, 1.1, 1.16, 0.81, 0.64, 1.69, 1.15, 0.52, 0.38, 2.44, 0.41, 0.96, 0.21, 0.99, 0.95, 0.52, 4.36, 0.06, 0.22, 0.78, 1.47, 0.31, 1.01, 1.3, 0.8, 0.17, 0.82, 0.05, 1.13, 0.66, 0.64, 0.36, 0.47, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/0l8mYfrxpTw_filtered.json b/annotations_filtered/0l8mYfrxpTw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..643a0c71f4b323b2b971852c44a3a5c86faae5cf --- /dev/null +++ b/annotations_filtered/0l8mYfrxpTw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[59.0, 60.05], [68.0, 68.32], [90.0, 90.32], [103.0, 103.38], [104.0, 104.18], [134.0, 133.84], [137.0, 139.23], [157.0, 161.52], [163.0, 163.73], [164.0, 165.1], [166.0, 167.41], [170.0, 171.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.05, 30.59, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 79.09], ["speech synthesizer", 2.08], ["radio", 2.03]], [["speech", 66.16], ["sidetone", 7.99], ["boing", 4.47]], null, null, null, null], "duration": [1.05, 0.32, 0.32, 0.38, 0.18, -0.16, 2.23, 4.52, 0.73, 1.1, 1.41, 1.34]} \ No newline at end of file diff --git a/annotations_filtered/0lCPmaq960E_filtered.json b/annotations_filtered/0lCPmaq960E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb78302852f9e657242253f195fde0929850f119 --- /dev/null +++ b/annotations_filtered/0lCPmaq960E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.77], [43.0, 43.46], [52.0, 52.05], [66.0, 67.31], [68.0, 69.3], [73.0, 79.96], [86.0, 86.8], [90.0, 91.12], [96.0, 96.79], [107.0, 106.93], [109.0, 114.69], [116.0, 116.02], [117.0, 118.94], [120.0, 121.41], [124.0, 124.07], [128.0, 128.56], [131.0, 131.79], [135.0, 135.51], [139.0, 139.5], [143.0, 143.65], [146.0, 146.33], [153.0, 153.98], [155.0, 155.41], [158.0, 158.4], [164.0, 164.15], [177.0, 177.69]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 33.69, 0.0, 0.0, 0.0, 0.0, 33.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 34.78], ["rowboat, canoe, kayak", 16.1], ["boat, water vehicle", 9.89]], null, null, null, null, [["whale vocalization", 33.04], ["gurgling", 21.47], ["rowboat, canoe, kayak", 10.47]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.77, 0.46, 0.05, 1.31, 1.3, 6.96, 0.8, 1.12, 0.79, -0.07, 5.69, 0.02, 1.94, 1.41, 0.07, 0.56, 0.79, 0.51, 0.5, 0.65, 0.33, 0.98, 0.41, 0.4, 0.15, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/0lCR_c5Su1M_filtered.json b/annotations_filtered/0lCR_c5Su1M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5477ae1a0d2fecabbce0d6c40461c4854e803c8 --- /dev/null +++ b/annotations_filtered/0lCR_c5Su1M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.86], [13.0, 33.56], [38.0, 42.11], [44.0, 53.45], [56.0, 82.09], [86.0, 121.1], [135.0, 148.04], [150.0, 150.26]], "keep_status": [false, false, true, true, false, false, false, false], "silence_prob": [30.85, 30.83, 31.59, 31.73, 30.36, 0.0, 31.08, 0.0], "audiomae_on_audioset": [[["didgeridoo", 45.36], ["music", 24.43], ["speech", 7.76]], [["didgeridoo", 45.96], ["music", 41.97], ["musical instrument", 2.4]], [["music", 42.22], ["effects unit", 9.8], ["hum", 7.5]], [["music", 33.66], ["throbbing", 15.46], ["hum", 14.49]], [["music", 74.79], ["musical instrument", 3.94], ["hum", 3.89]], null, [["music", 65.01], ["hum", 7.98], ["throbbing", 5.1]], null], "duration": [6.86, 20.56, 4.11, 9.45, 26.09, 35.1, 13.04, 0.26]} \ No newline at end of file diff --git a/annotations_filtered/0lNb6NAV6jg_filtered.json b/annotations_filtered/0lNb6NAV6jg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a45262fbb0d428dcfda5574bdc21069459fc9e4c --- /dev/null +++ b/annotations_filtered/0lNb6NAV6jg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.01], [4.0, 8.07], [10.0, 11.11], [12.0, 12.95], [14.0, 14.79], [17.0, 17.93], [19.0, 19.79], [21.0, 23.11], [24.0, 25.07], [26.0, 26.2], [26.0, 26.35], [30.0, 31.33], [33.0, 33.89], [41.0, 41.27], [42.0, 48.17], [50.0, 54.8], [67.0, 70.65], [71.0, 71.64], [73.0, 75.9], [77.0, 77.79], [81.0, 81.75], [86.0, 86.34], [87.0, 94.42], [95.0, 96.55], [98.0, 99.69]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.14, 0.0, 0.0, 0.0, 0.0, 0.0, 43.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.14, 56.63, 51.66, 0.0, 30.53, 0.0, 0.0, 0.0, 52.86, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 44.96], ["telephone", 19.23], ["music", 5.78]], null, null, null, null, null, [["chirp tone", 13.98], ["sidetone", 13.34], ["sine wave", 8.64]], null, null, null, null, null, null, null, null, null, null, [["speech", 58.26], ["fart", 31.09], ["synthesizer", 1.28]], null, null, null, null, null, null], "duration": [0.01, 4.07, 1.11, 0.95, 0.79, 0.93, 0.79, 2.11, 1.07, 0.2, 0.35, 1.33, 0.89, 0.27, 6.17, 4.8, 3.65, 0.64, 2.9, 0.79, 0.75, 0.34, 7.42, 1.55, 1.69]} \ No newline at end of file diff --git a/annotations_filtered/0lq1JIWQSlc_filtered.json b/annotations_filtered/0lq1JIWQSlc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae240240043933427402144373ca3c3aade86b87 --- /dev/null +++ b/annotations_filtered/0lq1JIWQSlc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.85], [8.0, 16.56], [18.0, 19.23], [22.0, 30.99], [33.0, 33.49], [45.0, 46.18], [49.0, 49.94], [53.0, 54.31], [59.0, 64.99], [66.0, 69.04], [71.0, 73.7], [77.0, 77.45], [78.0, 86.73], [88.0, 90.14], [97.0, 97.51], [103.0, 104.21], [107.0, 107.03], [107.0, 111.77], [113.0, 118.03], [120.0, 122.57], [127.0, 140.43], [144.0, 144.91], [146.0, 146.2], [148.0, 159.51], [161.0, 162.19], [165.0, 167.44]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 33.03, 0.0, 31.25, 0.0, 0.0, 0.0, 0.0, 58.81, 62.37, 40.95, 0.0, 64.86, 50.71, 0.0, 0.0, 0.0, 71.72, 90.43, 94.66, 31.65, 0.0, 0.0, 31.17, 0.0, 91.98], "audiomae_on_audioset": [null, [["music", 51.28], ["boing", 10.68], ["speech", 7.15]], null, [["music", 49.83], ["boing", 36.96], ["whack, thwack", 3.17]], null, null, null, null, null, null, [["music", 31.37], ["hum", 8.19], ["mains hum", 7.2]], null, null, null, null, null, null, null, null, null, [["speech", 19.16], ["cattle, bovinae", 17.42], ["livestock, farm animals, working animals", 15.99]], null, null, [["livestock, farm animals, working animals", 37.37], ["cattle, bovinae", 30.01], ["moo", 19.35]], null, null], "duration": [-0.15, 8.56, 1.23, 8.99, 0.49, 1.18, 0.94, 1.31, 5.99, 3.04, 2.7, 0.45, 8.73, 2.14, 0.51, 1.21, 0.03, 4.77, 5.03, 2.57, 13.43, 0.91, 0.2, 11.51, 1.19, 2.44]} \ No newline at end of file diff --git a/annotations_filtered/0m5VGBc8VrQ_filtered.json b/annotations_filtered/0m5VGBc8VrQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2b85e3b55656c2ee6ff7229084cc9f2e5c309bb --- /dev/null +++ b/annotations_filtered/0m5VGBc8VrQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 37.81], [38.0, 38.65], [40.0, 40.49], [41.0, 42.47], [45.0, 48.51], [53.0, 53.82], [55.0, 56.17], [58.0, 59.02], [62.0, 63.48], [67.0, 67.44], [70.0, 70.82], [74.0, 74.21], [75.0, 76.62], [78.0, 78.17], [80.0, 80.76], [81.0, 83.22], [84.0, 85.11], [88.0, 89.34], [93.0, 94.58], [95.0, 96.11], [99.0, 99.44], [106.0, 106.47], [107.0, 109.39], [111.0, 111.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 72.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 0.65, 0.49, 1.47, 3.51, 0.82, 1.17, 1.02, 1.48, 0.44, 0.82, 0.21, 1.62, 0.17, 0.76, 2.22, 1.11, 1.34, 1.58, 1.11, 0.44, 0.47, 2.39, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/0mGmEE20CR0_filtered.json b/annotations_filtered/0mGmEE20CR0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23782d871a746abb1283ea5768a70c1c736c7756 --- /dev/null +++ b/annotations_filtered/0mGmEE20CR0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.74], [6.0, 6.72], [12.0, 11.91], [21.0, 23.33], [27.0, 37.4], [47.0, 75.41], [83.0, 84.69], [87.0, 88.32], [89.0, 95.57], [98.0, 98.74], [105.0, 105.93], [108.0, 109.34], [112.0, 114.3], [118.0, 125.46], [127.0, 128.22], [133.0, 136.46], [140.0, 140.24], [159.0, 158.87], [162.0, 162.18], [166.0, 166.7]], "keep_status": [false, false, false, true, false, true, false, false, true, false, false, false, true, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.95, 37.44, 30.85, 0.0, 0.0, 44.6, 0.0, 0.0, 0.0, 39.3, 38.36, 0.0, 32.46, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 53.68], ["music", 7.72], ["vehicle", 3.84]], [["music", 65.76], ["musical instrument", 4.15], ["synthesizer", 4.14]], [["fly, housefly", 14.73], ["insect", 10.65], ["hum", 9.45]], null, null, [["animal", 17.98], ["music", 11.22], ["domestic animals, pets", 6.3]], null, null, null, [["didgeridoo", 35.65], ["music", 17.58], ["sound effect", 4.3]], [["music", 34.7], ["whale vocalization", 20.56], ["synthesizer", 6.07]], null, [["didgeridoo", 31.38], ["music", 19.72], ["speech", 14.31]], null, null, null, null], "duration": [-0.26, 0.72, -0.09, 2.33, 10.4, 28.41, 1.69, 1.32, 6.57, 0.74, 0.93, 1.34, 2.3, 7.46, 1.22, 3.46, 0.24, -0.13, 0.18, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/0mPTGVoG248_filtered.json b/annotations_filtered/0mPTGVoG248_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2437c6555036c53fd9e3a5a4dd8ac65ca9873be --- /dev/null +++ b/annotations_filtered/0mPTGVoG248_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[58.0, 104.13], [106.0, 122.79], [124.0, 130.05], [130.0, 130.1], [131.0, 151.5]], "keep_status": [false, true, true, false, true], "silence_prob": [0.0, 29.22, 28.78, 0.0, 29.34], "audiomae_on_audioset": [null, [["whack, thwack", 30.18], ["sound effect", 13.52], ["music", 8.38]], [["music", 41.98], ["breaking", 15.96], ["reverberation", 6.81]], null, [["breaking", 21.5], ["smash, crash", 19.92], ["music", 7.89]]], "duration": [46.13, 16.79, 6.05, 0.1, 20.5]} \ No newline at end of file diff --git a/annotations_filtered/0mRRULBvuj0_filtered.json b/annotations_filtered/0mRRULBvuj0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89ba791e4f88ac564c0ad22aa41d7fe7384dc6bd --- /dev/null +++ b/annotations_filtered/0mRRULBvuj0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.2], [23.0, 24.49], [26.0, 27.03], [31.0, 32.36], [35.0, 35.88], [39.0, 39.72], [44.0, 44.19], [50.0, 50.58], [53.0, 54.11], [56.0, 56.2], [57.0, 60.44], [61.0, 63.04], [76.0, 77.36], [80.0, 80.69], [96.0, 97.46], [99.0, 100.45], [106.0, 106.19], [109.0, 173.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.82, 39.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 62.92], ["throbbing", 4.74], ["drum machine", 2.73]], [["music", 38.7], ["throbbing", 15.96], ["hum", 14.75]], null, null, null, null, null, null], "duration": [1.2, 1.49, 1.03, 1.36, 0.88, 0.72, 0.19, 0.58, 1.11, 0.2, 3.44, 2.04, 1.36, 0.69, 1.46, 1.45, 0.19, 64.89]} \ No newline at end of file diff --git a/annotations_filtered/0mjSZpCpsdc_filtered.json b/annotations_filtered/0mjSZpCpsdc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb4011abb76777d8eebb2ee00deeb77ffea32346 --- /dev/null +++ b/annotations_filtered/0mjSZpCpsdc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.72], [10.0, 10.4], [14.0, 27.21], [33.0, 33.4], [35.0, 92.15], [93.0, 95.32], [96.0, 98.41], [99.0, 101.93], [102.0, 111.21], [115.0, 117.69], [119.0, 119.35], [121.0, 123.79], [124.0, 124.39], [126.0, 127.89], [132.0, 132.26], [135.0, 135.35], [137.0, 136.95], [138.0, 139.14], [142.0, 142.87], [143.0, 143.99], [144.0, 146.11], [148.0, 149.12], [152.0, 152.04], [156.0, 157.1], [158.0, 158.87], [160.0, 161.82], [163.0, 165.79]], "keep_status": [false, false, true, false, false, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [76.2, 0.0, 30.94, 0.0, 0.0, 46.05, 38.51, 39.96, 38.59, 46.57, 0.0, 64.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.85, 0.0, 0.0, 0.0, 0.0, 0.0, 75.55], "audiomae_on_audioset": [null, null, [["breaking", 27.64], ["music", 18.11], ["hum", 8.07]], null, null, [["music", 23.87], ["speech", 21.72], ["singing bowl", 20.71]], [["tuning fork", 42.59], ["sine wave", 32.82], ["chirp tone", 10.38]], [["speech", 31.74], ["music", 18.98], ["singing bowl", 16.37]], [["hum", 33.08], ["speech", 32.18], ["mains hum", 12.81]], [["hum", 31.94], ["speech", 20.27], ["throbbing", 14.94]], null, null, null, null, null, null, null, null, null, null, [["speech", 61.96], ["animal", 3.28], ["dog", 2.59]], null, null, null, null, null, null], "duration": [5.72, 0.4, 13.21, 0.4, 57.15, 2.32, 2.41, 2.93, 9.21, 2.69, 0.35, 2.79, 0.39, 1.89, 0.26, 0.35, -0.05, 1.14, 0.87, 0.99, 2.11, 1.12, 0.04, 1.1, 0.87, 1.82, 2.79]} \ No newline at end of file diff --git a/annotations_filtered/0mmSi-63Y9U_filtered.json b/annotations_filtered/0mmSi-63Y9U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..221928fd0780e3b7b2643f21a8e26da3a63133d0 --- /dev/null +++ b/annotations_filtered/0mmSi-63Y9U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.0], [4.0, 4.19], [8.0, 8.46], [14.0, 15.23], [22.0, 23.16], [25.0, 27.14], [32.0, 34.74], [35.0, 36.95], [43.0, 42.84], [46.0, 46.31], [48.0, 47.87], [48.0, 49.49], [53.0, 54.18], [56.0, 55.68], [56.0, 56.51], [59.0, 59.85], [63.0, 63.58], [65.0, 65.42], [77.0, 77.99], [78.0, 79.73], [88.0, 88.23], [89.0, 89.99], [98.0, 98.05], [100.0, 99.96], [102.0, 102.64], [104.0, 104.46], [116.0, 116.28], [125.0, 125.27], [126.0, 126.44], [128.0, 127.79], [130.0, 129.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 62.07, 52.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.0, 0.19, 0.46, 1.23, 1.16, 2.14, 2.74, 1.95, -0.16, 0.31, -0.13, 1.49, 1.18, -0.32, 0.51, 0.85, 0.58, 0.42, 0.99, 1.73, 0.23, 0.99, 0.05, -0.04, 0.64, 0.46, 0.28, 0.27, 0.44, -0.21, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/0mwMM8VrYmw_filtered.json b/annotations_filtered/0mwMM8VrYmw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5d8de5bd7acbd5996641a3c1e2933a1c9bc7891 --- /dev/null +++ b/annotations_filtered/0mwMM8VrYmw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.66], [11.0, 18.13], [19.0, 22.06], [23.0, 24.97], [28.0, 28.83], [30.0, 30.28], [34.0, 34.72], [41.0, 42.23], [45.0, 47.56], [50.0, 50.92], [53.0, 53.37], [58.0, 58.85], [59.0, 59.22], [61.0, 61.16], [65.0, 64.96], [67.0, 67.61], [73.0, 74.22], [76.0, 77.3], [80.0, 84.45], [85.0, 86.98], [90.0, 92.04], [95.0, 96.58], [99.0, 99.81], [107.0, 108.18], [109.0, 109.65], [110.0, 110.76], [112.0, 114.13], [115.0, 118.08], [120.0, 120.77], [123.0, 125.42], [126.0, 127.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.05, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.37, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.73, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.66, 7.13, 3.06, 1.97, 0.83, 0.28, 0.72, 1.23, 2.56, 0.92, 0.37, 0.85, 0.22, 0.16, -0.04, 0.61, 1.22, 1.3, 4.45, 1.98, 2.04, 1.58, 0.81, 1.18, 0.65, 0.76, 2.13, 3.08, 0.77, 2.42, 1.77]} \ No newline at end of file diff --git a/annotations_filtered/0mwkZUkwEHw_filtered.json b/annotations_filtered/0mwkZUkwEHw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..160e2d8bbed1e5a5949d5da95fa03c47918da208 --- /dev/null +++ b/annotations_filtered/0mwkZUkwEHw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.42], [4.0, 5.07], [14.0, 14.74], [16.0, 16.65], [19.0, 19.18], [21.0, 21.41], [24.0, 24.93], [26.0, 28.04], [36.0, 38.23], [40.0, 45.45], [48.0, 56.69], [66.0, 66.34], [68.0, 73.08], [75.0, 76.5], [77.0, 78.46], [80.0, 88.65], [93.0, 97.77], [102.0, 105.7], [113.0, 117.59], [118.0, 120.75], [123.0, 131.19]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.93, 42.26, 40.54, 40.66, 0.0, 34.36, 0.0, 0.0, 31.63, 30.87, 33.76, 61.67, 49.68, 60.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 35.97], ["speech", 31.57], ["sidetone", 7.56]], [["speech", 23.15], ["music", 23.14], ["didgeridoo", 8.13]], [["music", 38.6], ["hum", 22.36], ["throbbing", 11.82]], [["music", 33.68], ["hum", 27.46], ["throbbing", 13.75]], null, [["music", 31.89], ["hum", 14.78], ["throbbing", 11.33]], null, null, [["music", 52.83], ["hum", 16.86], ["mains hum", 8.86]], [["music", 45.63], ["speech", 24.62], ["whale vocalization", 13.51]], [["speech", 11.13], ["music", 8.12], ["animal", 6.15]], null, [["sidetone", 39.05], ["speech", 22.84], ["music", 16.7]], null], "duration": [1.42, 1.07, 0.74, 0.65, 0.18, 0.41, 0.93, 2.04, 2.23, 5.45, 8.69, 0.34, 5.08, 1.5, 1.46, 8.65, 4.77, 3.7, 4.59, 2.75, 8.19]} \ No newline at end of file diff --git a/annotations_filtered/0nfoP3bmd1c_filtered.json b/annotations_filtered/0nfoP3bmd1c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f8a87956ff2b9da786c09efe14b0e701bbe5e30 --- /dev/null +++ b/annotations_filtered/0nfoP3bmd1c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.43], [2.0, 2.98], [6.0, 6.24], [8.0, 8.07], [8.0, 8.72], [9.0, 11.28], [13.0, 13.91], [16.0, 16.41], [20.0, 20.75], [25.0, 26.28], [28.0, 27.99], [29.0, 29.78], [30.0, 31.68], [32.0, 32.58], [34.0, 34.38], [40.0, 40.24], [42.0, 42.4], [57.0, 57.0], [59.0, 59.05], [59.0, 59.44], [64.0, 64.88], [66.0, 67.46], [68.0, 69.16], [71.0, 71.74], [74.0, 74.61], [76.0, 76.81], [80.0, 80.86], [81.0, 82.17], [83.0, 83.78], [87.0, 88.3], [91.0, 91.05], [95.0, 94.93], [95.0, 95.0], [95.0, 95.13], [95.0, 95.74], [100.0, 100.53], [113.0, 113.26], [117.0, 118.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.43, 0.98, 0.24, 0.07, 0.72, 2.28, 0.91, 0.41, 0.75, 1.28, -0.01, 0.78, 1.68, 0.58, 0.38, 0.24, 0.4, 0.0, 0.05, 0.44, 0.88, 1.46, 1.16, 0.74, 0.61, 0.81, 0.86, 1.17, 0.78, 1.3, 0.05, -0.07, 0.0, 0.13, 0.74, 0.53, 0.26, 1.52]} \ No newline at end of file diff --git a/annotations_filtered/0niEZsahtEo_filtered.json b/annotations_filtered/0niEZsahtEo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b648b901dd7295800b9dd299380ce6aea7ba7bf --- /dev/null +++ b/annotations_filtered/0niEZsahtEo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 22.94], [28.0, 28.26], [32.0, 38.03], [38.0, 53.32], [55.0, 58.43], [59.0, 102.96], [104.0, 106.47], [107.0, 106.79], [107.0, 106.83]], "keep_status": [true, false, true, false, false, false, false, false, false], "silence_prob": [47.35, 0.0, 46.5, 51.07, 66.03, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [[["eruption", 29.11], ["speech", 17.19], ["explosion", 7.86]], null, [["speech", 30.0], ["crow", 8.32], ["caw", 5.8]], null, null, null, null, null, null], "duration": [18.94, 0.26, 6.03, 15.32, 3.43, 43.96, 2.47, -0.21, -0.17]} \ No newline at end of file diff --git a/annotations_filtered/0noY-XrAJRg_filtered.json b/annotations_filtered/0noY-XrAJRg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2a84c6f4f7ff1d3bd1f5665f9a50385c0b12c18 --- /dev/null +++ b/annotations_filtered/0noY-XrAJRg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.74], [4.0, 5.7], [6.0, 7.72], [10.0, 11.92], [14.0, 22.18], [24.0, 24.54], [25.0, 25.56], [29.0, 30.38], [31.0, 32.66], [33.0, 36.24], [37.0, 38.3], [39.0, 39.04], [39.0, 39.95], [40.0, 40.34], [40.0, 40.8], [41.0, 41.2], [47.0, 47.17], [49.0, 48.66], [49.0, 49.28], [49.0, 49.96], [51.0, 51.34], [53.0, 53.5], [55.0, 55.8], [57.0, 56.84], [59.0, 59.44], [60.0, 61.53], [62.0, 62.92], [64.0, 67.19], [68.0, 69.13], [71.0, 70.97], [72.0, 72.45], [74.0, 91.03], [92.0, 92.23], [97.0, 97.7], [98.0, 150.13], [152.0, 154.01], [155.0, 157.96], [160.0, 160.88], [162.0, 165.03], [167.0, 176.17]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 42.0, 0.0, 0.0, 0.0, 0.0, 71.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.2, 0.0, 0.0, 0.0, 33.26, 0.0, 0.0, 0.0, 46.29, 32.63, 0.0, 31.46, 32.15], "audiomae_on_audioset": [null, null, null, null, [["music", 35.74], ["hum", 10.53], ["mains hum", 7.47]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.14], ["speech", 28.29], ["hum", 4.79]], null, null, null, [["music", 68.15], ["scary music", 7.54], ["ambient music", 2.74]], [["music", 15.45], ["theremin", 9.62], ["didgeridoo", 8.93]], null, [["music", 27.84], ["hum", 17.24], ["throbbing", 13.45]], [["music", 31.36], ["speech", 16.8], ["thunk", 8.34]]], "duration": [1.74, 1.7, 1.72, 1.92, 8.18, 0.54, 0.56, 1.38, 1.66, 3.24, 1.3, 0.04, 0.95, 0.34, 0.8, 0.2, 0.17, -0.34, 0.28, 0.96, 0.34, 0.5, 0.8, -0.16, 0.44, 1.53, 0.92, 3.19, 1.13, -0.03, 0.45, 17.03, 0.23, 0.7, 52.13, 2.01, 2.96, 0.88, 3.03, 9.17]} \ No newline at end of file diff --git a/annotations_filtered/0npouzhhZTo_filtered.json b/annotations_filtered/0npouzhhZTo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c68306441eb7400f346a3c30b993250478bcb0d --- /dev/null +++ b/annotations_filtered/0npouzhhZTo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.04], [27.0, 31.9], [38.0, 42.57], [45.0, 44.93], [46.0, 56.4], [61.0, 79.15], [82.0, 86.91], [88.0, 87.76], [91.0, 91.62], [92.0, 99.03], [100.0, 100.58], [109.0, 109.63], [111.0, 112.13], [112.0, 116.07], [119.0, 119.38], [121.0, 121.9], [128.0, 135.77], [140.0, 142.69]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.86, 33.2, 0.0, 33.23, 32.61, 32.58, 0.0, 0.0, 34.27, 0.0, 0.0, 0.0, 33.06, 0.0, 0.0, 32.67, 32.8], "audiomae_on_audioset": [null, [["music", 76.02], ["funk", 2.99], ["soul music", 1.99]], [["music", 57.44], ["music of bollywood", 3.36], ["electronic music", 3.05]], null, [["music", 87.45], ["soul music", 1.28], ["singing", 0.88]], [["music", 84.39], ["christmas music", 1.04], ["soul music", 0.98]], [["music", 63.45], ["music of bollywood", 4.28], ["electronic music", 3.39]], null, null, [["music", 81.64], ["electronic music", 2.12], ["funk", 1.33]], null, null, null, [["music", 76.84], ["soul music", 3.64], ["singing", 1.95]], null, null, [["music", 81.41], ["music of bollywood", 1.69], ["electronic music", 1.25]], [["music", 68.0], ["electronic music", 3.06], ["synthetic singing", 1.31]]], "duration": [0.04, 4.9, 4.57, -0.07, 10.4, 18.15, 4.91, -0.24, 0.62, 7.03, 0.58, 0.63, 1.13, 4.07, 0.38, 0.9, 7.77, 2.69]} \ No newline at end of file diff --git a/annotations_filtered/0o9Fm3hnpYQ_filtered.json b/annotations_filtered/0o9Fm3hnpYQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04877033f4a8cb3ac51f50d872f8502e0bb4571b --- /dev/null +++ b/annotations_filtered/0o9Fm3hnpYQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.64], [10.0, 10.45], [12.0, 15.18], [22.0, 22.76], [27.0, 32.05], [39.0, 39.99], [41.0, 41.76], [43.0, 46.8], [48.0, 52.02], [65.0, 65.91], [66.0, 67.54], [82.0, 82.16], [84.0, 85.29], [96.0, 96.65], [97.0, 100.18], [101.0, 107.32], [110.0, 113.73], [123.0, 139.72], [142.0, 147.87], [149.0, 150.13], [150.0, 151.71], [152.0, 153.37], [164.0, 164.76], [168.0, 167.81], [173.0, 173.23]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, true, true, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 37.07, 0.0, 41.38, 0.0, 0.0, 46.22, 41.89, 0.0, 0.0, 0.0, 0.0, 0.0, 40.07, 38.71, 36.37, 42.51, 60.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 81.19], ["theremin", 6.56], ["musical instrument", 2.5]], null, [["music", 75.52], ["musical instrument", 3.12], ["synthesizer", 1.52]], null, null, [["music", 51.93], ["boing", 7.11], ["hum", 3.69]], [["music", 28.61], ["wail, moan", 6.22], ["fly, housefly", 5.13]], null, null, null, null, null, [["music", 40.69], ["speech", 25.13], ["musical instrument", 2.98]], [["music", 28.93], ["mains hum", 19.27], ["hum", 13.23]], [["music", 57.12], ["livestock, farm animals, working animals", 3.76], ["animal", 3.62]], [["music", 49.57], ["speech", 11.42], ["musical instrument", 7.51]], null, null, null, null, null, null, null], "duration": [0.64, 0.45, 3.18, 0.76, 5.05, 0.99, 0.76, 3.8, 4.02, 0.91, 1.54, 0.16, 1.29, 0.65, 3.18, 6.32, 3.73, 16.72, 5.87, 1.13, 1.71, 1.37, 0.76, -0.19, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/0oFdsgLP8n8_filtered.json b/annotations_filtered/0oFdsgLP8n8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c483485b8350df26133ba2acffe2ca809b7d56fc --- /dev/null +++ b/annotations_filtered/0oFdsgLP8n8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.62], [5.0, 6.02], [11.0, 13.69], [16.0, 16.44], [17.0, 17.58], [19.0, 20.21], [24.0, 25.22], [26.0, 26.47], [28.0, 30.11], [36.0, 36.54], [40.0, 41.76], [52.0, 52.57], [57.0, 59.58], [63.0, 65.08], [70.0, 71.04], [75.0, 75.36], [78.0, 78.26], [80.0, 82.65], [84.0, 84.01], [86.0, 88.08], [94.0, 94.49], [96.0, 96.84], [101.0, 100.9], [103.0, 103.72], [105.0, 105.0], [108.0, 109.59], [110.0, 110.4], [112.0, 113.53], [114.0, 115.05], [117.0, 118.25], [121.0, 122.18], [125.0, 125.34], [126.0, 126.44], [129.0, 129.93], [133.0, 135.84], [137.0, 137.76], [140.0, 141.35]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.2, 0.0, 0.0, 0.0, 32.1, 76.86, 0.0, 0.0, 0.0, 100.0, 0.0, 87.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["sine wave", 19.64], ["sidetone", 16.27], ["busy signal", 13.58]], null, null, null, [["speech", 56.03], ["quack", 10.18], ["music", 8.55]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 1.02, 2.69, 0.44, 0.58, 1.21, 1.22, 0.47, 2.11, 0.54, 1.76, 0.57, 2.58, 2.08, 1.04, 0.36, 0.26, 2.65, 0.01, 2.08, 0.49, 0.84, -0.1, 0.72, 0.0, 1.59, 0.4, 1.53, 1.05, 1.25, 1.18, 0.34, 0.44, 0.93, 2.84, 0.76, 1.35]} \ No newline at end of file diff --git a/annotations_filtered/0oHT-rtiFZk_filtered.json b/annotations_filtered/0oHT-rtiFZk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70ca973706372546d0180982c52498c5468f03c2 --- /dev/null +++ b/annotations_filtered/0oHT-rtiFZk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.62], [34.0, 34.35], [37.0, 38.06], [39.0, 39.53], [46.0, 51.58], [52.0, 52.24], [58.0, 65.84], [90.0, 90.0], [91.0, 93.83], [96.0, 99.22], [104.0, 104.52], [105.0, 105.46], [107.0, 108.3], [126.0, 125.86], [128.0, 129.14], [130.0, 131.19], [136.0, 136.58], [137.0, 137.12], [139.0, 139.73], [142.0, 142.11], [144.0, 146.23], [150.0, 150.72], [156.0, 157.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 84.43, 0.0, 51.44, 0.0, 92.48, 84.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.52, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.37], ["music", 24.78], ["hum", 14.63]], null, null], "duration": [0.62, 0.35, 1.06, 0.53, 5.58, 0.24, 7.84, 0.0, 2.83, 3.22, 0.52, 0.46, 1.3, -0.14, 1.14, 1.19, 0.58, 0.12, 0.73, 0.11, 2.23, 0.72, 1.38]} \ No newline at end of file diff --git a/annotations_filtered/0osA8jKKotc_filtered.json b/annotations_filtered/0osA8jKKotc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..642baf7ec41615a654ed5d7bb20c012f687b6d5c --- /dev/null +++ b/annotations_filtered/0osA8jKKotc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.68], [11.0, 12.06], [13.0, 15.4], [16.0, 18.94], [22.0, 23.7], [24.0, 27.41], [29.0, 32.66], [36.0, 52.0], [52.0, 60.57], [65.0, 66.53], [67.0, 70.77], [72.0, 71.79], [73.0, 73.65], [75.0, 75.2], [76.0, 78.51], [80.0, 80.05], [81.0, 82.27], [83.0, 114.94], [116.0, 136.85], [140.0, 140.49], [142.0, 148.29], [149.0, 149.49], [150.0, 151.09], [153.0, 157.45], [158.0, 158.5], [159.0, 162.3], [165.0, 164.78], [172.0, 173.4], [175.0, 175.02], [175.0, 176.42], [181.0, 192.33], [194.0, 194.05], [196.0, 197.28], [198.0, 198.63], [202.0, 202.32], [203.0, 204.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.05, 95.51, 0.0, 98.36, 97.54, 99.16, 99.98, 0.0, 80.46, 0.0, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 32.94, 0.0, 74.92, 0.0, 0.0, 43.93, 0.0, 39.8, 0.0, 0.0, 0.0, 0.0, 31.19, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 31.99], ["grunt", 22.55], ["cattle, bovinae", 16.11]], null, null, null, null, [["music", 40.69], ["speech", 10.2], ["synthesizer", 8.17]], null, [["music", 37.02], ["speech", 24.36], ["foghorn", 4.94]], null, null, null, null, [["music", 36.39], ["theremin", 29.74], ["synthesizer", 10.16]], null, null, null, null, null], "duration": [1.68, 1.06, 2.4, 2.94, 1.7, 3.41, 3.66, 16.0, 8.57, 1.53, 3.77, -0.21, 0.65, 0.2, 2.51, 0.05, 1.27, 31.94, 20.85, 0.49, 6.29, 0.49, 1.09, 4.45, 0.5, 3.3, -0.22, 1.4, 0.02, 1.42, 11.33, 0.05, 1.28, 0.63, 0.32, 1.97]} \ No newline at end of file diff --git a/annotations_filtered/0oxx_2M6Ctw_filtered.json b/annotations_filtered/0oxx_2M6Ctw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f1d566d3cd893a39567355140c15045b3981f61 --- /dev/null +++ b/annotations_filtered/0oxx_2M6Ctw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.66], [7.0, 7.53], [13.0, 13.74], [14.0, 14.4], [19.0, 19.14], [19.0, 19.72], [20.0, 20.44], [21.0, 21.96], [23.0, 25.05], [29.0, 30.33], [32.0, 32.68], [34.0, 34.79], [38.0, 38.26], [39.0, 64.81], [74.0, 74.75], [75.0, 76.42], [78.0, 78.88], [80.0, 80.64], [83.0, 82.75], [87.0, 88.11], [89.0, 89.61], [105.0, 105.95], [107.0, 109.41], [110.0, 112.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.1, 0.0, 0.0, 0.0, 0.0, 29.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.97, 32.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 58.04], ["sidetone", 9.99], ["radio", 9.94]], null, null, null, null, [["music", 34.25], ["didgeridoo", 8.5], ["effects unit", 6.99]], null, null, null, null, null, null, null, null, null, [["boing", 26.07], ["music", 23.61], ["speech", 13.1]]], "duration": [0.66, 0.53, 0.74, 0.4, 0.14, 0.72, 0.44, 0.96, 2.05, 1.33, 0.68, 0.79, 0.26, 25.81, 0.75, 1.42, 0.88, 0.64, -0.25, 1.11, 0.61, 0.95, 2.41, 2.95]} \ No newline at end of file diff --git a/annotations_filtered/0p1fLn6_ExE_filtered.json b/annotations_filtered/0p1fLn6_ExE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da3c92c4a14b69bb6640b54e5fe7bed84b7c418c --- /dev/null +++ b/annotations_filtered/0p1fLn6_ExE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.64], [13.0, 18.32], [20.0, 27.3], [29.0, 61.72], [62.0, 62.04], [62.0, 62.07], [62.0, 62.46], [62.0, 63.17], [63.0, 63.21], [63.0, 63.24], [63.0, 63.31], [63.0, 63.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.55, 55.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 43.09], ["mains hum", 22.19], ["music", 11.47]], null, null, null, null, null, null, null, null, null, null], "duration": [1.64, 5.32, 7.3, 32.72, 0.04, 0.07, 0.46, 1.17, 0.21, 0.24, 0.31, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/0p2Oyd040pg_filtered.json b/annotations_filtered/0p2Oyd040pg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27dd3ff9cd348b46dfc97a4cf7c72359cc092e1c --- /dev/null +++ b/annotations_filtered/0p2Oyd040pg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.45], [12.0, 14.71], [15.0, 16.73], [17.0, 17.56], [18.0, 19.63], [22.0, 22.55], [25.0, 26.08], [27.0, 28.05], [30.0, 33.44], [35.0, 43.21], [46.0, 46.33], [50.0, 50.16], [60.0, 62.23], [71.0, 71.2], [73.0, 72.66], [73.0, 73.58], [75.0, 75.27], [77.0, 78.21], [79.0, 88.96], [91.0, 92.75], [94.0, 95.32], [96.0, 97.95], [99.0, 99.55], [101.0, 104.06], [104.0, 104.72], [110.0, 112.83], [116.0, 155.75], [156.0, 158.21], [161.0, 161.81], [163.0, 163.58], [171.0, 193.89], [196.0, 235.75], [238.0, 238.74], [240.0, 255.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 75.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.6, 39.17, 0.0, 0.0, 86.82, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 31.31, 0.0, 98.27, 0.0, 87.92, 0.0, 0.0, 32.0, 0.0, 0.0, 30.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 71.71], ["hum", 4.69], ["sidetone", 3.46]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 17.52], ["speech", 16.22], ["inside, small room", 6.27]], null, null, null, null, null, null, [["noise", 35.34], ["hum", 7.87], ["music", 7.87]], null, null, [["music", 36.42], ["speech", 22.17], ["synthesizer", 6.06]]], "duration": [0.45, 2.71, 1.73, 0.56, 1.63, 0.55, 1.08, 1.05, 3.44, 8.21, 0.33, 0.16, 2.23, 0.2, -0.34, 0.58, 0.27, 1.21, 9.96, 1.75, 1.32, 1.95, 0.55, 3.06, 0.72, 2.83, 39.75, 2.21, 0.81, 0.58, 22.89, 39.75, 0.74, 15.9]} \ No newline at end of file diff --git a/annotations_filtered/0p9Q6tDJJ1w_filtered.json b/annotations_filtered/0p9Q6tDJJ1w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..031ab03aead9de9f30447ad1564c806ab366d6d2 --- /dev/null +++ b/annotations_filtered/0p9Q6tDJJ1w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.77], [9.0, 9.76], [12.0, 13.09], [14.0, 15.77], [18.0, 41.47], [43.0, 42.77], [44.0, 44.37], [48.0, 48.79], [50.0, 51.07], [53.0, 55.54], [57.0, 58.08], [62.0, 62.51], [63.0, 63.48], [66.0, 66.29], [75.0, 77.5], [80.0, 80.2], [83.0, 83.67], [85.0, 90.24], [90.0, 91.18], [94.0, 94.09], [96.0, 96.25], [97.0, 97.97], [100.0, 103.77], [104.0, 106.74], [108.0, 108.85], [113.0, 113.8], [116.0, 117.1], [123.0, 124.53], [126.0, 131.46], [135.0, 136.98], [137.0, 138.77], [139.0, 159.36], [161.0, 161.55], [162.0, 161.89], [164.0, 164.24], [165.0, 165.99]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 42.26, 0.0, 0.0, 0.0, 0.0, 99.36, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 82.61, 0.0, 0.0, 0.0, 0.0, 91.13, 99.21, 0.0, 0.0, 0.0, 0.0, 93.76, 0.0, 0.0, 57.97, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 25.25], ["didgeridoo", 14.19], ["music", 11.99]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.77, 0.76, 1.09, 1.77, 23.47, -0.23, 0.37, 0.79, 1.07, 2.54, 1.08, 0.51, 0.48, 0.29, 2.5, 0.2, 0.67, 5.24, 1.18, 0.09, 0.25, 0.97, 3.77, 2.74, 0.85, 0.8, 1.1, 1.53, 5.46, 1.98, 1.77, 20.36, 0.55, -0.11, 0.24, 0.99]} \ No newline at end of file diff --git a/annotations_filtered/0p9yD4E2hQw_filtered.json b/annotations_filtered/0p9yD4E2hQw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75673ff1e68eee6522239389dec0934242da5d37 --- /dev/null +++ b/annotations_filtered/0p9yD4E2hQw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.92], [10.0, 13.98], [15.0, 22.06], [23.0, 24.09], [26.0, 28.44], [35.0, 35.77], [41.0, 42.2], [45.0, 45.6], [46.0, 46.95], [49.0, 51.85], [53.0, 53.79], [55.0, 56.61], [61.0, 62.88], [66.0, 67.68], [68.0, 73.31], [74.0, 74.71], [75.0, 76.08], [89.0, 91.34], [93.0, 108.24], [109.0, 111.18], [112.0, 115.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 98.73, 0.0, 0.0, 100.0, 100.0, 100.0, 99.96], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.92, 3.98, 7.06, 1.09, 2.44, 0.77, 1.2, 0.6, 0.95, 2.85, 0.79, 1.61, 1.88, 1.68, 5.31, 0.71, 1.08, 2.34, 15.24, 2.18, 3.37]} \ No newline at end of file diff --git a/annotations_filtered/0pRYoClF9w4_filtered.json b/annotations_filtered/0pRYoClF9w4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76cd5153add907b4c55c9108cc0ed55f9510e13b --- /dev/null +++ b/annotations_filtered/0pRYoClF9w4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.11], [9.0, 9.15], [14.0, 15.08], [16.0, 19.9], [27.0, 27.73], [30.0, 31.23], [35.0, 36.26], [40.0, 43.04], [48.0, 56.88], [59.0, 60.93], [64.0, 65.7], [67.0, 68.77], [73.0, 73.74], [78.0, 84.81], [89.0, 90.56], [92.0, 91.99], [92.0, 92.1], [94.0, 116.53], [126.0, 126.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [62.17, 0.0, 0.0, 68.28, 0.0, 0.0, 0.0, 67.25, 91.81, 0.0, 0.0, 0.0, 0.0, 85.72, 0.0, 0.0, 0.0, 50.86, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.11, 0.15, 1.08, 3.9, 0.73, 1.23, 1.26, 3.04, 8.88, 1.93, 1.7, 1.77, 0.74, 6.81, 1.56, -0.01, 0.1, 22.53, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/0pUMzDEV-DE_filtered.json b/annotations_filtered/0pUMzDEV-DE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a1ae652a0eb39afed853e0a19e15bdfc252f086 --- /dev/null +++ b/annotations_filtered/0pUMzDEV-DE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 20.87], [23.0, 22.99], [25.0, 31.46], [32.0, 32.91], [38.0, 42.69], [44.0, 51.87], [53.0, 59.53], [63.0, 83.1], [83.0, 84.25], [87.0, 109.19], [110.0, 118.39]], "keep_status": [true, false, true, false, true, false, false, false, false, true, true], "silence_prob": [29.9, 0.0, 32.38, 0.0, 29.36, 29.54, 29.63, 29.58, 0.0, 29.52, 29.5], "audiomae_on_audioset": [[["music", 51.25], ["throbbing", 8.94], ["hum", 5.97]], null, [["sonar", 22.16], ["rumble", 22.15], ["music", 13.55]], null, [["hum", 30.36], ["mains hum", 21.56], ["throbbing", 12.03]], [["music", 53.81], ["didgeridoo", 10.6], ["throbbing", 9.18]], [["music", 58.99], ["throbbing", 12.65], ["didgeridoo", 6.33]], [["music", 49.89], ["speech", 14.18], ["throbbing", 7.4]], null, [["music", 31.35], ["speech", 20.29], ["hum", 16.42]], [["speech", 36.74], ["hum", 12.46], ["music", 10.54]]], "duration": [4.87, -0.01, 6.46, 0.91, 4.69, 7.87, 6.53, 20.1, 1.25, 22.19, 8.39]} \ No newline at end of file diff --git a/annotations_filtered/0pVwRO2dFVs_filtered.json b/annotations_filtered/0pVwRO2dFVs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df03e9b6c85561eed60b7339ff5c5c89d5c4d89f --- /dev/null +++ b/annotations_filtered/0pVwRO2dFVs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.53], [20.0, 20.04], [23.0, 26.84], [32.0, 38.52], [39.0, 40.61], [42.0, 43.51], [49.0, 49.99], [54.0, 53.99], [55.0, 56.93], [60.0, 60.59], [63.0, 64.22], [66.0, 67.07], [68.0, 73.63], [78.0, 80.35], [83.0, 86.26], [88.0, 89.8], [92.0, 93.06], [94.0, 95.82], [96.0, 97.7], [99.0, 99.0], [101.0, 105.26], [110.0, 110.61], [112.0, 114.4], [118.0, 118.23], [120.0, 122.05], [126.0, 135.72]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, true, false, true, false, false, true], "silence_prob": [0.0, 0.0, 38.95, 34.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.84, 38.56, 41.46, 0.0, 0.0, 0.0, 0.0, 0.0, 33.3, 0.0, 32.71, 0.0, 51.94, 32.4], "audiomae_on_audioset": [null, null, [["speech", 40.22], ["mains hum", 5.88], ["hum", 5.59]], [["speech", 23.68], ["telephone bell ringing", 23.59], ["telephone", 18.68]], null, null, null, null, null, null, null, null, [["hum", 30.98], ["mains hum", 26.62], ["music", 15.17]], [["cacophony", 10.74], ["hum", 8.65], ["whale vocalization", 8.31]], [["creak", 56.35], ["civil defense siren", 5.75], ["hum", 3.28]], null, null, null, null, null, [["music", 41.7], ["theremin", 10.48], ["effects unit", 7.85]], null, [["livestock, farm animals, working animals", 12.19], ["hum", 10.04], ["throbbing", 9.2]], null, null, [["speech", 34.12], ["music", 11.84], ["single-lens reflex camera", 8.23]]], "duration": [1.53, 0.04, 3.84, 6.52, 1.61, 1.51, 0.99, -0.01, 1.93, 0.59, 1.22, 1.07, 5.63, 2.35, 3.26, 1.8, 1.06, 1.82, 1.7, 0.0, 4.26, 0.61, 2.4, 0.23, 2.05, 9.72]} \ No newline at end of file diff --git a/annotations_filtered/0pbdha7w0V0_filtered.json b/annotations_filtered/0pbdha7w0V0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c62df509a0e472002296f6c0887288ce20c6c48 --- /dev/null +++ b/annotations_filtered/0pbdha7w0V0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.8], [10.0, 70.39], [71.0, 71.93], [72.0, 71.96], [72.0, 72.05], [72.0, 104.03]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [-0.2, 60.39, 0.93, -0.04, 0.05, 32.03]} \ No newline at end of file diff --git a/annotations_filtered/0q3BH18BmZI_filtered.json b/annotations_filtered/0q3BH18BmZI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac0643a8979aa1cf55f52cad01fddf1e54f6de3d --- /dev/null +++ b/annotations_filtered/0q3BH18BmZI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.37], [4.0, 7.13], [8.0, 10.02], [14.0, 15.33], [21.0, 21.63], [23.0, 29.39], [33.0, 39.53], [41.0, 41.81], [45.0, 44.73], [48.0, 48.44], [52.0, 52.59], [53.0, 56.89], [60.0, 61.01], [62.0, 65.28], [66.0, 68.05], [71.0, 72.82], [75.0, 82.26], [87.0, 87.29], [91.0, 91.98], [93.0, 93.63], [97.0, 97.5], [99.0, 99.55], [103.0, 104.46], [109.0, 111.81], [116.0, 116.41], [119.0, 118.84], [124.0, 126.57], [128.0, 128.44], [130.0, 130.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 61.87, 80.11, 0.0, 0.0, 78.04, 43.77, 0.0, 0.0, 0.0, 0.0, 48.1, 0.0, 74.44, 89.36, 0.0, 52.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.13, 0.0, 0.0, 90.25, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 63.19], ["throbbing", 5.58], ["hum", 3.57]], null, null, null, null, [["music", 38.81], ["sidetone", 23.58], ["speech", 6.2]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 36.65], ["sidetone", 17.23], ["music", 16.15]], null, null, null, null, null], "duration": [0.37, 3.13, 2.02, 1.33, 0.63, 6.39, 6.53, 0.81, -0.27, 0.44, 0.59, 3.89, 1.01, 3.28, 2.05, 1.82, 7.26, 0.29, 0.98, 0.63, 0.5, 0.55, 1.46, 2.81, 0.41, -0.16, 2.57, 0.44, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/0qWMjgpIECA_filtered.json b/annotations_filtered/0qWMjgpIECA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d8cf62771a9421fa42187f376e026cdeb856e53 --- /dev/null +++ b/annotations_filtered/0qWMjgpIECA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.8], [3.0, 4.36], [7.0, 8.55], [10.0, 10.42], [11.0, 13.1], [20.0, 20.04], [22.0, 22.44], [24.0, 24.65], [29.0, 29.05], [42.0, 42.42], [43.0, 43.66], [45.0, 45.96], [49.0, 49.11], [50.0, 51.26], [62.0, 62.82], [65.0, 66.21], [73.0, 74.58], [75.0, 76.74], [82.0, 82.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 56.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.8, 1.36, 1.55, 0.42, 2.1, 0.04, 0.44, 0.65, 0.05, 0.42, 0.66, 0.96, 0.11, 1.26, 0.82, 1.21, 1.58, 1.74, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/0qeD9nc9nwo_filtered.json b/annotations_filtered/0qeD9nc9nwo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dcd062e68ed54864bee0e096cb3b2e3999c5e976 --- /dev/null +++ b/annotations_filtered/0qeD9nc9nwo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.83], [13.0, 13.54], [34.0, 34.48], [35.0, 35.51], [50.0, 51.48], [57.0, 58.5]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.83, 0.54, 0.48, 0.51, 1.48, 1.5]} \ No newline at end of file diff --git a/annotations_filtered/0qkVyahL10U_filtered.json b/annotations_filtered/0qkVyahL10U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e42a0a98e841e7c0794846b0ef5a84f231666b6 --- /dev/null +++ b/annotations_filtered/0qkVyahL10U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.65], [7.0, 8.68], [16.0, 16.26], [18.0, 18.5], [27.0, 27.7], [46.0, 46.82], [49.0, 50.5], [53.0, 54.99], [59.0, 59.98], [66.0, 66.5], [78.0, 78.75], [83.0, 84.54], [86.0, 87.07], [88.0, 89.11], [90.0, 90.29], [91.0, 92.2], [92.0, 94.12], [104.0, 104.19], [115.0, 115.92], [144.0, 160.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.69, 0.0, 0.0, 74.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.29], ["sine wave", 22.56], ["dial tone", 10.88]], null, null, null], "duration": [0.65, 1.68, 0.26, 0.5, 0.7, 0.82, 1.5, 1.99, 0.98, 0.5, 0.75, 1.54, 1.07, 1.11, 0.29, 1.2, 2.12, 0.19, 0.92, 16.95]} \ No newline at end of file diff --git a/annotations_filtered/0quxzV2i_gQ_filtered.json b/annotations_filtered/0quxzV2i_gQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2db3fbfb80c9d5f68980a7155c5d7446914fe3e --- /dev/null +++ b/annotations_filtered/0quxzV2i_gQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.91], [25.0, 26.0], [33.0, 35.88], [37.0, 38.21], [39.0, 39.36], [44.0, 44.58], [47.0, 47.61], [48.0, 49.03], [50.0, 50.36], [54.0, 54.63], [56.0, 56.88], [58.0, 58.83], [59.0, 59.43], [62.0, 62.18], [66.0, 66.29], [69.0, 70.06], [73.0, 73.38], [78.0, 79.47], [81.0, 82.39], [87.0, 101.92], [105.0, 112.95], [116.0, 117.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 40.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.01, 28.54, 0.0], "audiomae_on_audioset": [null, null, [["hum", 50.72], ["mains hum", 15.49], ["throbbing", 9.27]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 55.07], ["throbbing", 21.17], ["music", 8.92]], [["music", 82.25], ["beatboxing", 2.39], ["synthetic singing", 1.09]], null], "duration": [0.91, 1.0, 2.88, 1.21, 0.36, 0.58, 0.61, 1.03, 0.36, 0.63, 0.88, 0.83, 0.43, 0.18, 0.29, 1.06, 0.38, 1.47, 1.39, 14.92, 7.95, 1.34]} \ No newline at end of file diff --git a/annotations_filtered/0qvpcfYFHcw_filtered.json b/annotations_filtered/0qvpcfYFHcw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04a2af0cc5742ca01ff8c07e30c88c4749dc7de1 --- /dev/null +++ b/annotations_filtered/0qvpcfYFHcw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.92], [2.0, 3.27], [5.0, 10.64], [12.0, 14.45], [15.0, 17.32], [19.0, 20.83], [22.0, 24.98], [28.0, 30.57], [35.0, 36.02], [38.0, 40.88], [43.0, 43.92], [45.0, 49.72], [52.0, 52.42], [54.0, 59.68], [61.0, 64.23], [65.0, 72.81], [73.0, 73.97], [75.0, 75.15], [76.0, 76.72], [89.0, 89.14], [92.0, 92.33], [98.0, 98.69], [106.0, 106.51], [110.0, 111.03], [115.0, 116.87], [118.0, 119.08], [120.0, 124.48], [126.0, 126.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 99.98, 88.1, 0.0, 100.0, 100.0, 0.0, 100.0, 0.0, 99.78, 0.0, 100.0, 100.0, 51.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.36, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.92, 1.27, 5.64, 2.45, 2.32, 1.83, 2.98, 2.57, 1.02, 2.88, 0.92, 4.72, 0.42, 5.68, 3.23, 7.81, 0.97, 0.15, 0.72, 0.14, 0.33, 0.69, 0.51, 1.03, 1.87, 1.08, 4.48, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/0qzRQ3qxv5Y_filtered.json b/annotations_filtered/0qzRQ3qxv5Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61abea0fc1166cff88c756632cc6843419f6d436 --- /dev/null +++ b/annotations_filtered/0qzRQ3qxv5Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.92], [10.0, 20.82], [24.0, 47.87], [50.0, 51.14], [53.0, 53.49], [60.0, 72.39], [74.0, 139.29]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [64.52, 33.6, 37.46, 0.0, 0.0, 50.41, 0.0], "audiomae_on_audioset": [null, [["music", 79.57], ["speech", 3.69], ["boing", 1.73]], [["music", 54.39], ["bird", 4.82], ["bird vocalization, bird call, bird song", 4.52]], null, null, null, null], "duration": [3.92, 10.82, 23.87, 1.14, 0.49, 12.39, 65.29]} \ No newline at end of file diff --git a/annotations_filtered/0rgfZzE6Ulg_filtered.json b/annotations_filtered/0rgfZzE6Ulg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5af4149270b9b2f7ba16dd4675f159127f36ecb --- /dev/null +++ b/annotations_filtered/0rgfZzE6Ulg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.37], [9.0, 9.09], [9.0, 9.19], [11.0, 11.42], [12.0, 15.65], [16.0, 19.23], [20.0, 20.98], [22.0, 22.92], [25.0, 27.04], [28.0, 29.12], [31.0, 32.07], [36.0, 37.3], [39.0, 41.84], [45.0, 46.85], [52.0, 53.18], [57.0, 57.86], [62.0, 63.1], [65.0, 68.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [93.91, 0.0, 0.0, 0.0, 100.0, 77.36, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.37, 0.09, 0.19, 0.42, 3.65, 3.23, 0.98, 0.92, 2.04, 1.12, 1.07, 1.3, 2.84, 1.85, 1.18, 0.86, 1.1, 3.98]} \ No newline at end of file diff --git a/annotations_filtered/0sNSVtTcxpo_filtered.json b/annotations_filtered/0sNSVtTcxpo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ead823575289bc21e55710cc9997d4480c54fbc6 --- /dev/null +++ b/annotations_filtered/0sNSVtTcxpo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.62], [5.0, 6.98], [18.0, 19.09], [20.0, 20.61], [21.0, 23.36], [25.0, 29.78], [32.0, 33.08], [35.0, 36.22], [39.0, 43.06], [46.0, 57.33], [58.0, 66.07], [67.0, 74.49], [78.0, 83.56], [85.0, 89.24], [93.0, 94.39], [98.0, 99.42], [100.0, 101.85], [104.0, 107.18], [110.0, 116.67], [117.0, 118.56], [119.0, 119.74], [122.0, 122.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 76.53, 73.82, 0.0, 0.0, 96.89, 67.76, 72.6, 73.51, 50.06, 42.06, 0.0, 0.0, 0.0, 36.99, 43.23, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 29.91], ["speech", 20.81], ["effects unit", 7.59]], null, null, null, [["music", 45.06], ["theremin", 9.9], ["ambient music", 4.13]], [["music", 33.48], ["speech", 24.59], ["didgeridoo", 11.28]], null, null, null], "duration": [0.62, 1.98, 1.09, 0.61, 2.36, 4.78, 1.08, 1.22, 4.06, 11.33, 8.07, 7.49, 5.56, 4.24, 1.39, 1.42, 1.85, 3.18, 6.67, 1.56, 0.74, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/0sUHxfXKUas_filtered.json b/annotations_filtered/0sUHxfXKUas_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..684b6e136e046a0d0ce618e9179c5b01c7e5a0e5 --- /dev/null +++ b/annotations_filtered/0sUHxfXKUas_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.67], [11.0, 17.31], [18.0, 18.81], [22.0, 25.89], [27.0, 44.78], [46.0, 52.32], [53.0, 55.24], [57.0, 62.73], [63.0, 75.34], [77.0, 77.6], [80.0, 81.55], [86.0, 87.17], [88.0, 89.06], [90.0, 101.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 96.17, 0.0, 98.86, 93.76, 80.64, 98.86, 96.29, 79.24, 0.0, 0.0, 0.0, 0.0, 77.87], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.67, 6.31, 0.81, 3.89, 17.78, 6.32, 2.24, 5.73, 12.34, 0.6, 1.55, 1.17, 1.06, 11.46]} \ No newline at end of file diff --git a/annotations_filtered/0sdIO3lVTWE_filtered.json b/annotations_filtered/0sdIO3lVTWE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09e2131bc18a6fabf28fbd9573f43cc5206e8723 --- /dev/null +++ b/annotations_filtered/0sdIO3lVTWE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 47.09], [60.0, 61.08], [69.0, 73.04], [75.0, 78.93], [81.0, 81.43], [83.0, 87.74], [88.0, 89.21]], "keep_status": [false, false, true, true, false, false, false], "silence_prob": [35.26, 0.0, 35.69, 34.85, 0.0, 37.61, 0.0], "audiomae_on_audioset": [[["hum", 34.39], ["music", 32.84], ["mains hum", 20.6]], null, [["speech", 30.58], ["music", 17.76], ["boing", 15.87]], [["music", 59.52], ["synthesizer", 4.69], ["musical instrument", 3.95]], null, [["noise", 74.39], ["music", 3.49], ["groan", 2.37]], null], "duration": [20.09, 1.08, 4.04, 3.93, 0.43, 4.74, 1.21]} \ No newline at end of file diff --git a/annotations_filtered/0t1xR1LX5Kg_filtered.json b/annotations_filtered/0t1xR1LX5Kg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..099834f18e367bc9f3b1eaff5fcf0f77d3c60fbe --- /dev/null +++ b/annotations_filtered/0t1xR1LX5Kg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 17.47], [20.0, 20.8], [22.0, 32.46], [34.0, 35.4], [37.0, 37.35], [39.0, 43.04], [44.0, 45.1], [49.0, 48.78], [51.0, 55.46], [57.0, 56.93], [58.0, 59.14], [69.0, 69.62], [70.0, 90.49]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [34.31, 0.0, 42.13, 0.0, 0.0, 42.35, 0.0, 0.0, 41.07, 0.0, 0.0, 0.0, 31.08], "audiomae_on_audioset": [[["hum", 30.48], ["throbbing", 20.57], ["music", 14.51]], null, [["music", 67.86], ["musical instrument", 5.17], ["synthesizer", 2.7]], null, null, [["music", 19.76], ["hum", 15.2], ["throbbing", 11.05]], null, null, [["hum", 36.95], ["throbbing", 24.33], ["mains hum", 14.38]], null, null, null, [["music", 48.09], ["didgeridoo", 30.68], ["synthesizer", 4.92]]], "duration": [6.47, 0.8, 10.46, 1.4, 0.35, 4.04, 1.1, -0.22, 4.46, -0.07, 1.14, 0.62, 20.49]} \ No newline at end of file diff --git a/annotations_filtered/0t6IIdmOIOQ_filtered.json b/annotations_filtered/0t6IIdmOIOQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..043e506f6d066e8bfe63609eae563b4c08921f50 --- /dev/null +++ b/annotations_filtered/0t6IIdmOIOQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.4], [12.0, 16.9], [19.0, 20.75], [21.0, 20.82], [21.0, 22.71], [26.0, 27.09], [27.0, 32.0], [34.0, 36.44], [38.0, 39.82], [41.0, 43.02], [44.0, 45.54], [48.0, 48.86], [51.0, 53.86], [55.0, 56.66], [57.0, 57.1], [58.0, 58.94], [60.0, 60.99], [63.0, 64.54], [65.0, 66.87], [68.0, 68.13], [69.0, 70.38], [72.0, 73.03], [74.0, 74.76], [81.0, 82.19], [83.0, 83.24], [84.0, 85.4], [89.0, 91.69], [93.0, 93.18], [95.0, 95.54], [100.0, 104.77], [105.0, 106.59], [108.0, 109.95], [111.0, 114.47], [117.0, 119.3], [121.0, 123.72], [125.0, 127.57], [128.0, 130.87], [131.0, 135.14], [135.0, 141.02], [142.0, 141.94], [143.0, 145.54], [146.0, 150.31], [152.0, 154.77], [156.0, 157.38], [163.0, 164.02], [166.0, 171.07], [172.0, 174.12]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 87.0, 0.0, 0.0, 0.0, 0.0, 51.39, 98.44, 0.0, 43.82, 0.0, 0.0, 42.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.18, 0.0, 0.0, 62.68, 0.0, 0.0, 94.52, 95.51, 99.59, 98.19, 59.59, 91.81, 69.47, 0.0, 90.08, 92.8, 94.81, 0.0, 0.0, 98.66, 43.82], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["fly, housefly", 17.63], ["speech", 16.99], ["mosquito", 13.1]], null, null, [["speech", 59.59], ["insect", 7.37], ["frog", 4.55]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 38.39], ["dial tone", 6.98], ["sidetone", 4.27]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.04], ["sidetone", 8.42], ["livestock, farm animals, working animals", 5.33]]], "duration": [1.4, 4.9, 1.75, -0.18, 1.71, 1.09, 5.0, 2.44, 1.82, 2.02, 1.54, 0.86, 2.86, 1.66, 0.1, 0.94, 0.99, 1.54, 1.87, 0.13, 1.38, 1.03, 0.76, 1.19, 0.24, 1.4, 2.69, 0.18, 0.54, 4.77, 1.59, 1.95, 3.47, 2.3, 2.72, 2.57, 2.87, 4.14, 6.02, -0.06, 2.54, 4.31, 2.77, 1.38, 1.02, 5.07, 2.12]} \ No newline at end of file diff --git a/annotations_filtered/0tN0uV9DebQ_filtered.json b/annotations_filtered/0tN0uV9DebQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d711c323754ff6098b09890944a8e4b2b770d5e --- /dev/null +++ b/annotations_filtered/0tN0uV9DebQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.67], [9.0, 10.94], [12.0, 12.88], [22.0, 22.64], [32.0, 32.86], [37.0, 37.3], [40.0, 41.34], [42.0, 43.09], [46.0, 46.68], [61.0, 62.04], [79.0, 82.0], [83.0, 84.86], [87.0, 93.21], [96.0, 96.04], [101.0, 102.27], [104.0, 105.22], [107.0, 107.96], [110.0, 119.96], [121.0, 123.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.36, 0.0, 30.29, 0.0, 0.0, 0.0, 0.0, 29.63, 32.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 25.77], ["music", 13.99], ["speech", 4.72]], null, [["speech", 55.95], ["sidetone", 4.18], ["music", 4.04]], null, null, null, null, [["music", 24.18], ["grunt", 11.91], ["groan", 9.53]], [["music", 32.16], ["reverberation", 17.02], ["theremin", 4.51]]], "duration": [1.67, 1.94, 0.88, 0.64, 0.86, 0.3, 1.34, 1.09, 0.68, 1.04, 3.0, 1.86, 6.21, 0.04, 1.27, 1.22, 0.96, 9.96, 2.75]} \ No newline at end of file diff --git a/annotations_filtered/0tRSAQUheo0_filtered.json b/annotations_filtered/0tRSAQUheo0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e3aff461cce5f796f230462cfec24bfe4bacff8 --- /dev/null +++ b/annotations_filtered/0tRSAQUheo0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.27], [10.0, 13.61], [14.0, 20.22], [21.0, 26.28], [27.0, 36.68], [37.0, 36.8], [38.0, 39.26], [41.0, 47.55], [48.0, 67.05], [67.0, 78.58], [80.0, 89.92], [91.0, 95.57], [97.0, 103.42], [104.0, 106.71]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.98, 43.56, 58.13, 52.98, 0.0, 0.0, 100.0, 69.88, 99.97, 100.0, 100.0, 100.0, 100.0], "audiomae_on_audioset": [null, [["speech", 63.7], ["crushing", 15.29], ["crackle", 5.45]], [["heart sounds, heartbeat", 25.92], ["speech", 18.23], ["throbbing", 13.13]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.27, 3.61, 6.22, 5.28, 9.68, -0.2, 1.26, 6.55, 19.05, 11.58, 9.92, 4.57, 6.42, 2.71]} \ No newline at end of file diff --git a/annotations_filtered/0tjKGAwyCIY_filtered.json b/annotations_filtered/0tjKGAwyCIY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..621b93f5994b994a3f2b2f9b65be1e1960505e7a --- /dev/null +++ b/annotations_filtered/0tjKGAwyCIY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.56], [7.0, 7.28], [9.0, 8.85], [10.0, 10.12], [14.0, 17.1], [33.0, 34.45], [41.0, 42.16], [51.0, 51.87], [54.0, 54.36], [74.0, 75.84], [78.0, 78.61], [94.0, 95.23], [100.0, 100.11], [102.0, 102.66], [104.0, 106.25], [108.0, 108.82], [116.0, 116.31], [118.0, 119.08], [121.0, 123.3], [124.0, 124.88], [125.0, 126.39], [129.0, 131.52], [134.0, 134.82], [137.0, 137.79], [140.0, 140.05], [143.0, 143.56], [144.0, 148.68]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 36.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.22, 0.0, 0.0, 0.0, 36.8, 0.0, 0.0, 36.83, 0.0, 0.0, 0.0, 0.0, 46.97], "audiomae_on_audioset": [null, null, null, null, [["whale vocalization", 53.6], ["hum", 9.56], ["speech", 4.13]], null, null, null, null, null, null, null, null, null, [["music", 51.79], ["speech", 14.94], ["synthesizer", 2.66]], null, null, null, [["music", 55.28], ["synthesizer", 9.75], ["throbbing", 8.65]], null, null, [["music", 60.42], ["throbbing", 4.63], ["synthesizer", 3.88]], null, null, null, null, [["music", 34.21], ["hum", 7.64], ["synthesizer", 7.46]]], "duration": [0.56, 0.28, -0.15, 0.12, 3.1, 1.45, 1.16, 0.87, 0.36, 1.84, 0.61, 1.23, 0.11, 0.66, 2.25, 0.82, 0.31, 1.08, 2.3, 0.88, 1.39, 2.52, 0.82, 0.79, 0.05, 0.56, 4.68]} \ No newline at end of file diff --git a/annotations_filtered/0tnKF_qcXTo_filtered.json b/annotations_filtered/0tnKF_qcXTo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41f3ebe950caf836be0ba4031a36d6ea5553bd04 --- /dev/null +++ b/annotations_filtered/0tnKF_qcXTo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[60.0, 88.23], [91.0, 126.84], [130.0, 171.29], [174.0, 187.96], [189.0, 189.46], [191.0, 191.81], [195.0, 201.07]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [30.05, 0.0, 0.0, 28.74, 0.0, 0.0, 30.24], "audiomae_on_audioset": [[["music", 39.56], ["throbbing", 30.89], ["hum", 16.81]], null, null, [["music", 71.58], ["throbbing", 5.63], ["speech", 5.42]], null, null, [["music", 33.03], ["throbbing", 11.89], ["hum", 9.66]]], "duration": [28.23, 35.84, 41.29, 13.96, 0.46, 0.81, 6.07]} \ No newline at end of file diff --git a/annotations_filtered/0tq44zxA0Ao_filtered.json b/annotations_filtered/0tq44zxA0Ao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1d7949963934d4dbbe2352191e8e82578f1064d --- /dev/null +++ b/annotations_filtered/0tq44zxA0Ao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.58], [12.0, 13.05], [17.0, 18.12], [22.0, 22.47], [25.0, 25.76], [28.0, 29.2], [30.0, 31.04], [32.0, 33.17], [34.0, 35.85], [39.0, 42.03], [46.0, 46.43], [54.0, 55.31], [57.0, 57.06], [59.0, 62.41], [64.0, 108.73], [116.0, 117.49], [121.0, 124.06], [124.0, 125.51], [127.0, 129.07], [131.0, 132.73], [137.0, 139.87], [143.0, 146.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.79, 0.0, 0.0, 0.0, 79.41, 0.0, 0.0, 51.39, 0.0, 40.79, 0.0, 47.46, 37.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.94], ["speech", 17.71], ["hum", 4.19]], null, [["music", 65.83], ["didgeridoo", 15.44], ["hum", 3.28]], [["music", 41.99], ["speech", 20.45], ["slap, smack", 3.84]]], "duration": [1.58, 1.05, 1.12, 0.47, 0.76, 1.2, 1.04, 1.17, 1.85, 3.03, 0.43, 1.31, 0.06, 3.41, 44.73, 1.49, 3.06, 1.51, 2.07, 1.73, 2.87, 3.18]} \ No newline at end of file diff --git a/annotations_filtered/0tro-o0fOk4_filtered.json b/annotations_filtered/0tro-o0fOk4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac6c9db7d9377fc26ce8d8c2efd1ea3fae1f3323 --- /dev/null +++ b/annotations_filtered/0tro-o0fOk4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 19.97], [22.0, 24.27], [27.0, 27.94], [30.0, 30.32], [33.0, 34.33], [37.0, 37.94], [39.0, 40.07], [41.0, 43.23], [46.0, 47.44], [49.0, 49.65], [51.0, 52.68], [56.0, 57.37], [59.0, 59.81], [60.0, 71.29], [72.0, 77.21], [78.0, 82.65], [85.0, 90.66], [91.0, 92.74], [99.0, 99.62], [101.0, 101.87], [103.0, 106.73], [109.0, 111.99], [113.0, 131.13]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [41.26, 48.23, 0.0, 0.0, 0.0, 0.0, 0.0, 38.03, 0.0, 0.0, 0.0, 0.0, 0.0, 40.93, 39.46, 46.05, 44.6, 0.0, 0.0, 0.0, 36.03, 49.45, 29.95], "audiomae_on_audioset": [[["hum", 19.31], ["walk, footsteps", 16.1], ["music", 13.78]], [["music", 53.13], ["speech", 8.11], ["hum", 7.55]], null, null, null, null, null, [["music", 58.41], ["gong", 10.42], ["synthesizer", 3.19]], null, null, null, null, null, [["music", 69.42], ["speech", 7.34], ["chirp tone", 2.95]], [["music", 46.58], ["speech", 21.5], ["beep, bleep", 4.58]], [["music", 78.64], ["synthesizer", 3.43], ["ambient music", 2.28]], [["music", 72.99], ["speech", 12.18], ["bass guitar", 2.02]], null, null, null, [["music", 68.04], ["guitar", 5.46], ["musical instrument", 4.75]], [["music", 31.07], ["alarm clock", 22.59], ["gong", 10.78]], [["music", 83.66], ["throbbing", 2.47], ["cacophony", 1.59]]], "duration": [10.97, 2.27, 0.94, 0.32, 1.33, 0.94, 1.07, 2.23, 1.44, 0.65, 1.68, 1.37, 0.81, 11.29, 5.21, 4.65, 5.66, 1.74, 0.62, 0.87, 3.73, 2.99, 18.13]} \ No newline at end of file diff --git a/annotations_filtered/0u0SEECyGlM_filtered.json b/annotations_filtered/0u0SEECyGlM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a884838768b806cbf7ae135ba97f72de853022e --- /dev/null +++ b/annotations_filtered/0u0SEECyGlM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 56.54], [61.0, 86.36], [88.0, 89.8]], "keep_status": [true, true, false], "silence_prob": [36.12, 36.52, 0.0], "audiomae_on_audioset": [[["hum", 23.53], ["mains hum", 13.22], ["music", 11.77]], [["music", 25.25], ["cacophony", 15.4], ["buzz", 7.09]], null], "duration": [27.54, 25.36, 1.8]} \ No newline at end of file diff --git a/annotations_filtered/0u5O2--9www_filtered.json b/annotations_filtered/0u5O2--9www_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58bd6ef33720aa7c1b90c06aa60e8494997d5f6c --- /dev/null +++ b/annotations_filtered/0u5O2--9www_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.52], [4.0, 4.94], [5.0, 5.81], [9.0, 9.04], [10.0, 10.88], [13.0, 13.91], [17.0, 17.78], [22.0, 22.84], [25.0, 26.0], [27.0, 27.92], [28.0, 28.98], [29.0, 29.57], [32.0, 48.3], [60.0, 60.12], [63.0, 70.06], [71.0, 71.98], [73.0, 73.6], [74.0, 74.51], [77.0, 77.09], [92.0, 94.36], [96.0, 96.53], [99.0, 99.55], [100.0, 100.82], [104.0, 105.06], [109.0, 111.03], [113.0, 113.17], [116.0, 116.26], [118.0, 119.13], [126.0, 126.52], [130.0, 138.33], [141.0, 142.2], [144.0, 145.18], [148.0, 149.47], [149.0, 149.5], [150.0, 150.74], [158.0, 159.9]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [43.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.99, 0.0, 43.71, 0.0, 0.0, 0.0, 0.0, 90.95, 0.0, 0.0, 0.0, 0.0, 43.66, 0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 40.97], ["radio", 9.84], ["fly, housefly", 2.6]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.49], ["music", 27.77], ["hubbub, speech noise, speech babble", 2.44]], null, [["glass", 42.4], ["speech", 29.48], ["smash, crash", 4.46]], null, null, null, null, null, null, null, null, null, [["speech", 54.24], ["dial tone", 5.12], ["sidetone", 4.78]], null, null, null, null, null, null, null, null, null, null, null], "duration": [2.52, 0.94, 0.81, 0.04, 0.88, 0.91, 0.78, 0.84, 1.0, 0.92, 0.98, 0.57, 16.3, 0.12, 7.06, 0.98, 0.6, 0.51, 0.09, 2.36, 0.53, 0.55, 0.82, 1.06, 2.03, 0.17, 0.26, 1.13, 0.52, 8.33, 1.2, 1.18, 1.47, 0.5, 0.74, 1.9]} \ No newline at end of file diff --git a/annotations_filtered/0uSOiu_WUDw_filtered.json b/annotations_filtered/0uSOiu_WUDw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e19f87e7a9f88174a56702bcbf11e0412a42ccd9 --- /dev/null +++ b/annotations_filtered/0uSOiu_WUDw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.72], [13.0, 14.79], [15.0, 26.27], [28.0, 33.45], [34.0, 40.8], [42.0, 43.43], [45.0, 47.21], [51.0, 51.06], [58.0, 59.14], [64.0, 64.18], [65.0, 68.79], [76.0, 76.11], [80.0, 85.83], [87.0, 89.45], [92.0, 92.18], [93.0, 93.72], [95.0, 96.58], [97.0, 99.13], [106.0, 106.57], [108.0, 108.75], [111.0, 112.99], [116.0, 116.16]], "keep_status": [false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 29.21, 28.67, 32.6, 0.0, 54.97, 0.0, 0.0, 0.0, 29.68, 0.0, 31.79, 50.11, 0.0, 0.0, 0.0, 37.77, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["electric shaver, electric razor", 24.68], ["music", 19.49], ["speech", 9.48]], [["speech", 33.65], ["hum", 9.69], ["thump, thud", 6.68]], [["speech", 43.35], ["sidetone", 12.59], ["music", 6.54]], null, null, null, null, null, [["speech", 63.87], ["boing", 7.24], ["snicker", 3.91]], null, [["speech", 71.63], ["music", 8.12], ["speech synthesizer", 4.75]], null, null, null, null, [["music", 42.28], ["speech", 21.88], ["whale vocalization", 2.86]], null, null, null, null], "duration": [-0.28, 1.79, 11.27, 5.45, 6.8, 1.43, 2.21, 0.06, 1.14, 0.18, 3.79, 0.11, 5.83, 2.45, 0.18, 0.72, 1.58, 2.13, 0.57, 0.75, 1.99, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/0uyVs4iKp_E_filtered.json b/annotations_filtered/0uyVs4iKp_E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2dab0425dfb968ffe53698346f645361952bbc35 --- /dev/null +++ b/annotations_filtered/0uyVs4iKp_E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 69.74], [71.0, 71.91], [73.0, 77.8], [80.0, 82.05], [83.0, 84.94], [85.0, 86.09], [87.0, 88.91], [90.0, 106.08], [107.0, 201.95], [204.0, 220.68], [221.0, 225.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.85, 98.44, 0.0, 0.0, 0.0, 66.63, 0.0, 78.89, 74.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [63.74, 0.91, 4.8, 2.05, 1.94, 1.09, 1.91, 16.08, 94.95, 16.68, 4.96]} \ No newline at end of file diff --git a/annotations_filtered/0v74ANWBqv0_filtered.json b/annotations_filtered/0v74ANWBqv0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d29c31140087a91651e075d8e27bbba94b3a7a2 --- /dev/null +++ b/annotations_filtered/0v74ANWBqv0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.49], [17.0, 18.67], [21.0, 21.88], [25.0, 49.54], [50.0, 50.14], [50.0, 50.43], [52.0, 52.29], [53.0, 58.55], [59.0, 60.18], [65.0, 65.43], [68.0, 69.06], [72.0, 81.18], [82.0, 89.51], [90.0, 102.47], [104.0, 113.81], [115.0, 116.73], [118.0, 145.52], [149.0, 151.26], [152.0, 157.22], [159.0, 162.57], [164.0, 164.0], [164.0, 195.32], [196.0, 196.4]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, true, true, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 29.62, 0.0, 0.0, 0.0, 49.45, 0.0, 0.0, 0.0, 42.26, 45.43, 31.1, 28.53, 0.0, 28.15, 28.44, 28.55, 29.35, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 56.59], ["throbbing", 22.15], ["hum", 10.52]], null, null, null, [["hum", 29.58], ["mains hum", 27.09], ["music", 11.23]], null, null, null, [["music", 29.6], ["hum", 22.46], ["mains hum", 10.37]], [["music", 42.72], ["hum", 15.82], ["mains hum", 11.56]], [["music", 76.18], ["ambient music", 4.78], ["synthesizer", 3.53]], [["music", 75.01], ["rumble", 6.31], ["mains hum", 2.82]], null, [["hum", 45.87], ["music", 13.24], ["throbbing", 6.86]], [["sound effect", 10.6], ["music", 8.93], ["speech", 7.01]], [["music", 25.58], ["mains hum", 21.21], ["hum", 14.7]], [["throbbing", 26.43], ["hum", 24.62], ["music", 13.78]], null, null, null], "duration": [1.49, 1.67, 0.88, 24.54, 0.14, 0.43, 0.29, 5.55, 1.18, 0.43, 1.06, 9.18, 7.51, 12.47, 9.81, 1.73, 27.52, 2.26, 5.22, 3.57, 0.0, 31.32, 0.4]} \ No newline at end of file diff --git a/annotations_filtered/0v7Ea7kg2gA_filtered.json b/annotations_filtered/0v7Ea7kg2gA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cfad29851873804732bd8b6816c5aab420d0e8a3 --- /dev/null +++ b/annotations_filtered/0v7Ea7kg2gA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.09], [25.0, 25.42], [28.0, 28.88], [30.0, 30.87], [31.0, 31.89], [36.0, 39.36], [46.0, 46.03], [48.0, 47.78], [54.0, 54.53], [56.0, 56.19], [69.0, 69.28], [71.0, 71.79], [74.0, 74.19], [75.0, 75.93], [77.0, 77.77], [82.0, 85.87], [87.0, 99.35], [100.0, 100.72], [104.0, 114.67], [116.0, 117.39], [126.0, 127.14]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 38.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.15, 33.84, 0.0, 36.98, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["ping", 43.07], ["hum", 7.85], ["speech", 7.53]], null, null, null, null, null, null, null, null, null, [["explosion", 23.48], ["speech", 9.11], ["eruption", 7.06]], [["speech", 58.45], ["sidetone", 7.75], ["noise", 6.97]], null, [["bouncing", 63.39], ["music", 6.88], ["speech", 4.41]], null, null], "duration": [0.09, 0.42, 0.88, 0.87, 0.89, 3.36, 0.03, -0.22, 0.53, 0.19, 0.28, 0.79, 0.19, 0.93, 0.77, 3.87, 12.35, 0.72, 10.67, 1.39, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/0vOulnDhH8A_filtered.json b/annotations_filtered/0vOulnDhH8A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..157f01400c736e15000eaded3589bd5ef2fb0167 --- /dev/null +++ b/annotations_filtered/0vOulnDhH8A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.02], [2.0, 3.35], [4.0, 8.61], [16.0, 15.96], [16.0, 21.47], [24.0, 24.56], [27.0, 28.9], [31.0, 30.87], [36.0, 36.59], [39.0, 39.65], [40.0, 41.05], [43.0, 44.44], [48.0, 64.3], [64.0, 77.48], [78.0, 79.98], [80.0, 118.45], [119.0, 120.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 32.85, 0.0, 36.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.91, 36.46, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["theremin", 44.31], ["music", 32.2], ["speech", 10.01]], null, [["theremin", 58.47], ["music", 23.47], ["musical instrument", 4.6]], null, null, null, null, null, null, null, [["vehicle", 22.23], ["white noise", 9.51], ["car", 8.48]], [["speech", 39.63], ["cattle, bovinae", 11.61], ["moo", 9.28]], null, null, null], "duration": [1.02, 1.35, 4.61, -0.04, 5.47, 0.56, 1.9, -0.13, 0.59, 0.65, 1.05, 1.44, 16.3, 13.48, 1.98, 38.45, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/0vVy9NBehoc_filtered.json b/annotations_filtered/0vVy9NBehoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..763d07aacdbc0a4b47fc21a288c6b8ab2db30f59 --- /dev/null +++ b/annotations_filtered/0vVy9NBehoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.9], [13.0, 13.07], [17.0, 21.66], [25.0, 32.19], [38.0, 38.85], [41.0, 50.94], [55.0, 54.78], [64.0, 64.37], [75.0, 76.59], [78.0, 78.81], [80.0, 81.03], [88.0, 95.66]], "keep_status": [false, false, true, true, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 39.38, 41.42, 0.0, 36.46, 0.0, 0.0, 0.0, 0.0, 0.0, 35.33], "audiomae_on_audioset": [null, null, [["throbbing", 20.04], ["hum", 18.33], ["music", 16.52]], [["music", 31.25], ["livestock, farm animals, working animals", 23.88], ["cattle, bovinae", 5.34]], null, [["music", 57.15], ["speech", 5.53], ["shofar", 3.85]], null, null, null, null, null, [["music", 18.63], ["speech", 14.32], ["fly, housefly", 6.77]]], "duration": [0.9, 0.07, 4.66, 7.19, 0.85, 9.94, -0.22, 0.37, 1.59, 0.81, 1.03, 7.66]} \ No newline at end of file diff --git a/annotations_filtered/0vcXvLUt1E4_filtered.json b/annotations_filtered/0vcXvLUt1E4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc8b2ea9dd4755c3f9e9a98ac5e40eb75f1c84f4 --- /dev/null +++ b/annotations_filtered/0vcXvLUt1E4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.73], [8.0, 9.64]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.73, 1.64]} \ No newline at end of file diff --git a/annotations_filtered/0vlBQqEc5YA_filtered.json b/annotations_filtered/0vlBQqEc5YA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fccb1cfe557e63f060f5e7bdc0dad186b7868474 --- /dev/null +++ b/annotations_filtered/0vlBQqEc5YA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.02], [3.0, 3.23], [14.0, 15.63], [17.0, 17.69], [18.0, 19.68], [21.0, 22.5], [23.0, 28.81], [31.0, 31.55], [34.0, 33.96], [35.0, 35.88], [37.0, 42.04], [43.0, 45.22], [49.0, 51.83], [54.0, 84.35], [85.0, 89.73], [94.0, 98.29], [99.0, 108.13], [109.0, 126.13]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, true, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.37, 0.0, 0.0, 0.0, 38.71, 42.74, 60.05, 0.0, 34.36, 34.98, 38.09, 31.65], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 36.18], ["theremin", 11.72], ["hum", 10.35]], null, null, null, [["music", 25.84], ["hum", 23.62], ["speech", 18.27]], [["speech", 24.72], ["hum", 19.36], ["music", 18.13]], null, null, [["music", 39.13], ["hum", 20.93], ["mains hum", 12.65]], [["music", 28.25], ["theremin", 15.5], ["speech", 11.23]], [["music", 23.16], ["speech", 22.16], ["whale vocalization", 17.06]], [["music", 35.43], ["hum", 19.58], ["speech", 11.88]]], "duration": [1.02, 0.23, 1.63, 0.69, 1.68, 1.5, 5.81, 0.55, -0.04, 0.88, 5.04, 2.22, 2.83, 30.35, 4.73, 4.29, 9.13, 17.13]} \ No newline at end of file diff --git a/annotations_filtered/0vtLA9LFkSs_filtered.json b/annotations_filtered/0vtLA9LFkSs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53e74be31065c0a482ebaf2b67f4ce54b82f33a7 --- /dev/null +++ b/annotations_filtered/0vtLA9LFkSs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 51.63], [53.0, 71.83], [73.0, 73.85], [75.0, 96.21], [97.0, 108.82]], "keep_status": [false, true, false, true, false], "silence_prob": [0.0, 29.36, 0.0, 29.1, 29.75], "audiomae_on_audioset": [null, [["speech", 27.96], ["music", 9.17], ["hum", 9.08]], null, [["music", 48.88], ["speech", 14.54], ["whack, thwack", 4.53]], [["speech", 50.33], ["music", 17.08], ["whack, thwack", 6.71]]], "duration": [46.63, 18.83, 0.85, 21.21, 11.82]} \ No newline at end of file diff --git a/annotations_filtered/0w8oeXvLXOw_filtered.json b/annotations_filtered/0w8oeXvLXOw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91c6b19c9353c13cbcb81d8ea93f3efc0815008b --- /dev/null +++ b/annotations_filtered/0w8oeXvLXOw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 19.31], [23.0, 37.44], [42.0, 42.55], [44.0, 58.06], [60.0, 60.05], [60.0, 60.08], [60.0, 60.12], [60.0, 76.05], [77.0, 77.75], [78.0, 105.26], [107.0, 106.96], [109.0, 138.4], [140.0, 153.05], [155.0, 155.63], [156.0, 156.56]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [29.86, 29.4, 0.0, 28.73, 0.0, 0.0, 0.0, 29.12, 0.0, 28.68, 0.0, 28.58, 29.56, 0.0, 0.0], "audiomae_on_audioset": [[["throbbing", 52.0], ["music", 29.69], ["hum", 9.24]], [["throbbing", 28.73], ["hum", 17.56], ["music", 17.52]], null, [["hum", 51.28], ["mains hum", 29.45], ["music", 10.42]], null, null, null, [["hum", 57.55], ["throbbing", 22.29], ["mains hum", 17.84]], null, [["music", 38.9], ["throbbing", 17.56], ["hum", 8.82]], null, [["music", 40.68], ["throbbing", 24.72], ["hum", 13.63]], [["throbbing", 48.65], ["hum", 26.97], ["music", 9.69]], null, null], "duration": [9.31, 14.44, 0.55, 14.06, 0.05, 0.08, 0.12, 16.05, 0.75, 27.26, -0.04, 29.4, 13.05, 0.63, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/0wAtjDAyv4M_filtered.json b/annotations_filtered/0wAtjDAyv4M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0991f8abad27e41077af8e535cc9441c10c2c348 --- /dev/null +++ b/annotations_filtered/0wAtjDAyv4M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.34], [19.0, 20.56], [24.0, 45.98], [47.0, 62.83], [64.0, 67.34], [80.0, 82.32], [101.0, 103.55], [106.0, 106.95], [109.0, 110.39], [112.0, 113.0], [114.0, 114.61], [116.0, 117.64], [119.0, 120.31], [121.0, 123.47], [126.0, 126.76], [130.0, 130.44]], "keep_status": [false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 42.79, 50.26, 39.72, 45.98, 94.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.16, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["fart", 33.62], ["speech", 23.72], ["whack, thwack", 4.63]], null, [["speech", 59.35], ["fly, housefly", 5.11], ["radio", 3.81]], [["speech", 35.68], ["radio", 23.06], ["fly, housefly", 11.18]], null, null, null, null, null, null, null, null, null, null], "duration": [1.34, 1.56, 21.98, 15.83, 3.34, 2.32, 2.55, 0.95, 1.39, 1.0, 0.61, 1.64, 1.31, 2.47, 0.76, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/0wC8Ab5AZeE_filtered.json b/annotations_filtered/0wC8Ab5AZeE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bb536319dc2779a67c0dd66d58b48639e33f251 --- /dev/null +++ b/annotations_filtered/0wC8Ab5AZeE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.45], [13.0, 13.64], [16.0, 17.32], [20.0, 21.3], [24.0, 25.93], [31.0, 31.6], [40.0, 40.64], [42.0, 42.69], [43.0, 44.61], [47.0, 47.9], [55.0, 56.42], [63.0, 64.49], [67.0, 68.77], [70.0, 73.18], [75.0, 75.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.73, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 0.64, 1.32, 1.3, 1.93, 0.6, 0.64, 0.69, 1.61, 0.9, 1.42, 1.49, 1.77, 3.18, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/0wFkRRILnPo_filtered.json b/annotations_filtered/0wFkRRILnPo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b7dd19b00d91db92976b93b9de7b3b915c691a5 --- /dev/null +++ b/annotations_filtered/0wFkRRILnPo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.33], [6.0, 6.56], [8.0, 9.31], [10.0, 10.34], [12.0, 12.16], [14.0, 16.63], [17.0, 18.28], [20.0, 19.89], [21.0, 21.3], [22.0, 22.79], [25.0, 27.18], [31.0, 33.93], [36.0, 36.31], [37.0, 37.37], [38.0, 38.79], [40.0, 41.27], [42.0, 43.39], [44.0, 45.81], [46.0, 47.7], [49.0, 56.96], [58.0, 81.04], [83.0, 83.56], [85.0, 86.44], [88.0, 89.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 70.3, 0.0, 0.0, 0.0, 0.0, 58.13, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.0, 93.29, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.33, 0.56, 1.31, 0.34, 0.16, 2.63, 1.28, -0.11, 0.3, 0.79, 2.18, 2.93, 0.31, 0.37, 0.79, 1.27, 1.39, 1.81, 1.7, 7.96, 23.04, 0.56, 1.44, 1.09]} \ No newline at end of file diff --git a/annotations_filtered/0wMU9XDIm4g_filtered.json b/annotations_filtered/0wMU9XDIm4g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8c06ed0bc7a624a78c0a3223fba660d8e55ead9 --- /dev/null +++ b/annotations_filtered/0wMU9XDIm4g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 18.5], [30.0, 30.55], [34.0, 41.94], [44.0, 55.83], [60.0, 70.88], [72.0, 73.95], [76.0, 84.97], [88.0, 89.82], [93.0, 101.55], [102.0, 103.17], [104.0, 109.98]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [32.51, 0.0, 29.16, 30.47, 30.12, 0.0, 49.22, 0.0, 54.97, 0.0, 62.58], "audiomae_on_audioset": [[["music", 61.65], ["synthesizer", 7.02], ["hum", 5.96]], null, [["music", 19.03], ["throbbing", 16.11], ["hum", 15.57]], [["music", 30.74], ["hum", 27.15], ["throbbing", 18.15]], [["music", 71.52], ["theremin", 11.21], ["musical instrument", 5.1]], null, [["music", 59.75], ["theremin", 9.83], ["synthesizer", 5.27]], null, null, null, null], "duration": [10.5, 0.55, 7.94, 11.83, 10.88, 1.95, 8.97, 1.82, 8.55, 1.17, 5.98]} \ No newline at end of file diff --git a/annotations_filtered/0wTKzzRtGqY_filtered.json b/annotations_filtered/0wTKzzRtGqY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a55e8b10af1d6fe54ab1e04abc0171ab5b335e4 --- /dev/null +++ b/annotations_filtered/0wTKzzRtGqY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.62], [17.0, 29.46], [36.0, 38.26], [39.0, 40.37], [41.0, 45.0], [47.0, 47.92], [50.0, 50.53], [52.0, 52.25], [55.0, 55.66], [57.0, 57.89], [60.0, 60.29], [61.0, 61.92], [64.0, 63.91], [66.0, 66.83], [78.0, 78.0], [81.0, 80.99], [82.0, 83.93], [87.0, 90.48], [91.0, 91.84], [93.0, 93.34], [95.0, 95.76], [97.0, 98.25], [99.0, 99.98], [101.0, 101.9], [105.0, 110.93], [112.0, 112.87], [116.0, 115.74], [122.0, 122.13], [125.0, 125.68], [126.0, 127.55], [129.0, 130.92], [133.0, 133.44], [135.0, 135.5], [138.0, 137.79], [140.0, 142.5], [144.0, 144.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.56, 86.82, 0.0, 99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.67, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.21], ["insect", 13.62], ["fly, housefly", 7.51]], null, null, null, null, null, null, null, null, null, [["sidetone", 40.87], ["speech", 23.08], ["hum", 9.68]], null], "duration": [0.62, 12.46, 2.26, 1.37, 4.0, 0.92, 0.53, 0.25, 0.66, 0.89, 0.29, 0.92, -0.09, 0.83, 0.0, -0.01, 1.93, 3.48, 0.84, 0.34, 0.76, 1.25, 0.98, 0.9, 5.93, 0.87, -0.26, 0.13, 0.68, 1.55, 1.92, 0.44, 0.5, -0.21, 2.5, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/0wVgg5t2LAM_filtered.json b/annotations_filtered/0wVgg5t2LAM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e70301acc71070e3a558e9173eae3a8e449b68fd --- /dev/null +++ b/annotations_filtered/0wVgg5t2LAM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.12], [5.0, 5.95], [7.0, 10.72], [19.0, 18.91], [24.0, 24.97], [26.0, 27.46], [28.0, 28.46], [29.0, 30.06], [36.0, 36.71], [44.0, 44.49], [55.0, 57.4], [58.0, 60.62], [62.0, 63.0], [75.0, 81.99]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 31.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.62, 78.38, 0.0, 72.75], "audiomae_on_audioset": [null, null, [["fart", 42.77], ["speech", 12.5], ["whack, thwack", 7.88]], null, null, null, null, null, null, null, [["speech", 37.0], ["fly, housefly", 16.16], ["insect", 14.33]], null, null, null], "duration": [0.12, 0.95, 3.72, -0.09, 0.97, 1.46, 0.46, 1.06, 0.71, 0.49, 2.4, 2.62, 1.0, 6.99]} \ No newline at end of file diff --git a/annotations_filtered/0wngG1BlZNI_filtered.json b/annotations_filtered/0wngG1BlZNI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f79f845d7b86527159ef25715b2d04cd12bb6ae6 --- /dev/null +++ b/annotations_filtered/0wngG1BlZNI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.02], [9.0, 11.37], [12.0, 12.68], [13.0, 13.42], [14.0, 14.96], [16.0, 17.24], [20.0, 19.74], [21.0, 21.19], [24.0, 27.92], [29.0, 29.54], [30.0, 30.81], [38.0, 40.04], [51.0, 52.05], [56.0, 55.88], [58.0, 58.46], [62.0, 63.59], [66.0, 66.46], [68.0, 68.01], [76.0, 76.38], [81.0, 80.84], [83.0, 84.86], [86.0, 89.48], [94.0, 95.37], [100.0, 101.44], [112.0, 112.18], [112.0, 112.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.99, 0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.02, 2.37, 0.68, 0.42, 0.96, 1.24, -0.26, 0.19, 3.92, 0.54, 0.81, 2.04, 1.05, -0.12, 0.46, 1.59, 0.46, 0.01, 0.38, -0.16, 1.86, 3.48, 1.37, 1.44, 0.18, 0.68]} \ No newline at end of file diff --git a/annotations_filtered/0x05PrIasjk_filtered.json b/annotations_filtered/0x05PrIasjk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ed15e2082c8f2ea1e6e1eee7a45d624e16ac048 --- /dev/null +++ b/annotations_filtered/0x05PrIasjk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 34.96], [35.0, 90.0], [93.0, 95.71], [96.0, 98.63]], "keep_status": [false, false, true, false], "silence_prob": [0.0, 0.0, 30.38, 34.26], "audiomae_on_audioset": [null, null, [["music", 58.07], ["hum", 4.07], ["musical instrument", 3.21]], [["hum", 28.53], ["mains hum", 23.59], ["music", 19.73]]], "duration": [1.96, 55.0, 2.71, 2.63]} \ No newline at end of file diff --git a/annotations_filtered/0x6usdVsGbI_filtered.json b/annotations_filtered/0x6usdVsGbI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10b5d2910f986a42e3bc6886182e019ee8b150e6 --- /dev/null +++ b/annotations_filtered/0x6usdVsGbI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 30.0], [35.0, 48.51], [53.0, 52.95], [64.0, 64.4], [75.0, 78.14], [85.0, 86.19]], "keep_status": [true, false, false, false, true, false], "silence_prob": [38.74, 31.88, 0.0, 0.0, 37.27, 0.0], "audiomae_on_audioset": [[["sonar", 18.36], ["tick", 9.86], ["hum", 8.32]], [["speech", 71.44], ["hum", 6.85], ["mains hum", 4.57]], null, null, [["speech", 62.78], ["music", 4.77], ["sidetone", 2.11]], null], "duration": [24.0, 13.51, -0.05, 0.4, 3.14, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/0xHe1zkABYo_filtered.json b/annotations_filtered/0xHe1zkABYo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e8d33f60be399cf1d5bb769860c483e82c972db --- /dev/null +++ b/annotations_filtered/0xHe1zkABYo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 25.79], [34.0, 34.7], [36.0, 38.16], [39.0, 40.53], [44.0, 60.66], [62.0, 63.09], [64.0, 65.45], [67.0, 67.42], [70.0, 72.33], [74.0, 75.27], [77.0, 77.94], [80.0, 80.18], [83.0, 85.36], [88.0, 92.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.8, 0.0, 99.97, 0.0, 40.4, 0.0, 0.0, 0.0, 99.05, 0.0, 0.0, 0.0, 97.73, 81.35], "audiomae_on_audioset": [null, null, null, null, [["mains hum", 36.83], ["hum", 29.55], ["buzz", 7.93]], null, null, null, null, null, null, null, null, null], "duration": [18.79, 0.7, 2.16, 1.53, 16.66, 1.09, 1.45, 0.42, 2.33, 1.27, 0.94, 0.18, 2.36, 4.94]} \ No newline at end of file diff --git a/annotations_filtered/0xJcu3vc9tI_filtered.json b/annotations_filtered/0xJcu3vc9tI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..683cf0d6c7f02017b45af4b0df0d6c5fa59016c9 --- /dev/null +++ b/annotations_filtered/0xJcu3vc9tI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 47.68], [50.0, 51.58], [53.0, 54.04], [55.0, 56.32], [58.0, 59.7], [62.0, 62.78], [64.0, 65.92], [68.0, 69.4], [71.0, 72.15], [74.0, 74.68], [75.0, 76.65], [79.0, 80.15], [81.0, 82.11], [84.0, 84.59], [87.0, 93.06], [95.0, 103.1], [105.0, 107.52], [109.0, 111.59], [114.0, 115.3], [117.0, 138.52], [140.0, 141.67], [143.0, 146.15], [148.0, 148.46], [153.0, 158.28], [159.0, 161.03], [162.0, 163.86], [165.0, 165.01], [168.0, 169.7], [171.0, 173.74], [175.0, 176.77], [178.0, 179.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 76.86, 100.0, 100.0, 0.0, 34.69, 0.0, 54.7, 0.0, 64.52, 73.06, 0.0, 0.0, 0.0, 64.75, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 18.65], ["hum", 16.18], ["mains hum", 12.25]], null, null, null, null, null, null, null, null, null, null, null], "duration": [34.68, 1.58, 1.04, 1.32, 1.7, 0.78, 1.92, 1.4, 1.15, 0.68, 1.65, 1.15, 1.11, 0.59, 6.06, 8.1, 2.52, 2.59, 1.3, 21.52, 1.67, 3.15, 0.46, 5.28, 2.03, 1.86, 0.01, 1.7, 2.74, 1.77, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/0xSSnfRYBQY_filtered.json b/annotations_filtered/0xSSnfRYBQY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1611ed721edf2ad5afe21a9e1d5285d7ab62c1c4 --- /dev/null +++ b/annotations_filtered/0xSSnfRYBQY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 29.57], [30.0, 33.52], [34.0, 36.86], [37.0, 38.84], [39.0, 41.32], [42.0, 45.86], [47.0, 50.65], [51.0, 53.59]], "keep_status": [true, false, false, false, true, false, false, false], "silence_prob": [29.73, 30.05, 30.11, 0.0, 30.15, 30.15, 30.19, 30.29], "audiomae_on_audioset": [[["hum", 32.01], ["music", 21.09], ["throbbing", 16.49]], [["throbbing", 43.13], ["music", 29.5], ["hum", 8.59]], [["throbbing", 28.1], ["music", 25.03], ["hum", 18.3]], null, [["music", 40.23], ["throbbing", 15.06], ["speech", 11.03]], [["music", 33.76], ["throbbing", 28.29], ["hum", 16.14]], [["music", 54.02], ["throbbing", 16.54], ["hum", 8.92]], [["music", 56.71], ["electronic music", 9.4], ["throbbing", 8.99]]], "duration": [6.57, 3.52, 2.86, 1.84, 2.32, 3.86, 3.65, 2.59]} \ No newline at end of file diff --git a/annotations_filtered/0xWMqsZOYWg_filtered.json b/annotations_filtered/0xWMqsZOYWg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..608920b4a0441a91c586801c10fe0fd5aa86f051 --- /dev/null +++ b/annotations_filtered/0xWMqsZOYWg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 26.22], [27.0, 41.99], [51.0, 62.19], [69.0, 74.71], [79.0, 81.55], [82.0, 84.13], [85.0, 87.37], [90.0, 96.06], [101.0, 102.46], [106.0, 105.9], [106.0, 108.84], [113.0, 114.15], [115.0, 125.09]], "keep_status": [true, true, false, false, true, true, true, true, false, false, true, false, true], "silence_prob": [36.53, 34.07, 34.37, 32.56, 42.02, 31.14, 31.35, 32.08, 0.0, 0.0, 35.68, 0.0, 30.14], "audiomae_on_audioset": [[["thunk", 37.97], ["hum", 12.16], ["mains hum", 6.41]], [["music", 37.85], ["animal", 23.4], ["dog", 7.34]], [["music", 62.38], ["didgeridoo", 9.01], ["musical instrument", 4.67]], [["speech", 49.11], ["music", 30.79], ["theremin", 4.58]], [["music", 32.55], ["civil defense siren", 14.08], ["hum", 5.78]], [["music", 45.86], ["speech", 15.05], ["didgeridoo", 4.28]], [["music", 41.76], ["musical instrument", 9.16], ["guitar", 7.31]], [["music", 35.15], ["trombone", 14.7], ["speech", 13.64]], null, null, [["music", 42.55], ["synthesizer", 9.53], ["didgeridoo", 6.67]], null, [["music", 27.28], ["noise", 15.33], ["didgeridoo", 11.58]]], "duration": [2.22, 14.99, 11.19, 5.71, 2.55, 2.13, 2.37, 6.06, 1.46, -0.1, 2.84, 1.15, 10.09]} \ No newline at end of file diff --git a/annotations_filtered/0xjYQiEDbj4_filtered.json b/annotations_filtered/0xjYQiEDbj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b6f1fd77abb759670f88a4c5ea1c064214151e1 --- /dev/null +++ b/annotations_filtered/0xjYQiEDbj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.77], [5.0, 5.58], [11.0, 11.7], [14.0, 17.64], [19.0, 21.02], [25.0, 25.19], [29.0, 29.79], [32.0, 32.66], [37.0, 41.72], [45.0, 52.14], [53.0, 55.49], [59.0, 61.4], [62.0, 63.93], [66.0, 67.39], [68.0, 70.5], [72.0, 73.13], [74.0, 76.27], [78.0, 77.99], [78.0, 79.12], [83.0, 111.75], [115.0, 115.99], [118.0, 120.88], [122.0, 121.98], [122.0, 122.01], [122.0, 126.12], [134.0, 145.61], [147.0, 150.87], [153.0, 162.41], [163.0, 164.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.82, 98.19, 0.0, 0.0, 0.0, 53.91, 100.0, 100.0, 100.0, 0.0, 0.0, 100.0, 0.0, 98.93, 0.0, 0.0, 72.6, 0.0, 99.99, 0.0, 0.0, 85.35, 99.99, 100.0, 94.22, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.77, 0.58, 0.7, 3.64, 2.02, 0.19, 0.79, 0.66, 4.72, 7.14, 2.49, 2.4, 1.93, 1.39, 2.5, 1.13, 2.27, -0.01, 1.12, 28.75, 0.99, 2.88, -0.02, 0.01, 4.12, 11.61, 3.87, 9.41, 1.37]} \ No newline at end of file diff --git a/annotations_filtered/0y5KiKKCD7A_filtered.json b/annotations_filtered/0y5KiKKCD7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56d3fd684c38a8bd97b5b83a240d54ed5009fa07 --- /dev/null +++ b/annotations_filtered/0y5KiKKCD7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 26.03], [27.0, 27.72], [29.0, 31.18], [35.0, 40.02], [40.0, 41.82], [45.0, 57.32], [59.0, 61.67], [65.0, 68.61], [74.0, 77.23], [78.0, 80.86], [83.0, 192.23]], "keep_status": [false, false, true, true, false, false, true, false, false, false, false], "silence_prob": [28.26, 0.0, 37.25, 29.02, 0.0, 29.2, 41.28, 39.43, 28.98, 28.44, 0.0], "audiomae_on_audioset": [[["throbbing", 33.6], ["hum", 30.16], ["music", 14.97]], null, [["music", 28.3], ["hum", 11.45], ["speech", 10.69]], [["hum", 25.87], ["music", 25.56], ["throbbing", 17.19]], null, [["speech", 56.47], ["music", 22.01], ["electronic music", 4.01]], [["music", 42.44], ["synthesizer", 6.41], ["didgeridoo", 5.59]], [["music", 40.83], ["theremin", 27.66], ["didgeridoo", 5.23]], [["music", 56.52], ["scary music", 10.33], ["throbbing", 5.91]], [["speech", 36.79], ["gong", 28.61], ["music", 5.53]], null], "duration": [8.03, 0.72, 2.18, 5.02, 1.82, 12.32, 2.67, 3.61, 3.23, 2.86, 109.23]} \ No newline at end of file diff --git a/annotations_filtered/0yAYgv2YQ5k_filtered.json b/annotations_filtered/0yAYgv2YQ5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..171a1f228d613569e66d58f743f8ba924811988d --- /dev/null +++ b/annotations_filtered/0yAYgv2YQ5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.24], [23.0, 24.43], [27.0, 29.22], [31.0, 48.98], [52.0, 64.07]], "keep_status": [false, false, true, true, true], "silence_prob": [0.0, 0.0, 29.91, 29.0, 28.63], "audiomae_on_audioset": [null, null, [["groan", 17.06], ["sound effect", 14.33], ["whack, thwack", 12.03]], [["screaming", 27.82], ["music", 22.22], ["speech", 5.78]], [["speech", 36.78], ["whack, thwack", 18.17], ["thunk", 6.8]]], "duration": [0.24, 1.43, 2.22, 17.98, 12.07]} \ No newline at end of file diff --git a/annotations_filtered/0yDzNGZc9DI_filtered.json b/annotations_filtered/0yDzNGZc9DI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4810f0d32864746a95e76e4ecb08ef269c258d41 --- /dev/null +++ b/annotations_filtered/0yDzNGZc9DI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.64], [11.0, 52.69], [57.0, 63.07], [66.0, 107.27], [110.0, 121.1]], "keep_status": [false, false, false, false, true], "silence_prob": [0.0, 0.0, 36.86, 0.0, 35.38], "audiomae_on_audioset": [null, null, [["speech", 47.72], ["music", 39.94], ["whale vocalization", 2.75]], null, [["whale vocalization", 14.98], ["noise", 11.62], ["livestock, farm animals, working animals", 10.98]]], "duration": [-0.36, 41.69, 6.07, 41.27, 11.1]} \ No newline at end of file diff --git a/annotations_filtered/0yOwWkbamyM_filtered.json b/annotations_filtered/0yOwWkbamyM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e59bbbd9e83205038b33e21b7b7c5a84d5126ab5 --- /dev/null +++ b/annotations_filtered/0yOwWkbamyM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 40.71], [41.0, 40.9], [41.0, 41.0], [41.0, 41.45], [47.0, 46.68], [48.0, 48.39], [87.0, 93.8], [96.0, 101.93], [103.0, 124.01], [133.0, 133.05], [162.0, 165.55], [169.0, 175.46], [175.0, 175.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.53, 30.84, 30.7, 0.0, 31.16, 36.35, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 87.17], ["didgeridoo", 3.04], ["electronic music", 1.32]], [["music", 84.87], ["musical instrument", 3.49], ["didgeridoo", 2.15]], [["music", 92.19], ["drum machine", 2.97], ["electronic music", 1.59]], null, [["music", 53.67], ["didgeridoo", 10.43], ["speech", 7.08]], [["music", 58.97], ["speech", 7.89], ["sidetone", 7.86]], null], "duration": [33.71, -0.1, 0.0, 0.45, -0.32, 0.39, 6.8, 5.93, 21.01, 0.05, 3.55, 6.46, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/0yYUlLFlw1I_filtered.json b/annotations_filtered/0yYUlLFlw1I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d6a6f20a524c0b96764078dda02a6928dc25e23 --- /dev/null +++ b/annotations_filtered/0yYUlLFlw1I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 14.1], [15.0, 16.56], [18.0, 22.01], [22.0, 24.73], [25.0, 26.64], [28.0, 30.72], [34.0, 37.05], [67.0, 66.9], [84.0, 86.88], [87.0, 94.88], [100.0, 103.27], [107.0, 108.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.99, 0.0, 99.59, 89.36, 0.0, 54.97, 94.95, 0.0, 100.0, 58.3, 98.93, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.1, 1.56, 4.01, 2.73, 1.64, 2.72, 3.05, -0.1, 2.88, 7.88, 3.27, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/0yc0knpkAxw_filtered.json b/annotations_filtered/0yc0knpkAxw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77f9cfec97ae4082002ce50717cfc7fc259ec0d4 --- /dev/null +++ b/annotations_filtered/0yc0knpkAxw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.65], [1.0, 3.32], [4.0, 34.32], [37.0, 38.53], [41.0, 42.09], [44.0, 44.76], [50.0, 82.31], [83.0, 84.84], [88.0, 102.34], [103.0, 102.59], [103.0, 108.45], [114.0, 115.86], [117.0, 119.47], [123.0, 124.38]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.82, 0.0, 54.76, 0.0, 90.95, 0.0], "audiomae_on_audioset": [null, [["frog", 22.25], ["mosquito", 10.65], ["music", 10.34]], null, null, null, null, null, null, [["speech", 58.19], ["music", 14.15], ["hum", 6.7]], null, null, null, null, null], "duration": [0.65, 2.32, 30.32, 1.53, 1.09, 0.76, 32.31, 1.84, 14.34, -0.41, 5.45, 1.86, 2.47, 1.38]} \ No newline at end of file diff --git a/annotations_filtered/0yngsYrBCLg_filtered.json b/annotations_filtered/0yngsYrBCLg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99140df6fd7aada5cb6d14b3c6599210235ba977 --- /dev/null +++ b/annotations_filtered/0yngsYrBCLg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.32], [15.0, 15.42], [17.0, 18.52], [52.0, 51.76], [53.0, 53.87], [58.0, 58.01], [61.0, 61.28], [61.0, 61.33]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.32, 0.42, 1.52, -0.24, 0.87, 0.01, 0.28, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/0z-FtAMg6Vw_filtered.json b/annotations_filtered/0z-FtAMg6Vw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a314a004e271c3a8c869a55342ea9ec2774d8762 --- /dev/null +++ b/annotations_filtered/0z-FtAMg6Vw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.43], [6.0, 7.01], [9.0, 9.73], [18.0, 18.64], [19.0, 20.24], [22.0, 23.85], [24.0, 33.17], [38.0, 47.9]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.41, 36.54], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 58.6], ["musical instrument", 10.5], ["echo", 5.22]], [["music", 36.3], ["noise", 21.02], ["effects unit", 13.63]]], "duration": [1.43, 1.01, 0.73, 0.64, 1.24, 1.85, 9.17, 9.9]} \ No newline at end of file diff --git a/annotations_filtered/0z9b9_n8-Ek_filtered.json b/annotations_filtered/0z9b9_n8-Ek_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..286c7414fbd92970550111f566a0df38a73b1467 --- /dev/null +++ b/annotations_filtered/0z9b9_n8-Ek_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 50.58], [51.0, 59.14], [60.0, 65.79], [66.0, 68.66], [69.0, 74.63], [75.0, 84.21], [85.0, 86.1], [88.0, 89.97], [92.0, 105.24], [107.0, 113.31], [114.0, 121.32], [122.0, 133.44], [136.0, 136.85]], "keep_status": [false, true, true, false, false, true, false, false, true, false, true, true, false], "silence_prob": [45.46, 40.12, 46.12, 56.25, 56.25, 43.53, 0.0, 0.0, 42.53, 52.27, 34.37, 30.0, 0.0], "audiomae_on_audioset": [[["insect", 45.18], ["fly, housefly", 30.16], ["bee, wasp, etc.", 17.48]], [["speech", 28.43], ["hum", 11.0], ["noise", 7.7]], [["sidetone", 19.39], ["noise", 12.21], ["whale vocalization", 9.51]], null, null, [["fly, housefly", 34.05], ["insect", 16.29], ["bee, wasp, etc.", 14.61]], null, null, [["hum", 36.93], ["animal", 25.32], ["mains hum", 5.61]], null, [["hum", 23.38], ["bee, wasp, etc.", 16.86], ["speech", 7.31]], [["speech", 40.55], ["hum", 12.49], ["mains hum", 11.38]], null], "duration": [2.58, 8.14, 5.79, 2.66, 5.63, 9.21, 1.1, 1.97, 13.24, 6.31, 7.32, 11.44, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/0zHERbRFxTU_filtered.json b/annotations_filtered/0zHERbRFxTU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a79c027c08e424d8aa1ed67c79cc56c9fb355b3c --- /dev/null +++ b/annotations_filtered/0zHERbRFxTU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.57], [31.0, 31.94], [35.0, 35.11], [36.0, 41.17], [42.0, 42.79], [45.0, 49.47], [52.0, 54.04], [57.0, 62.97], [63.0, 63.81], [64.0, 64.25], [66.0, 71.15], [77.0, 77.41], [85.0, 85.77], [88.0, 88.5], [89.0, 88.75], [94.0, 97.73], [106.0, 106.96], [111.0, 112.83], [115.0, 126.89], [127.0, 129.17], [139.0, 140.98], [144.0, 147.6]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.95, 0.0, 32.18, 35.68, 42.22, 0.0, 0.0, 51.71, 0.0, 0.0, 0.0, 0.0, 34.6, 0.0, 0.0, 36.54, 38.86, 0.0, 31.86], "audiomae_on_audioset": [null, null, null, [["music", 53.84], ["speech", 23.22], ["boing", 5.3]], null, [["cattle, bovinae", 22.1], ["livestock, farm animals, working animals", 18.73], ["moo", 16.35]], [["music", 44.2], ["musical instrument", 10.56], ["guitar", 8.43]], [["speech", 80.27], ["animal", 2.6], ["outside, rural or natural", 1.95]], null, null, null, null, null, null, null, [["music", 49.68], ["speech", 18.33], ["boing", 7.06]], null, null, [["whale vocalization", 77.72], ["music", 11.8], ["animal", 2.35]], [["music", 66.31], ["musical instrument", 4.98], ["guitar", 4.25]], null, [["whale vocalization", 89.01], ["speech", 2.66], ["animal", 1.04]]], "duration": [1.57, 0.94, 0.11, 5.17, 0.79, 4.47, 2.04, 5.97, 0.81, 0.25, 5.15, 0.41, 0.77, 0.5, -0.25, 3.73, 0.96, 1.83, 11.89, 2.17, 1.98, 3.6]} \ No newline at end of file diff --git a/annotations_filtered/0zHmeTeLgMY_filtered.json b/annotations_filtered/0zHmeTeLgMY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a3584fd7c802e95f27eefd5d7c47dcb6ebf6164 --- /dev/null +++ b/annotations_filtered/0zHmeTeLgMY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.41], [21.0, 122.52], [126.0, 128.71], [140.0, 141.3], [148.0, 150.82], [166.0, 167.7], [168.0, 173.01], [174.0, 177.69]], "keep_status": [false, false, true, false, true, false, false, false], "silence_prob": [100.0, 0.0, 41.36, 0.0, 36.2, 0.0, 70.72, 59.51], "audiomae_on_audioset": [null, null, [["music", 29.58], ["theremin", 7.04], ["hum", 3.79]], null, [["music", 42.64], ["didgeridoo", 20.12], ["speech", 6.59]], null, null, null], "duration": [6.41, 101.52, 2.71, 1.3, 2.82, 1.7, 5.01, 3.69]} \ No newline at end of file diff --git a/annotations_filtered/0zImze5PCFg_filtered.json b/annotations_filtered/0zImze5PCFg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d51c9a9256e21cb019a47cb2bdc872c2acec641 --- /dev/null +++ b/annotations_filtered/0zImze5PCFg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.06], [12.0, 12.45], [20.0, 20.66], [24.0, 26.77], [27.0, 27.46], [29.0, 29.3], [33.0, 33.0], [36.0, 36.73], [38.0, 38.25], [39.0, 39.83], [46.0, 46.63], [49.0, 48.91], [58.0, 58.24], [59.0, 66.39], [70.0, 69.74], [78.0, 78.36], [81.0, 81.26], [82.0, 83.84], [86.0, 88.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 87.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 0.0, 0.0, 87.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.06, 0.45, 0.66, 2.77, 0.46, 0.3, 0.0, 0.73, 0.25, 0.83, 0.63, -0.09, 0.24, 7.39, -0.26, 0.36, 0.26, 1.84, 2.2]} \ No newline at end of file diff --git a/annotations_filtered/0zJpr-bB1sg_filtered.json b/annotations_filtered/0zJpr-bB1sg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7395eb6752608ac29475ca8843b220de64e71c71 --- /dev/null +++ b/annotations_filtered/0zJpr-bB1sg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.39], [12.0, 21.93], [22.0, 37.08], [39.0, 40.47], [43.0, 59.81], [69.0, 79.84], [82.0, 81.95], [83.0, 118.32], [121.0, 122.76], [129.0, 129.73], [134.0, 150.74], [152.0, 174.78]], "keep_status": [false, false, true, false, false, true, false, false, false, false, true, true], "silence_prob": [38.47, 32.64, 33.84, 0.0, 36.95, 32.16, 0.0, 0.0, 0.0, 0.0, 30.97, 30.94], "audiomae_on_audioset": [[["speech", 39.38], ["music", 36.84], ["musical instrument", 3.36]], [["speech", 64.31], ["music", 17.92], ["sidetone", 2.66]], [["music", 41.75], ["hum", 11.33], ["didgeridoo", 7.21]], null, [["music", 26.52], ["throbbing", 24.52], ["hum", 22.1]], [["music", 17.49], ["vehicle", 9.99], ["car", 5.42]], null, null, null, null, [["music", 44.8], ["speech", 10.72], ["mains hum", 7.13]], [["explosion", 29.22], ["music", 11.78], ["hum", 9.42]]], "duration": [5.39, 9.93, 15.08, 1.47, 16.81, 10.84, -0.05, 35.32, 1.76, 0.73, 16.74, 22.78]} \ No newline at end of file diff --git a/annotations_filtered/0zLL_XdqxmQ_filtered.json b/annotations_filtered/0zLL_XdqxmQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95f7c07436906c064410b998b5c06b30a09ba54e --- /dev/null +++ b/annotations_filtered/0zLL_XdqxmQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 15.55], [17.0, 25.22], [26.0, 27.41], [29.0, 29.62], [31.0, 33.13], [34.0, 37.57], [39.0, 42.5], [46.0, 47.02], [50.0, 49.84], [52.0, 52.32], [54.0, 53.89], [58.0, 60.12], [61.0, 62.18], [62.0, 63.44], [66.0, 68.55], [71.0, 72.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [73.82, 63.53, 0.0, 0.0, 65.55, 68.28, 71.57, 0.0, 0.0, 0.0, 0.0, 70.02, 0.0, 0.0, 59.07, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [12.55, 8.22, 1.41, 0.62, 2.13, 3.57, 3.5, 1.02, -0.16, 0.32, -0.11, 2.12, 1.18, 1.44, 2.55, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/0zQAUQGwv4A_filtered.json b/annotations_filtered/0zQAUQGwv4A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..227910dbb97dc1fa9895db66fd4d37388b7a76af --- /dev/null +++ b/annotations_filtered/0zQAUQGwv4A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.16], [5.0, 6.02], [6.0, 6.69], [12.0, 13.86], [15.0, 16.83], [18.0, 21.88], [23.0, 23.77], [25.0, 26.4], [27.0, 30.91], [32.0, 32.93], [41.0, 42.63], [43.0, 44.73], [46.0, 46.5], [47.0, 48.86], [50.0, 50.08], [51.0, 51.12], [57.0, 57.67], [58.0, 58.95], [60.0, 60.74], [61.0, 61.75], [62.0, 64.61], [70.0, 70.02], [70.0, 73.77], [75.0, 75.07], [79.0, 80.84], [82.0, 86.07], [90.0, 92.89], [96.0, 100.16], [102.0, 108.58], [112.0, 113.09], [114.0, 114.51], [119.0, 119.94], [121.0, 121.9], [124.0, 124.61], [127.0, 127.67], [130.0, 129.86], [134.0, 135.78], [136.0, 137.89], [138.0, 140.75], [141.0, 154.26], [155.0, 165.74], [167.0, 168.17], [169.0, 175.02], [176.0, 178.75]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [59.51, 0.0, 0.0, 0.0, 0.0, 45.59, 0.0, 0.0, 29.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.38, 0.0, 55.31, 0.0, 0.0, 37.96, 36.47, 32.42, 32.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.08, 42.91, 32.03, 0.0, 47.31, 34.28], "audiomae_on_audioset": [null, null, null, null, null, [["music", 49.26], ["theremin", 22.9], ["wind instrument, woodwind instrument", 3.48]], null, null, [["music", 18.93], ["foghorn", 11.94], ["gong", 9.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 45.88], ["mains hum", 15.01], ["music", 13.17]], [["music", 47.61], ["synthesizer", 8.35], ["hum", 4.93]], [["music", 57.66], ["cowbell", 3.58], ["cacophony", 3.22]], [["music", 83.22], ["synthesizer", 6.52], ["electronic music", 2.43]], null, null, null, null, null, null, null, null, null, null, [["music", 46.34], ["theremin", 29.66], ["whale vocalization", 2.17]], [["theremin", 71.7], ["music", 23.88], ["musical instrument", 1.72]], null, [["music", 42.52], ["theremin", 11.02], ["flute", 5.06]], [["trombone", 28.63], ["music", 23.37], ["brass instrument", 21.01]]], "duration": [2.16, 1.02, 0.69, 1.86, 1.83, 3.88, 0.77, 1.4, 3.91, 0.93, 1.63, 1.73, 0.5, 1.86, 0.08, 0.12, 0.67, 0.95, 0.74, 0.75, 2.61, 0.02, 3.77, 0.07, 1.84, 4.07, 2.89, 4.16, 6.58, 1.09, 0.51, 0.94, 0.9, 0.61, 0.67, -0.14, 1.78, 1.89, 2.75, 13.26, 10.74, 1.17, 6.02, 2.75]} \ No newline at end of file diff --git a/annotations_filtered/0zROMB5cxBA_filtered.json b/annotations_filtered/0zROMB5cxBA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41170e25cd8ea0c174326a646498a768ae176e7f --- /dev/null +++ b/annotations_filtered/0zROMB5cxBA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.77], [14.0, 14.67], [20.0, 21.61], [23.0, 23.72], [25.0, 25.54], [26.0, 26.42], [28.0, 27.85], [29.0, 28.88], [29.0, 30.11], [31.0, 31.99], [33.0, 33.45], [37.0, 37.56], [40.0, 39.65], [41.0, 42.48], [43.0, 43.56], [44.0, 44.1], [45.0, 45.23], [46.0, 45.96], [46.0, 46.45], [47.0, 49.64], [50.0, 51.06], [52.0, 52.34], [54.0, 54.75], [55.0, 55.7], [59.0, 59.76], [61.0, 61.52], [63.0, 62.88], [66.0, 66.97], [68.0, 68.52], [70.0, 70.77], [76.0, 76.5], [81.0, 81.6], [83.0, 84.03], [90.0, 89.77], [91.0, 91.29], [94.0, 95.52], [100.0, 100.48], [110.0, 112.01], [113.0, 114.29], [116.0, 119.55], [121.0, 121.46], [123.0, 123.67], [125.0, 125.91], [126.0, 126.77], [129.0, 131.11], [133.0, 132.95], [133.0, 137.4], [139.0, 143.01], [145.0, 150.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.09, 0.0, 62.37, 0.0, 0.0, 0.0, 0.0, 92.31, 0.0, 99.26, 84.98, 98.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.77, 0.67, 1.61, 0.72, 0.54, 0.42, -0.15, -0.12, 1.11, 0.99, 0.45, 0.56, -0.35, 1.48, 0.56, 0.1, 0.23, -0.04, 0.45, 2.64, 1.06, 0.34, 0.75, 0.7, 0.76, 0.52, -0.12, 0.97, 0.52, 0.77, 0.5, 0.6, 1.03, -0.23, 0.29, 1.52, 0.48, 2.01, 1.29, 3.55, 0.46, 0.67, 0.91, 0.77, 2.11, -0.05, 4.4, 4.01, 5.96]} \ No newline at end of file diff --git a/annotations_filtered/0zgTcrZ5030_filtered.json b/annotations_filtered/0zgTcrZ5030_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4bf6d1fe8f9d801a2838063ee1e7e94c12f5e19 --- /dev/null +++ b/annotations_filtered/0zgTcrZ5030_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.67], [19.0, 19.23], [23.0, 24.31], [25.0, 26.62], [39.0, 39.09], [41.0, 41.71], [42.0, 42.92], [43.0, 44.04], [45.0, 46.65], [49.0, 49.59], [63.0, 67.37], [68.0, 69.4], [70.0, 71.12], [72.0, 75.93], [77.0, 77.87], [83.0, 83.34], [84.0, 85.29], [88.0, 88.23], [90.0, 90.51], [92.0, 92.4], [93.0, 93.28], [95.0, 95.61], [98.0, 99.57], [107.0, 107.18], [113.0, 113.05], [118.0, 118.2], [119.0, 119.23], [120.0, 122.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.92, 0.0, 0.0, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.67, 0.23, 1.31, 1.62, 0.09, 0.71, 0.92, 1.04, 1.65, 0.59, 4.37, 1.4, 1.12, 3.93, 0.87, 0.34, 1.29, 0.23, 0.51, 0.4, 0.28, 0.61, 1.57, 0.18, 0.05, 0.2, 0.23, 2.91]} \ No newline at end of file diff --git a/annotations_filtered/0zhatVdxShE_filtered.json b/annotations_filtered/0zhatVdxShE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6c27ed36f3e9c32f27265baa593c3c49753230a --- /dev/null +++ b/annotations_filtered/0zhatVdxShE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.29], [6.0, 6.08], [27.0, 28.48], [36.0, 38.15], [41.0, 41.66], [48.0, 47.98], [51.0, 52.83], [53.0, 73.67], [74.0, 74.76], [75.0, 76.92], [80.0, 83.17], [84.0, 84.48], [85.0, 87.13], [90.0, 90.42], [95.0, 95.59], [97.0, 101.22], [102.0, 103.79], [107.0, 108.13], [110.0, 120.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0, 91.13, 0.0, 0.0, 81.35, 0.0, 97.64, 0.0, 0.0, 89.72, 0.0, 0.0, 73.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.29, 0.08, 1.48, 2.15, 0.66, -0.02, 1.83, 20.67, 0.76, 1.92, 3.17, 0.48, 2.13, 0.42, 0.59, 4.22, 1.79, 1.13, 10.68]} \ No newline at end of file diff --git a/annotations_filtered/0zsUFpPjt8g_filtered.json b/annotations_filtered/0zsUFpPjt8g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70698f2df0d1ef0133a30887aaae3d4be1e9258c --- /dev/null +++ b/annotations_filtered/0zsUFpPjt8g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.19], [15.0, 15.92], [19.0, 19.75], [20.0, 21.68], [23.0, 24.07], [25.0, 30.11], [32.0, 33.51], [34.0, 35.45], [36.0, 36.91], [39.0, 40.19], [41.0, 41.5], [42.0, 43.11], [51.0, 51.02], [55.0, 56.17], [58.0, 62.51], [63.0, 64.22], [64.0, 67.9], [84.0, 85.92], [86.0, 87.13], [90.0, 93.82], [96.0, 96.08], [97.0, 97.21], [99.0, 102.29], [117.0, 122.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [40.61, 0.0, 0.0, 0.0, 0.0, 50.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.33, 0.0, 50.11, 0.0, 0.0, 65.67, 0.0, 0.0, 45.52, 38.51], "audiomae_on_audioset": [[["music", 35.11], ["throbbing", 20.5], ["speech", 17.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 20.36], ["music", 14.08], ["speech", 9.02]], [["hum", 31.93], ["mains hum", 23.0], ["music", 10.99]]], "duration": [3.19, 0.92, 0.75, 1.68, 1.07, 5.11, 1.51, 1.45, 0.91, 1.19, 0.5, 1.11, 0.02, 1.17, 4.51, 1.22, 3.9, 1.92, 1.13, 3.82, 0.08, 0.21, 3.29, 5.67]} \ No newline at end of file diff --git a/annotations_filtered/0zuW4KMG7XQ_filtered.json b/annotations_filtered/0zuW4KMG7XQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f27d3d14eb16485ad3b0b57bd53c072f84635301 --- /dev/null +++ b/annotations_filtered/0zuW4KMG7XQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.91], [8.0, 10.77], [11.0, 12.5], [13.0, 13.17], [14.0, 15.94], [17.0, 16.9], [25.0, 25.84], [28.0, 28.26], [29.0, 30.86], [40.0, 41.84], [47.0, 48.49], [50.0, 50.33], [51.0, 51.44], [59.0, 59.26], [63.0, 63.69], [67.0, 67.27], [72.0, 72.99], [74.0, 76.37], [78.0, 79.91], [81.0, 82.31], [83.0, 83.79], [95.0, 95.45], [124.0, 125.58], [132.0, 141.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 35.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.27, 0.0, 0.0, 0.0, 0.0, 0.0, 39.61], "audiomae_on_audioset": [null, [["music", 62.81], ["throbbing", 5.69], ["video game music", 4.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 16.96], ["groan", 14.17], ["wail, moan", 10.68]]], "duration": [-0.09, 2.77, 1.5, 0.17, 1.94, -0.1, 0.84, 0.26, 1.86, 1.84, 1.49, 0.33, 0.44, 0.26, 0.69, 0.27, 0.99, 2.37, 1.91, 1.31, 0.79, 0.45, 1.58, 9.08]} \ No newline at end of file